Remove backend="inductor" from the local flex_attention torch.compile patch

This commit is contained in:
Sunny Liu
2025-04-07 17:05:08 -04:00
parent 4e8677027a
commit 421e0ee499

View File

@@ -40,7 +40,6 @@ def patch_flex_wrapper():
if not self._is_flex_compiled:
self._compiled_flex_attention = torch.compile(
flex_attention,
backend="inductor",
mode="max-autotune-no-cudagraphs",
fullgraph=True,
)