Skip to content

Commit bfe0b20

Browse files
committed
Set enable_attn_fusion=True by default now that attention fusion is fixed
1 parent 55cd9df commit bfe0b20

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

vllm/config/compilation.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -77,7 +77,7 @@ class PassConfig:
 77     enable_fusion: bool = field(default_factory=lambda: envs.VLLM_USE_V1)
 78     """Whether to enable the custom fusion (RMSNorm/SiluMul+quant) pass."""
 80 -   enable_attn_fusion: bool = False
 80 +   enable_attn_fusion: bool = field(default_factory=lambda: envs.VLLM_USE_V1)
 81     """Whether to enable the custom attention+quant fusion pass."""
 82     enable_noop: bool = field(default_factory=lambda: envs.VLLM_USE_V1)
 83     """Whether to enable the custom no-op elimination pass."""

0 commit comments

Comments
 (0)