We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 55cd9df, commit bfe0b20 (Copy full SHA for bfe0b20)
vllm/config/compilation.py
@@ -77,7 +77,7 @@ class PassConfig:
77
78
enable_fusion: bool = field(default_factory=lambda: envs.VLLM_USE_V1)
79
"""Whether to enable the custom fusion (RMSNorm/SiluMul+quant) pass."""
80
- enable_attn_fusion: bool = False
+ enable_attn_fusion: bool = field(default_factory=lambda: envs.VLLM_USE_V1)
81
"""Whether to enable the custom attention+quant fusion pass."""
82
enable_noop: bool = field(default_factory=lambda: envs.VLLM_USE_V1)
83
"""Whether to enable the custom no-op elimination pass."""
0 commit comments