@@ -75,11 +75,11 @@ class PassConfig:
75
75
don't all have access to full configuration - that would create a cycle as
76
76
the `PassManager` is set as a property of config."""
77
77
78
- enable_fusion : bool = field (default_factory = lambda : not envs .VLLM_USE_V1 )
78
+ enable_fusion : bool = field (default_factory = lambda : envs .VLLM_USE_V1 )
79
79
"""Whether to enable the custom fusion (RMSNorm/SiluMul+quant) pass."""
80
80
enable_attn_fusion : bool = False
81
81
"""Whether to enable the custom attention+quant fusion pass."""
82
- enable_noop : bool = field (default_factory = lambda : not envs .VLLM_USE_V1 )
82
+ enable_noop : bool = field (default_factory = lambda : envs .VLLM_USE_V1 )
83
83
"""Whether to enable the custom no-op elimination pass."""
84
84
enable_sequence_parallelism : bool = False
85
85
"""Whether to enable sequence parallelism."""
@@ -223,7 +223,7 @@ class CompilationConfig:
223
223
constructor, e.g. `CompilationConfig(inductor_passes={"a": func})`."""
224
224
225
225
# CudaGraph compilation
226
- cudagraph_mode : Optional [CUDAGraphMode ] = None
226
+ cudagraph_mode : Optional [CUDAGraphMode ] = CUDAGraphMode . FULL
227
227
"""
228
228
The mode of the cudagraph:
229
229
@@ -408,6 +408,16 @@ def __post_init__(self) -> None:
408
408
count_all = self .custom_ops .count ("all" )
409
409
assert count_none + count_all <= 1 , "Can only specify 'none' or 'all'"
410
410
411
+ if "+rms_norm" not in self .custom_ops and \
412
+ "-rms_norm" not in self .custom_ops :
413
+ self .custom_ops .append ("+rms_norm" )
414
+ if "+silu_and_mul" not in self .custom_ops and \
415
+ "-silu_and_mul" not in self .custom_ops :
416
+ self .custom_ops .append ("+silu_and_mul" )
417
+ if "+quant_fp8" not in self .custom_ops and \
418
+ "-quant_fp8" not in self .custom_ops :
419
+ self .custom_ops .append ("+quant_fp8" )
420
+
411
421
# TODO(zou3519/luka): There are 2 issues with auto-functionalization V2:
412
422
# 1. A bug in PyTorch, fixed in 2.7:
413
423
# https://github.com/pytorch/pytorch/issues/147924
0 commit comments