File tree Expand file tree Collapse file tree 1 file changed +9
-1
lines changed Expand file tree Collapse file tree 1 file changed +9
-1
lines changed Original file line number Diff line number Diff line change @@ -3711,7 +3711,15 @@ def __post_init__(self):
3711
3711
"Compilation level should be CompilationLevel.PIECEWISE " \
3712
3712
"when cudagraph_mode piecewise cudagraphs is used, " \
3713
3713
f"cudagraph_mode={ self .compilation_config .cudagraph_mode } "
3714
-
3714
+
3715
+ if self .parallel_config .enable_microbatching :
3716
+ a2a_backend = envs .VLLM_ALL2ALL_BACKEND
3717
+ assert a2a_backend == "deepep_low_latency" , \
3718
+ "Microbatching currently only supports the deepep_low_latency " \
3719
+ f"all2all backend. { a2a_backend } is not supported. To fix set " \
3720
+ "the VLLM_ALL2ALL_BACKEND environment variable to " \
3721
+ "deepep_low_latency and install the DeepEP kernels."
3722
+
3715
3723
if not self .instance_id :
3716
3724
self .instance_id = random_uuid ()[:5 ]
3717
3725
You can’t perform that action at this time.
0 commit comments