Skip to content

Commit be263f7

Browse files
[BugFix] Fix AssertionError: DCP not support reorder_batch_threshold > 1 now. (#28751)
Signed-off-by: Lucas Wilkinson <[email protected]>
1 parent 2bb4435 commit be263f7

File tree

1 file changed

+0
-10
lines changed

1 file changed

+0
-10
lines changed

vllm/v1/worker/gpu_model_runner.py

Lines changed: 0 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -630,16 +630,6 @@ def _may_reorder_batch(self, scheduler_output: "SchedulerOutput") -> None:
630 630
return
631 631

632 632
if self.reorder_batch_threshold is not None:
633-
# NOTE(lucas): currently no backend supports the custom masking
634-
# required for DCP with q_len > 1, so we assert here. Remove this
635-
# assert once the custom mask is support is added to FA3.
636-
if (
637-
self.dcp_world_size > 1
638-
and envs.VLLM_ATTENTION_BACKEND != "FLASH_ATTN_MLA"
639-
):
640-
assert self.reorder_batch_threshold == 1, (
641-
"DCP not support reorder_batch_threshold > 1 now."
642-
)
643 633
reorder_batch_to_split_decodes_and_prefills(
644 634
self.input_batch,
645 635
scheduler_output,

0 commit comments

Comments
 (0)