We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 005ae9b commit 3fb686f Copy full SHA for 3fb686f
vllm/compilation/collective_fusion.py
@@ -176,7 +176,7 @@ def call_trtllm_fused_allreduce_norm(
176
use_flashinfer = allreduce_in.shape[0] * allreduce_in.shape[
177
1] * allreduce_in.element_size() <= min(
178
_FI_MAX_SIZES[world_size],
179
- max_token_num * allreduce_in.shape[0] *
+ max_token_num * allreduce_in.shape[1] *
180
allreduce_in.element_size(),
181
)
182
if use_flashinfer:
0 commit comments