We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c1c003f, commit aebacdc (Copy full SHA for aebacdc)
vllm/model_executor/layers/fused_moe/pplx_prepare_finalize.py
@@ -249,10 +249,8 @@ def finalize(
249
if apply_router_weight_on_input:
250
topk_weights = torch.ones_like(topk_weights)
251
252
- self.a2a.combine(
253
- out_tokens=output,
254
- indices=topk_ids.view(dtype=torch.uint32),
255
- weights=topk_weights,
256
- expert_y=fused_expert_output,
257
- bound_m=bound_m,
258
- )
+ self.a2a.combine(out_tokens=output,
+ indices=topk_ids.view(dtype=torch.uint32),
+ weights=topk_weights,
+ expert_y=fused_expert_output,
+ bound_m=bound_m)
0 commit comments