Remove invalid_pplx check from forward

bnellnm · bnellnm · commit 48ba146818d2 · 2025-05-07T15:37:14.000Z
Signed-off-by: Bill Nell <bnell@redhat.com>
diff --git a/vllm/model_executor/layers/fused_moe/layer.py b/vllm/model_executor/layers/fused_moe/layer.py
@@ -1016,14 +1016,9 @@ def naive_multicast(self, x: torch.Tensor,
 
         return buffer
 
-    # TODO: will this be cudagraph-able? (probably not)
-    # This should not be necessary.
-    def invalid_pplx(self, hidden_states: torch.Tensor) -> bool:
-        return has_pplx and hidden_states.shape[0] < self.dp_size
-
     def forward(self, hidden_states: torch.Tensor,
                 router_logits: torch.Tensor):
-        if self.use_direct_call or self.invalid_pplx(hidden_states):
+        if self.use_direct_call:
             return self.forward_impl(hidden_states, router_logits)
         else:
             return torch.ops.vllm.moe_forward(hidden_states, router_logits,