[Misc] DeepEPHighThroughput - Enable Inductor pass (#21311)

varun-sundar-rabindranath · Varun Sundar Rabindranath · web-flow · commit 8425f785ad58 · 2025-07-21T23:35:45.000-07:00
Signed-off-by: Varun Sundar Rabindranath <vsundarr@redhat.com>
Co-authored-by: Varun Sundar Rabindranath <vsundarr@redhat.com>
diff --git a/vllm/platforms/cuda.py b/vllm/platforms/cuda.py
@@ -182,9 +182,6 @@ def check_and_update_config(cls, vllm_config: "VllmConfig") -> None:
             compilation_config.use_cudagraph = False
             if model_config is not None:
                 model_config.enforce_eager = True
-            # TODO (varun): Turning this ON gives incorrect results for the
-            # Deepseek-V2-lite model.
-            vllm_config.compilation_config.use_inductor = False
 
     @classmethod
     def get_current_memory_usage(cls,