Skip to content

Commit 8425f78

Browse files
varun-sundar-rabindranath and Varun Sundar Rabindranath authored
[Misc] DeepEPHighThroughput - Enable Inductor pass (#21311)
Signed-off-by: Varun Sundar Rabindranath <[email protected]>
Co-authored-by: Varun Sundar Rabindranath <[email protected]>
1 parent c17231e commit 8425f78

File tree

1 file changed

+0
-3
lines changed

1 file changed

+0
-3
lines changed

vllm/platforms/cuda.py

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -182,9 +182,6 @@ def check_and_update_config(cls, vllm_config: "VllmConfig") -> None:
182  182    compilation_config.use_cudagraph = False
183  183    if model_config is not None:
184  184        model_config.enforce_eager = True
185       - # TODO (varun): Turning this ON gives incorrect results for the
186       - # Deepseek-V2-lite model.
187       - vllm_config.compilation_config.use_inductor = False
188  185
189  186    @classmethod
190  187    def get_current_memory_usage(cls,

0 commit comments

Comments
 (0)