Skip to content

Commit d3ab240

Browse files
authored
[Bug] Fix deepep low latency use nvlink by default (vllm-project#27677)
Signed-off-by: yewentao256 <zhyanwentao@126.com>
1 parent 9466661 commit d3ab240

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

vllm/envs.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -205,7 +205,7 @@
205205
VLLM_OBJECT_STORAGE_SHM_BUFFER_NAME: str = "VLLM_OBJECT_STORAGE_SHM_BUFFER"
206206
VLLM_DEEPEP_BUFFER_SIZE_MB: int = 1024
207207
VLLM_DEEPEP_HIGH_THROUGHPUT_FORCE_INTRA_NODE: bool = False
208-
VLLM_DEEPEP_LOW_LATENCY_ALLOW_NVLINK: bool = False
208+
VLLM_DEEPEP_LOW_LATENCY_ALLOW_NVLINK: bool = True
209209
VLLM_DEEPEP_LOW_LATENCY_USE_MNNVL: bool = False
210210
VLLM_DBO_COMM_SMS: int = 20
211211
GPT_OSS_SYSTEM_TOOL_MCP_LABELS: list[str] = []
@@ -1362,7 +1362,7 @@ def get_vllm_port() -> int | None:
13621362
# Allow DeepEP to use nvlink for internode_ll kernel, turn this on for
13631363
# better latency on GB200-like systems
13641364
"VLLM_DEEPEP_LOW_LATENCY_ALLOW_NVLINK": lambda: bool(
1365-
int(os.getenv("VLLM_DEEPEP_LOW_LATENCY_ALLOW_NVLINK", "0"))
1365+
int(os.getenv("VLLM_DEEPEP_LOW_LATENCY_ALLOW_NVLINK", "1"))
13661366
),
13671367
# Allow DeepEP to use MNNVL (multi-node nvlink) for internode_ll kernel,
13681368
# turn this on for better latency on GB200-like systems

0 commit comments

Comments
 (0)