Skip to content

Commit 06c9f5c

Browse files
nvjullin authored and amd-xiaoyu12 committed
[Bugfix] Added more env vars to hash (vllm-project#22449)
Signed-off-by: Julien Lin <[email protected]> Signed-off-by: Xiao Yu <[email protected]>
1 parent 609b9c1 commit 06c9f5c

File tree

1 file changed

+36
-10
lines changed

1 file changed

+36
-10
lines changed

vllm/envs.py

Lines changed: 36 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -1205,14 +1205,6 @@ def compute_hash() -> str:
12051205
affect the choice of different kernels or attention backends should
12061206
also be included in the factors list.
12071207
"""
1208-
factors: list[Any] = []
1209-
1210-
# summarize environment variables
1211-
def factorize(name: str):
1212-
if __getattr__(name):
1213-
factors.append(__getattr__(name))
1214-
else:
1215-
factors.append("None")
12161208

12171209
# The values of envs may affect the computation graph.
12181210
# TODO(DefTruth): hash all environment variables?
@@ -1227,11 +1219,45 @@ def factorize(name: str):
12271219
"VLLM_DP_SIZE",
12281220
"VLLM_USE_STANDALONE_COMPILE",
12291221
"VLLM_FUSED_MOE_CHUNK_SIZE",
1222+
"VLLM_FLASHINFER_MOE_BACKEND",
1223+
"VLLM_V1_USE_PREFILL_DECODE_ATTENTION",
1224+
"VLLM_USE_AITER_UNIFIED_ATTENTION",
1225+
"VLLM_ATTENTION_BACKEND",
1226+
"VLLM_USE_FLASHINFER_SAMPLER",
1227+
"VLLM_FLASHINFER_FORCE_TENSOR_CORES",
1228+
"VLLM_DISABLED_KERNELS",
1229+
"VLLM_USE_DEEP_GEMM",
12301230
"VLLM_USE_TRTLLM_FP4_GEMM",
1231+
"VLLM_USE_FLASHINFER_MOE_FP8",
1232+
"VLLM_USE_FLASHINFER_MOE_FP4",
1233+
"VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8",
1234+
"VLLM_USE_FLASHINFER_MOE_MXFP4_BF16",
1235+
"VLLM_USE_CUDNN_PREFILL",
1236+
"VLLM_USE_TRTLLM_ATTENTION",
1237+
"VLLM_ROCM_USE_AITER",
1238+
"VLLM_ROCM_USE_AITER_PAGED_ATTN",
1239+
"VLLM_ROCM_USE_AITER_LINEAR",
1240+
"VLLM_ROCM_USE_AITER_MOE",
1241+
"VLLM_ROCM_USE_AITER_RMSNORM",
1242+
"VLLM_ROCM_USE_AITER_MLA",
1243+
"VLLM_ROCM_USE_AITER_MHA",
1244+
"VLLM_ROCM_USE_SKINNY_GEMM",
1245+
"VLLM_ROCM_FP8_PADDING",
1246+
"VLLM_ROCM_MOE_PADDING",
1247+
"VLLM_ROCM_CUSTOM_PAGED_ATTN",
1248+
"VLLM_ROCM_QUICK_REDUCE_QUANTIZATION",
1249+
"VLLM_ROCM_QUICK_REDUCE_CAST_BF16_TO_FP16",
1250+
"VLLM_ROCM_QUICK_REDUCE_MAX_SIZE_BYTES_MB",
12311251
]
12321252
for key in environment_variables_to_hash:
1233-
if key in environment_variables:
1234-
factorize(key)
1253+
# if this goes out of sync with environment_variables,
1254+
# it's not a user error, it's a bug
1255+
assert key in environment_variables, \
1256+
"Please update environment_variables_to_hash in envs.py"
1257+
1258+
factors = [
1259+
environment_variables[key]() for key in environment_variables_to_hash
1260+
]
12351261

12361262
hash_str = hashlib.md5(str(factors).encode(),
12371263
usedforsecurity=False).hexdigest()

0 commit comments

Comments
 (0)