@@ -1207,14 +1207,6 @@ def compute_hash() -> str:
1207
1207
affect the choice of different kernels or attention backends should
1208
1208
also be included in the factors list.
1209
1209
"""
1210
- factors : list [Any ] = []
1211
-
1212
- # summarize environment variables
1213
- def factorize (name : str ):
1214
- if __getattr__ (name ):
1215
- factors .append (__getattr__ (name ))
1216
- else :
1217
- factors .append ("None" )
1218
1210
1219
1211
# The values of envs may affect the computation graph.
1220
1212
# TODO(DefTruth): hash all environment variables?
@@ -1229,11 +1221,45 @@ def factorize(name: str):
1229
1221
"VLLM_DP_SIZE" ,
1230
1222
"VLLM_USE_STANDALONE_COMPILE" ,
1231
1223
"VLLM_FUSED_MOE_CHUNK_SIZE" ,
1224
+ "VLLM_FLASHINFER_MOE_BACKEND" ,
1225
+ "VLLM_V1_USE_PREFILL_DECODE_ATTENTION" ,
1226
+ "VLLM_USE_AITER_UNIFIED_ATTENTION" ,
1227
+ "VLLM_ATTENTION_BACKEND" ,
1228
+ "VLLM_USE_FLASHINFER_SAMPLER" ,
1229
+ "VLLM_FLASHINFER_FORCE_TENSOR_CORES" ,
1230
+ "VLLM_DISABLED_KERNELS" ,
1231
+ "VLLM_USE_DEEP_GEMM" ,
1232
1232
"VLLM_USE_TRTLLM_FP4_GEMM" ,
1233
+ "VLLM_USE_FLASHINFER_MOE_FP8" ,
1234
+ "VLLM_USE_FLASHINFER_MOE_FP4" ,
1235
+ "VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8" ,
1236
+ "VLLM_USE_FLASHINFER_MOE_MXFP4_BF16" ,
1237
+ "VLLM_USE_CUDNN_PREFILL" ,
1238
+ "VLLM_USE_TRTLLM_ATTENTION" ,
1239
+ "VLLM_ROCM_USE_AITER" ,
1240
+ "VLLM_ROCM_USE_AITER_PAGED_ATTN" ,
1241
+ "VLLM_ROCM_USE_AITER_LINEAR" ,
1242
+ "VLLM_ROCM_USE_AITER_MOE" ,
1243
+ "VLLM_ROCM_USE_AITER_RMSNORM" ,
1244
+ "VLLM_ROCM_USE_AITER_MLA" ,
1245
+ "VLLM_ROCM_USE_AITER_MHA" ,
1246
+ "VLLM_ROCM_USE_SKINNY_GEMM" ,
1247
+ "VLLM_ROCM_FP8_PADDING" ,
1248
+ "VLLM_ROCM_MOE_PADDING" ,
1249
+ "VLLM_ROCM_CUSTOM_PAGED_ATTN" ,
1250
+ "VLLM_ROCM_QUICK_REDUCE_QUANTIZATION" ,
1251
+ "VLLM_ROCM_QUICK_REDUCE_CAST_BF16_TO_FP16" ,
1252
+ "VLLM_ROCM_QUICK_REDUCE_MAX_SIZE_BYTES_MB" ,
1233
1253
]
1234
1254
for key in environment_variables_to_hash :
1235
- if key in environment_variables :
1236
- factorize (key )
1255
+ # if this goes out of sync with environment_variables,
1256
+ # it's not a user error, it's a bug
1257
+ assert key in environment_variables , \
1258
+ "Please update environment_variables_to_hash in envs.py"
1259
+
1260
+ factors = [
1261
+ environment_variables [key ]() for key in environment_variables_to_hash
1262
+ ]
1237
1263
1238
1264
hash_str = hashlib .md5 (str (factors ).encode (),
1239
1265
usedforsecurity = False ).hexdigest ()
0 commit comments