@@ -1206,14 +1206,6 @@ def compute_hash() -> str:
1206
1206
affect the choice of different kernels or attention backends should
1207
1207
also be included in the factors list.
1208
1208
"""
1209
- factors : list [Any ] = []
1210
-
1211
- # summarize environment variables
1212
- def factorize (name : str ):
1213
- if __getattr__ (name ):
1214
- factors .append (__getattr__ (name ))
1215
- else :
1216
- factors .append ("None" )
1217
1209
1218
1210
# The values of envs may affect the computation graph.
1219
1211
# TODO(DefTruth): hash all environment variables?
@@ -1228,11 +1220,45 @@ def factorize(name: str):
1228
1220
"VLLM_DP_SIZE" ,
1229
1221
"VLLM_USE_STANDALONE_COMPILE" ,
1230
1222
"VLLM_FUSED_MOE_CHUNK_SIZE" ,
1223
+ "VLLM_FLASHINFER_MOE_BACKEND" ,
1224
+ "VLLM_V1_USE_PREFILL_DECODE_ATTENTION" ,
1225
+ "VLLM_USE_AITER_UNIFIED_ATTENTION" ,
1226
+ "VLLM_ATTENTION_BACKEND" ,
1227
+ "VLLM_USE_FLASHINFER_SAMPLER" ,
1228
+ "VLLM_FLASHINFER_FORCE_TENSOR_CORES" ,
1229
+ "VLLM_DISABLED_KERNELS" ,
1230
+ "VLLM_USE_DEEP_GEMM" ,
1231
1231
"VLLM_USE_TRTLLM_FP4_GEMM" ,
1232
+ "VLLM_USE_FLASHINFER_MOE_FP8" ,
1233
+ "VLLM_USE_FLASHINFER_MOE_FP4" ,
1234
+ "VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8" ,
1235
+ "VLLM_USE_FLASHINFER_MOE_MXFP4_BF16" ,
1236
+ "VLLM_USE_CUDNN_PREFILL" ,
1237
+ "VLLM_USE_TRTLLM_ATTENTION" ,
1238
+ "VLLM_ROCM_USE_AITER" ,
1239
+ "VLLM_ROCM_USE_AITER_PAGED_ATTN" ,
1240
+ "VLLM_ROCM_USE_AITER_LINEAR" ,
1241
+ "VLLM_ROCM_USE_AITER_MOE" ,
1242
+ "VLLM_ROCM_USE_AITER_RMSNORM" ,
1243
+ "VLLM_ROCM_USE_AITER_MLA" ,
1244
+ "VLLM_ROCM_USE_AITER_MHA" ,
1245
+ "VLLM_ROCM_USE_SKINNY_GEMM" ,
1246
+ "VLLM_ROCM_FP8_PADDING" ,
1247
+ "VLLM_ROCM_MOE_PADDING" ,
1248
+ "VLLM_ROCM_CUSTOM_PAGED_ATTN" ,
1249
+ "VLLM_ROCM_QUICK_REDUCE_QUANTIZATION" ,
1250
+ "VLLM_ROCM_QUICK_REDUCE_CAST_BF16_TO_FP16" ,
1251
+ "VLLM_ROCM_QUICK_REDUCE_MAX_SIZE_BYTES_MB" ,
1232
1252
]
1233
1253
for key in environment_variables_to_hash :
1234
- if key in environment_variables :
1235
- factorize (key )
1254
+ # if this goes out of sync with environment_variables,
1255
+ # it's not a user error, it's a bug
1256
+ assert key in environment_variables , \
1257
+ "Please update environment_variables_to_hash in envs.py"
1258
+
1259
+ factors = [
1260
+ environment_variables [key ]() for key in environment_variables_to_hash
1261
+ ]
1236
1262
1237
1263
hash_str = hashlib .md5 (str (factors ).encode (),
1238
1264
usedforsecurity = False ).hexdigest ()
0 commit comments