Skip to content
This repository was archived by the owner on Sep 4, 2025. It is now read-only.

Commit 507c005

Browse files
authored
disable moe padding by default and enable fp8 padding by default (#190)
1 parent 6bd99d2 commit 507c005

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

vllm/envs.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -69,8 +69,8 @@
6969
VLLM_ALLOW_RUNTIME_LORA_UPDATING: bool = False
7070
VLLM_SYNC_SERVER_ACCUM_REQUESTS: int = 1
7171
VLLM_SYNC_SERVER_ENGINE_STEPS_BETWEEN_POLLS: int = 1
72-
VLLM_MOE_PADDING: bool = True
73-
VLLM_FP8_PADDING: bool = False
72+
VLLM_MOE_PADDING: bool = False
73+
VLLM_FP8_PADDING: bool = True
7474

7575

7676
def get_default_cache_root():
@@ -468,11 +468,11 @@ def get_default_config_root():
468468

469469
# Pad the weight for moe kernel or not
470470
"VLLM_MOE_PADDING":
471-
lambda: bool(int(os.getenv("VLLM_MOE_PADDING", "1"))),
471+
lambda: bool(int(os.getenv("VLLM_MOE_PADDING", "0"))),
472472

473473
# Pad the weight for fp8 kernel or not
474474
"VLLM_FP8_PADDING":
475-
lambda: bool(int(os.getenv("VLLM_FP8_PADDING", "0"))),
475+
lambda: bool(int(os.getenv("VLLM_FP8_PADDING", "1"))),
476476
}
477477

478478
# end-env-vars-definition

0 commit comments

Comments
 (0)