Skip to content

Commit a258ad8

Browse files
authored
[Bugfix] fix qwen3 moe fp8 accuracy issue (#23031)
Signed-off-by: Jinzhen Lin <[email protected]>
1 parent bf7f470 commit a258ad8

File tree

1 file changed

+4 -0 lines changed
  • vllm/model_executor/layers/quantization

1 file changed

+4
-0
lines changed

vllm/model_executor/layers/quantization/fp8.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -125,6 +125,10 @@ def from_config(cls, config: dict[str, Any]) -> "Fp8Config":
         ignored_layers = cls.get_from_keys_or(config, ["ignored_layers"], None)
         weight_block_size = cls.get_from_keys_or(config, ["weight_block_size"],
                                                  None)
+        if not ignored_layers:
+            ignored_layers = cls.get_from_keys_or(config,
+                                                  ["modules_to_not_convert"],
+                                                  None)
         return cls(is_checkpoint_fp8_serialized=is_checkpoint_fp8_serialized,
                    activation_scheme=activation_scheme,
                    ignored_layers=ignored_layers,

0 commit comments

Comments
 (0)