We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent f58d9b6, commit 0484b64 (Copy full SHA for 0484b64)
vllm/model_executor/layers/fused_moe/layer.py
@@ -1959,6 +1959,8 @@ def get_expert_weights(self) -> Iterable[torch.Tensor]:
1959
if name not in NON_EXPERT_WEIGHTS
1960
and weight.shape != torch.Size([])
1961
and not name.startswith("_shared_experts.")
1962
+ # exclude parameters from non-expert submodules (e.g. gate/shared)
1963
+ and not name.startswith("_gate.")
1964
]
1965
1966
def set_eplb_state(
0 commit comments