We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 176244a · commit f83d4df · Copy full SHA for f83d4df
vllm/model_executor/models/qwen3_moe.py
@@ -149,7 +149,7 @@ def __init__(
149
self.gate = ReplicatedLinear(config.hidden_size,
150
config.num_experts,
151
bias=False,
152
- quant_config=quant_config,
+ quant_config=None,
153
prefix=f"{prefix}.gate")
154
155
def forward(self, hidden_states: torch.Tensor) -> torch.Tensor:
0 commit comments