We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
routed_scaling_factor
1 parent 457e471, commit 930a241 (Copy full SHA for 930a241)
vllm/model_executor/models/deepseek_v2.py
@@ -160,7 +160,8 @@ def __init__(
160
topk_group=config.topk_group,
161
prefix=f"{prefix}.experts",
162
scoring_func=config.scoring_func,
163
- routed_scaling_factor=self.routed_scaling_factor,
+ # Scaling is applied outside, so set the factor to 1.0 here to avoid multiplying twice.
164
+ routed_scaling_factor=1.0,
165
e_score_correction_bias=self.gate.e_score_correction_bias,
166
enable_eplb=self.enable_eplb,
167
num_redundant_experts=self.n_redundant_experts)
0 commit comments