File tree Expand file tree Collapse file tree 2 files changed +4
-2
lines changed
vllm/model_executor/models Expand file tree Collapse file tree 2 files changed +4
-2
lines changed Original file line number Diff line number Diff line change @@ -137,7 +137,8 @@ def __init__(
137
137
topk_group = config .topk_group ,
138
138
prefix = f"{ prefix } .experts" ,
139
139
scoring_func = config .scoring_func ,
140
- routed_scaling_factor = self .routed_scaling_factor ,
140
+ # Scaling is applied outside, so set the factor to 1.0 here to avoid multiplying twice.
141
+ routed_scaling_factor = 1.0 ,
141
142
e_score_correction_bias = self .gate .e_score_correction_bias )
142
143
143
144
if config .n_shared_experts is not None :
Original file line number Diff line number Diff line change @@ -159,7 +159,8 @@ def __init__(
159
159
topk_group = config .topk_group ,
160
160
prefix = f"{ prefix } .experts" ,
161
161
scoring_func = "sigmoid" ,
162
- routed_scaling_factor = self .routed_scaling_factor ,
162
+ # Scaling is applied outside, so set the factor to 1.0 here to avoid multiplying twice.
163
+ routed_scaling_factor = 1.0 ,
163
164
e_score_correction_bias = self .gate .e_score_correction_bias ,
164
165
enable_eplb = self .enable_eplb ,
165
166
num_redundant_experts = self .n_redundant_experts )
You can’t perform that action at this time.
0 commit comments