File tree: 1 file changed, +1 -5 lines changed
vllm/model_executor/models: 1 file changed, +1 -5 lines changed

@@ -139,7 +139,7 @@ def __init__(
             top_k=config.num_experts_per_tok,
             hidden_size=config.hidden_size,
             intermediate_size=config.moe_intermediate_size,
-            reduce_results=False,
+            reduce_results=True,
             renormalize=config.norm_topk_prob,
             quant_config=quant_config,
             prefix=f"{prefix}.experts",
@@ -163,10 +163,6 @@ def forward(self, hidden_states: torch.Tensor) -> torch.Tensor:
         final_hidden_states = self.experts(hidden_states=hidden_states,
                                            router_logits=router_logits)
 
-        if self.tp_size > 1:
-            final_hidden_states = self.experts.maybe_all_reduce_tensor_model_parallel(  # noqa E501
-                final_hidden_states)
-
         return final_hidden_states.view(orig_shape)
 
 
You can’t perform that action at this time.
0 commit comments