Skip to content

Commit 1f8289e

Browse files
authored
fix expertwise_scale (#3181)
1 parent 3eb9a5d commit 1f8289e

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

fastdeploy/model_executor/layers/moe/fused_moe_cutlass_backend.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -213,7 +213,7 @@ def apply_ep_decode(
213 | 213 |   | """
214 | 214 |   | # 1. Select topk experts and weights
215 | 215 |   | topk_idx, topk_weights = self.ep_decoder_runner.moe_select(layer, gate_out)
216 |     | - | expertwise_scale = getattr(layer, "up_gate_proj_in_scale_all_experts")
    | 216 | + | expertwise_scale = getattr(layer, "up_gate_proj_in_scale_all_experts", None)
217 | 217 |   | # 2. EP Dispatch
218 | 218 |   | permute_input, token_nums_per_expert, handle = self.ep_decoder_runner.dispatch(
219 | 219 |   | x, topk_idx, topk_weights, expertwise_scale=expertwise_scale

0 commit comments

Comments
 (0)