We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ff83763, commit e3f1b62 (Copy full SHA for e3f1b62)
paddlenlp/transformers/deepseek_v2/modeling_pp.py
@@ -1235,7 +1235,13 @@ def build_schedule_node(self):
1235
if self.mlp.using_flex_token:
1236
if DSV3_USE_FP8_GEMM:
1237
attn_and_gate_node = ScheduleNode(self.attn_compute_for_fusion, name="attn_and_gate_node")
1238
- fp8_fusion_moe_node = FusionMoeNode(self.mlp, name="fp8_fusion_moe_node")
+ fp8_fusion_moe_node = FusionMoeNode(
1239
+ self.mlp,
1240
+ recompute_fwd_gate_up=self.config.recompute_fwd_gate_up,
1241
+ dequant_input=self.config.dequant_input,
1242
+ is_split_group_gemm=self.config.is_split_group_gemm,
1243
+ name="fp8_fusion_moe_node",
1244
+ )
1245
post_process_node = PostProcessNode(
1246
self.config.send_mtp_embed,
1247
self.mlp.training,
0 commit comments