Skip to content

Commit e3f1b62

Browse files
authored
Add fp8 opt config for dualpipe (#10804)
* add fp8 control for dualpipe * change kitchen api to paddle api
1 parent ff83763 commit e3f1b62

File tree

2 files changed

+107
-125
lines changed

2 files changed

+107
-125
lines changed

paddlenlp/transformers/deepseek_v2/modeling_pp.py

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1235,7 +1235,13 @@ def build_schedule_node(self):
12351235
if self.mlp.using_flex_token:
12361236
if DSV3_USE_FP8_GEMM:
12371237
attn_and_gate_node = ScheduleNode(self.attn_compute_for_fusion, name="attn_and_gate_node")
1238-
fp8_fusion_moe_node = FusionMoeNode(self.mlp, name="fp8_fusion_moe_node")
1238+
fp8_fusion_moe_node = FusionMoeNode(
1239+
self.mlp,
1240+
recompute_fwd_gate_up=self.config.recompute_fwd_gate_up,
1241+
dequant_input=self.config.dequant_input,
1242+
is_split_group_gemm=self.config.is_split_group_gemm,
1243+
name="fp8_fusion_moe_node",
1244+
)
12391245
post_process_node = PostProcessNode(
12401246
self.config.send_mtp_embed,
12411247
self.mlp.training,

0 commit comments

Comments
 (0)