We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e1efedd · commit b099c88 · Copy full SHA for b099c88
paddlenlp/transformers/deepseek_v2/modeling_pp.py
@@ -1536,7 +1536,7 @@ def overlapped_forward_backward(
1536
) = build_overlapped_nodes(forward_chunk, backward_chunk)
1537
forward_inputs = forward_pre_node.forward(forward_inputs)
1538
backward_input_grads = backward_pre_node.backward(backward_input_grads)
1539
- forward_inputs, backward_input_grads = overlap_node.forward_backward(
+ forward_inputs, backward_input_grads, _ = overlap_node.forward_backward(
1540
forward_inputs, backward_input_grads, event_to_wait
1541
)
1542
forward_inputs = forward_post_node.forward(forward_inputs)
0 commit comments