Skip to content

Commit 1852af7

Browse files
tastelikefeet and tastelikefeet authored
fix (#6098)
Co-authored-by: tastelikefeet <[email protected]>
1 parent bfff243 commit 1852af7

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

swift/trainers/sequence_parallel/ulysses.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -354,7 +354,7 @@ def moe_aux_loss_hook(module, args, kwargs, output):
354 354   if isinstance(router_logits, tuple):
355 355   compute_device = router_logits[0].device
356 356   router_logits = torch.cat([layer_gate.to(compute_device) for layer_gate in router_logits], dim=0)
357     - router_logits, _ = GatherLoss.apply(router_logits, None, self.sp_group)
    357 + router_logits, _ = GatherLoss.apply(router_logits, None)
358 358   router_logits = router_logits.reshape(self.sp_world_size, num_layers, sp_len,
359 359   -1).transpose(0, 1).reshape(num_layers, self.sp_world_size * sp_len,
360 360   -1)

0 commit comments

Comments
 (0)