Skip to content

Commit 5c5cb18

Browse files
committed
hotfix
1 parent e774ede commit 5c5cb18

File tree

1 file changed

+0
-14
lines changed

1 file changed

+0
-14
lines changed

applications/ColossalChat/coati/distributed/grpo_consumer.py

Lines changed: 0 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -371,20 +371,6 @@ def _criterion(outputs, inputs):
371 371
kl = all_reduce_mean(torch.mean(torch.stack(kl)).to(loss.device), self.plugin).data
372 372
mean_kl.append(kl)
373 373
mean_loss.append(all_reduce_mean(loss, self.plugin).data)
374-
mini_batch_entropies.append(
375-
all_reduce_mean(
376-
(
377-
(
378-
(
379-
entropy_from_logits(policy_model_logits[:, -num_action:])
380-
* action_mask_forward_micro_batch
381-
).sum(-1)
382-
)
383-
/ action_mask_forward_micro_batch.sum(-1)
384-
).detach(),
385-
self.plugin,
386-
)
387-
)
388 374
else:
389 375
policy_model_logits = self.policy_model(
390 376
input_ids=input_ids_forward_micro_batch,

0 commit comments

Comments
 (0)