We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent fee1061 commit 6362eb0 | Copy full SHA for 6362eb0
swift/megatron/trainers/grpo_trainer.py
@@ -54,7 +54,6 @@ def __init__(self, args: MegatronRLHFArguments, template: Template, **kwargs):
54
self._prepare_metrics()
55
self._init_grpo_params()
56
self._init_rollout_engine()
57
- self._init_rollout_engine()
58
self._prepare_rewards()
59
self._prepare_scheduler()
60
# Initialize trainer state for reward functions to access training progress
0 commit comments