fix: remove duplicated `_init_rollout_engine()` call in the Megatron GRPO trainer `__init__`

hjh0119 · hjh0119 · commit 6362eb095af4 · 2025-12-29T11:42:00.000+08:00
diff --git a/swift/megatron/trainers/grpo_trainer.py b/swift/megatron/trainers/grpo_trainer.py
@@ -54,7 +54,6 @@ def __init__(self, args: MegatronRLHFArguments, template: Template, **kwargs):
         self._prepare_metrics()
         self._init_grpo_params()
         self._init_rollout_engine()
-        self._init_rollout_engine()
         self._prepare_rewards()
         self._prepare_scheduler()
         # Initialize trainer state for reward functions to access training progress