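Fix config name: rename `actor_entropy_coeff` to `actor_entropy_coef`, and use a placeholder checkpoint path in the async GSM8K explorer example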

pan-x-c · pan-x-c · commit bfc78e57412f · 2025-05-22T16:50:15.000+08:00
diff --git a/examples/async_gsm8k/explorer.yaml b/examples/async_gsm8k/explorer.yaml
@@ -1,7 +1,7 @@
 project: "Trinity-RFT-gsm8k"
 name: "async-qwen2.5-1.5B-gsm8k"
 mode: explore
-checkpoint_root_dir: 'checkpoints/qwen2.5-1.5B-gsm8k'
+checkpoint_root_dir: '/PATH/TO/CHECKPOINT/'
 algorithm:
   algorithm_type: grpo
   repeat_times: 8
diff --git a/trinity/common/config.py b/trinity/common/config.py
@@ -266,7 +266,7 @@ class TrainerConfig:
     # trainer configs
     actor_use_kl_loss: bool = False
     actor_kl_loss_coef: float = 0.001
-    actor_entropy_coeff: float = 0.001
+    actor_entropy_coef: float = 0.001
     actor_grad_clip: float = 1.0
     actor_clip_ratio: float = 0.2
     # TODO: extract more train-related params from underlying trainer engine
diff --git a/trinity/manager/config_manager.py b/trinity/manager/config_manager.py
@@ -935,7 +935,7 @@ def _set_actor_clip_ratio(self):
             max_value=1.0,
         )
 
-    def _set_actor_entropy_coeff(self):
+    def _set_actor_entropy_coef(self):
         st.number_input(
             "Entropy Coeff",
             key="actor_entropy_coef",

| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
|  |  | `@@ -935,7 +935,7 @@ def _set_actor_clip_ratio(self):` |
| `935` | `935` | `max_value=1.0,` |
| `936` | `936` | `)` |
| `937` | `937` |  |
| `938` |  | `- def _set_actor_entropy_coeff(self):` |
|  | `938` | `+ def _set_actor_entropy_coef(self):` |
| `939` | `939` | `st.number_input(` |
| `940` | `940` | `"Entropy Coeff",` |
| `941` | `941` | `key="actor_entropy_coef",` |