3 files changed: +11 -14 lines changed
Original file line number Diff line number Diff line change @@ -240,9 +240,9 @@ async def run_async(self) -> bool:
240240 # Pass the task input, not the whole task object
241241 result = await rollout_method (task .input , task .rollout_id , resources_update .resources )
242242 # Lower the maximum rollout size (cap how many results are kept)
243- if len (result ) > 40 :
243+ if len (result ) > 5 :
244244 import random
245- result = random .sample (result ,40 )
245+ result = random .sample (result ,5 )
246246 rollout_obj = self ._to_rollout_object (result , task .rollout_id )
247247 end_time = time .time ()
248248 logger .info (
@@ -254,14 +254,11 @@ async def run_async(self) -> bool:
254254 logger .exception (f"{ self ._log_prefix (rollout_id )} Exception during rollout." )
255255 MAX_TRY = MAX_TRY - 1
256256 finally :
257- if rollout_obj .triplets :
258- try :
259- self .agent .on_rollout_end (task , rollout_obj , self , self .tracer )
260- except Exception :
261- logger .exception (f"{ self ._log_prefix (rollout_id )} Exception during on_rollout_end hook." )
262- await self .client .post_rollout_async (rollout_obj )
263- else :
264- raise Exception ("rollout_obj.triplets is EMPTY" )
257+ try :
258+ self .agent .on_rollout_end (task , rollout_obj , self , self .tracer )
259+ except Exception :
260+ logger .exception (f"{ self ._log_prefix (rollout_id )} Exception during on_rollout_end hook." )
261+ await self .client .post_rollout_async (rollout_obj )
265262 return True
266263
267264 async def iter_async (self ) -> int :
Original file line number Diff line number Diff line change @@ -17,8 +17,8 @@ python -m agentlightning.verl \
1717 data.val_files=${DATA_DIR} /test.parquet \
1818 actor_rollout_ref.rollout.tensor_model_parallel_size=$ROLLOUT_TP_SIZE \
1919 trainer.n_gpus_per_node=${N_GPUS} \
20- data.train_batch_size=1 \
21- actor_rollout_ref.rollout.n=1 \
20+ data.train_batch_size=4 \
21+ actor_rollout_ref.rollout.n=4 \
2222 actor_rollout_ref.actor.ppo_mini_batch_size=8 \
2323 actor_rollout_ref.actor.ppo_micro_batch_size_per_gpu=1 \
2424 actor_rollout_ref.rollout.log_prob_micro_batch_size_per_gpu=1 \
Original file line number Diff line number Diff line change 11cd /root/verl && python scripts/legacy_model_merger.py merge \
22 --backend fsdp \
33 --hf_model_path /root/dataDisk/Qwen3-8B \
4- --local_dir /root/dataDisk/checkpoints/global_step_42 /actor \
5- --target_dir /root/dataDisk/DeepWereWolf-Qwen3-8B-Grpo-Agentic1
4+ --local_dir /root/dataDisk/checkpoints/global_step_47 /actor \
5+ --target_dir /root/dataDisk/DeepWereWolf-Qwen3-8B-Grpo-Agentic4
You can’t perform that action at this time.
0 commit comments