Skip to content

Commit 5987d32

Browse files
author
root
committed
限制最大rollout的同时，拆分rollout
1 parent c8864b0 commit 5987d32

File tree

3 files changed, with 11 additions and 14 deletions.

agentlightning/runner.py

Lines changed: 7 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -240,9 +240,9 @@ async def run_async(self) -> bool:
240240
# Pass the task input, not the whole task object
241241
result = await rollout_method(task.input, task.rollout_id, resources_update.resources)
242242
#降低最大rollout
243-
if len(result) > 40:
243+
if len(result) > 5:
244244
import random
245-
result = random.sample(result,40)
245+
result = random.sample(result,5)
246246
rollout_obj = self._to_rollout_object(result, task.rollout_id)
247247
end_time = time.time()
248248
logger.info(
@@ -254,14 +254,11 @@ async def run_async(self) -> bool:
254254
logger.exception(f"{self._log_prefix(rollout_id)} Exception during rollout.")
255255
MAX_TRY = MAX_TRY - 1
256256
finally:
257-
if rollout_obj.triplets:
258-
try:
259-
self.agent.on_rollout_end(task, rollout_obj, self, self.tracer)
260-
except Exception:
261-
logger.exception(f"{self._log_prefix(rollout_id)} Exception during on_rollout_end hook.")
262-
await self.client.post_rollout_async(rollout_obj)
263-
else:
264-
raise Exception("rollout_obj.triplets is EMPTY")
257+
try:
258+
self.agent.on_rollout_end(task, rollout_obj, self, self.tracer)
259+
except Exception:
260+
logger.exception(f"{self._log_prefix(rollout_id)} Exception during on_rollout_end hook.")
261+
await self.client.post_rollout_async(rollout_obj)
265262
return True
266263

267264
async def iter_async(self) -> int:

examples/werewolf/train.sh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -17,8 +17,8 @@ python -m agentlightning.verl \
1717
data.val_files=${DATA_DIR}/test.parquet \
1818
actor_rollout_ref.rollout.tensor_model_parallel_size=$ROLLOUT_TP_SIZE \
1919
trainer.n_gpus_per_node=${N_GPUS} \
20-
data.train_batch_size=1 \
21-
actor_rollout_ref.rollout.n=1 \
20+
data.train_batch_size=4 \
21+
actor_rollout_ref.rollout.n=4 \
2222
actor_rollout_ref.actor.ppo_mini_batch_size=8 \
2323
actor_rollout_ref.actor.ppo_micro_batch_size_per_gpu=1 \
2424
actor_rollout_ref.rollout.log_prob_micro_batch_size_per_gpu=1 \

merge.sh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
cd /root/verl && python scripts/legacy_model_merger.py merge \
22
--backend fsdp \
33
--hf_model_path /root/dataDisk/Qwen3-8B \
4-
--local_dir /root/dataDisk/checkpoints/global_step_42/actor \
5-
--target_dir /root/dataDisk/DeepWereWolf-Qwen3-8B-Grpo-Agentic1
4+
--local_dir /root/dataDisk/checkpoints/global_step_47/actor \
5+
--target_dir /root/dataDisk/DeepWereWolf-Qwen3-8B-Grpo-Agentic4

0 commit comments

Comments
 (0)