3 files changed
+3
-3
lines changed| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
109 | 109 | | |
110 | 110 | | |
111 | 111 | | |
112 | | - | |
| 112 | + | |
113 | 113 | | |
114 | 114 | | |
115 | 115 | | |
| |||
187 | 187 | | |
188 | 188 | | |
189 | 189 | | |
190 | | - | |
| 190 | + | |
191 | 191 | | |
192 | 192 | | |
193 | 193 | | |
| |||
Loading
- requirements.txt-1
- run_agents/convert_model_weights.sh
- run_agents/run_agent_test.sh+1-1
- run_agents/run_code_agent.sh+5-12
- run_agents/run_gui_agent.sh+7-5
- run_agents/run_multi_node.slurm+3-3
- run_agents/run_react_agent.sh+3-3
- run_agents/run_react_agent_alfworld.sh+3-3
- run_agents/run_react_agent_search.sh+6-4
- run_agents/run_react_code_agent.sh+3-3
- run_agents/run_science_world.slurm+10-8
- run_agents/run_vlm_qa.sh+12-6
- run_agents/run_webshop_agent.sh+6-3
- run_agents/test_thinking_agent.sh+2-2
- run_agents/train_example.sh+99
- verl/single_controller/ray/base.py+1-1
- verl/trainer/config/ppo_trainer.yaml+1-1
- verl/trainer/main_ppo.py-1
- verl/trainer/ppo/ray_trainer.py+7-7
- verl/utils/dataset/rl_dataset.py+70-3
- verl/workers/actor/dp_actor.py+4-1
- verl/workers/rollout/vllm_rollout/vllm_async_server.py+3-4
0 commit comments