Skip to content

Commit f95d594

Browse files
authored
Merge pull request #111 from JaaackHongggg/patch-1
Update train_grpo_vlagent_v2.sh
2 parents d356727 + 7fba2c1 commit f95d594

File tree

1 file changed

+3
-5
lines changed

1 file changed

+3
-5
lines changed

examples/agent/train_grpo_vlagent_v2.sh

Lines changed: 3 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -1,20 +1,18 @@
11
set -x
22

33
# export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
4-
DATA_DIR=/cpfs/user/honglingyi/DATA/LLM/VL_Agent/parquets
54

65
PROJECT_NAME="agent_vlagent"
76
EXPERIMENT_NAME="visual_agent_env_v2_model_v3"
87

98
export SAVE_CHECKPOINT_DIR=/diancpfs/user/fengyuan/verl_checkpoints
109
# export VLLM_ATTENTION_BACKEND=XFORMERS # vllm + qwen2-7b with flash_attn has some issues
1110

12-
VISUAL_DATASET_TRAIN=/cpfs/user/honglingyi/DATA/LLM/VL_Agent/parquets/vl_agent_V1_train_box.parquet
13-
VISUAL_DATASET_TEST=/cpfs/user/honglingyi/DATA/LLM/VL_Agent/parquets/vl_agent_V1_test_box.parquet
11+
VISUAL_DATASET_TRAIN=vl_agent_V1_train_box.parquet
12+
VISUAL_DATASET_TEST=vl_agent_V1_test_box.parquet
1413

15-
# data.train_files=${DATA_DIR}/vl_agent_V1.parquet \
1614

17-
REF_MODEL_PATH=/cpfs/user/honglingyi/MODEL/Qwen/Qwen2.5-VL-32B-Instruct
15+
REF_MODEL_PATH=Qwen/Qwen2.5-VL-32B-Instruct
1816
PYTHONUNBUFFERED=1 python3 -m verl.trainer.main_ppo \
1917
data.train_files=${VISUAL_DATASET_TRAIN} \
2018
data.val_files=${VISUAL_DATASET_TEST} \

0 commit comments

Comments (0)