File tree: 2 files changed, +6 −4 lines changed
Original file line number | Diff line number | Diff line change
@@ -5,16 +5,17 @@ ROOT_DIR=$(dirname $SCRIPT_DIR)
  5   5
  6   6   # support tp1 train eagle3 for Qwen3-VL-8B-Instruct
  7   7   NUM_GPUS=${1:-1}
      8 + BUILD_DATASET_NUM_PROC=${BUILD_DATASET_NUM_PROC:-0}
  8   9
  9  10   torchrun \
 10  11       --standalone \
 11  12       --nproc_per_node $NUM_GPUS \
 12     -     $ROOT_DIR/scripts/train_eagle3_online.py \
     13 +     $ROOT_DIR/scripts/train_eagle3.py \
 13  14       --target-model-path Qwen/Qwen3-VL-8B-Instruct \
 14  15       --draft-model-config $ROOT_DIR/configs/qwen3-vl-8b-eagle3.json \
 15  16       --train-data-path $ROOT_DIR/cache/dataset/allava4v_train.jsonl \
 16  17       --output-dir $ROOT_DIR/outputs/Qwen3-VL-8B-eagle3 \
 17     -     --build-dataset-num-proc 0 \
     18 +     --build-dataset-num-proc $BUILD_DATASET_NUM_PROC \
 18  19       --num-epochs 10 \
 19  20       --batch-size 1 \
 20  21       --learning-rate 1e-4 \
Original file line number | Diff line number | Diff line change
@@ -5,16 +5,17 @@ ROOT_DIR=$(dirname $SCRIPT_DIR)
  5   5
  6   6   # support tp1 train eagle3 for Qwen3-VL-30B-A3B-Instruct
  7   7   NUM_GPUS=${1:-1}
      8 + BUILD_DATASET_NUM_PROC=${BUILD_DATASET_NUM_PROC:-0}
  8   9
  9  10   torchrun \
 10  11       --standalone \
 11  12       --nproc_per_node $NUM_GPUS \
 12     -     $ROOT_DIR/scripts/train_eagle3_online.py \
     13 +     $ROOT_DIR/scripts/train_eagle3.py \
 13  14       --target-model-path Qwen/Qwen3-VL-30B-A3B-Instruct \
 14  15       --draft-model-config $ROOT_DIR/configs/qwen3-vl-30b-a3b-eagle3.json \
 15  16       --train-data-path $ROOT_DIR/cache/dataset/allava4v_train.jsonl \
 16  17       --output-dir $ROOT_DIR/outputs/Qwen3-VL-30B-A3B-eagle3 \
 17     -     --build-dataset-num-proc 0 \
     18 +     --build-dataset-num-proc $BUILD_DATASET_NUM_PROC \
 18  19       --num-epochs 10 \
 19  20       --batch-size 1 \
 20  21       --learning-rate 1e-4 \
You can’t perform that action at this time.
0 commit comments