Skip to content

Commit 6a6c38e

Browse files
committed
update configs
1 parent fbbcea7 commit 6a6c38e

File tree

2 files changed

+6
-4
lines changed

2 files changed

+6
-4
lines changed

examples/run_qwen3_vl_dense_eagle3_online.sh

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,16 +5,17 @@ ROOT_DIR=$(dirname $SCRIPT_DIR)
 
 # support tp1 train eagle3 for Qwen3-VL-8B-Instruct
 NUM_GPUS=${1:-1}
+BUILD_DATASET_NUM_PROC=${BUILD_DATASET_NUM_PROC:-0}
 
 torchrun \
 --standalone \
 --nproc_per_node $NUM_GPUS \
-$ROOT_DIR/scripts/train_eagle3_online.py \
+$ROOT_DIR/scripts/train_eagle3.py \
 --target-model-path Qwen/Qwen3-VL-8B-Instruct \
 --draft-model-config $ROOT_DIR/configs/qwen3-vl-8b-eagle3.json \
 --train-data-path $ROOT_DIR/cache/dataset/allava4v_train.jsonl \
 --output-dir $ROOT_DIR/outputs/Qwen3-VL-8B-eagle3 \
---build-dataset-num-proc 0 \
+--build-dataset-num-proc $BUILD_DATASET_NUM_PROC \
 --num-epochs 10 \
 --batch-size 1 \
 --learning-rate 1e-4 \

examples/run_qwen3_vl_moe_eagle3_online.sh

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,16 +5,17 @@ ROOT_DIR=$(dirname $SCRIPT_DIR)
 
 # support tp1 train eagle3 for Qwen3-VL-30B-A3B-Instruct
 NUM_GPUS=${1:-1}
+BUILD_DATASET_NUM_PROC=${BUILD_DATASET_NUM_PROC:-0}
 
 torchrun \
 --standalone \
 --nproc_per_node $NUM_GPUS \
-$ROOT_DIR/scripts/train_eagle3_online.py \
+$ROOT_DIR/scripts/train_eagle3.py \
 --target-model-path Qwen/Qwen3-VL-30B-A3B-Instruct \
 --draft-model-config $ROOT_DIR/configs/qwen3-vl-30b-a3b-eagle3.json \
 --train-data-path $ROOT_DIR/cache/dataset/allava4v_train.jsonl \
 --output-dir $ROOT_DIR/outputs/Qwen3-VL-30B-A3B-eagle3 \
---build-dataset-num-proc 0 \
+--build-dataset-num-proc $BUILD_DATASET_NUM_PROC \
 --num-epochs 10 \
 --batch-size 1 \
 --learning-rate 1e-4 \

0 commit comments

Comments
 (0)