Skip to content

Commit 0982de7

Browse files
committed
fix_yaml
1 parent 501554b commit 0982de7

File tree

2 files changed: 8 additions and 6 deletions.

tests/config/benchmark/config/sft/Qwen3-VL-30B-A3B-Instruct.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ train_dataset_prob: "1.0"
 eval_dataset_path: /root/paddlejob/share-storage/gpfs/system-public/efficient_benchmark/dataset/coco_grounding/val.jsonl
 eval_dataset_prob: "1.0"
 max_seq_len: 8192
-packing: false
+packing: true
 mix_strategy: concat
 template_backend: custom
 template: qwen3_vl
@@ -31,7 +31,7 @@ evaluation_strategy: steps
 save_steps: 500
 save_strategy: steps
 logging_steps: 1
-gradient_accumulation_steps: 8
+gradient_accumulation_steps: 16
 logging_dir: ./vdl_log
 output_dir: ./checkpoints/qwen3-vl-sft-full
 disable_tqdm: true
@@ -61,7 +61,7 @@ moe_grouped_gemm: true
 moe_deep_gemm: true
 
 apply_rope_fusion: False
-# moe_router_force_load_balancing: true
+moe_router_force_load_balancing: false
 
 # sharding
 split_param: true

tests/config/benchmark/config/sft/Qwen3-VL-8B-Instruct.yaml

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ save_steps: 500
 save_strategy: steps
 logging_steps: 1
 save_total_limit: 1
-gradient_accumulation_steps: 8
+gradient_accumulation_steps: 32
 logging_dir: ./vdl_log_sft_full_tp_8B_coco
 output_dir: ./checkpoints/qwen3-vl-sft-full-tp-8B_coco
 disable_tqdm: true
@@ -44,7 +44,7 @@ warmup_steps: 20
 learning_rate: 1.0e-5
 
 # performance
-tensor_model_parallel_size: 4
+tensor_model_parallel_size: 2
 pipeline_model_parallel_size: 1
 sharding: stage1
 recompute_granularity: full
@@ -57,4 +57,6 @@ save_checkpoint_format: "flex_checkpoint"
 load_checkpoint_format: "flex_checkpoint"
 freeze_config: freeze_vision freeze_aligner
 
-benchmark: true
+benchmark: true
+dataloader_num_workers: 8
+prefetch_factor: 8

0 commit comments

Comments
 (0)