Skip to content

Commit dc0141f

Browse files
authored
fix examples (#2719)
1 parent 4a280f7 commit dc0141f

File tree

8 files changed

+8
-7
lines changed

8 files changed

+8
-7
lines changed

examples/train/fsdp_qlora/train.sh

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,6 @@
11
# 14GiB * 2
22
nproc_per_node=2
33

4-
PYTHONPATH=. \
54
CUDA_VISIBLE_DEVICES=0,1 \
65
accelerate launch --config_file "./examples/train/fsdp_qlora/fsdp_offload.json" \
76
swift/cli/sft.py \

examples/train/multi-node/accelerate/train_node1.sh

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,6 @@ accelerate launch --config_file ./examples/train/multi-node/accelerate/multi_nod
1010
--lora_alpha 32 \
1111
--learning_rate 1e-4 \
1212
--gradient_accumulation_steps 16 \
13-
--gradient_checkpointing_kwargs '{"use_reentrant": false}' \
1413
--eval_steps 100 \
1514
--save_steps 100 \
1615
--save_total_limit 2 \

examples/train/multi-node/accelerate/train_node2.sh

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,6 @@ accelerate launch --config_file ./examples/train/multi-node/accelerate/multi_nod
1010
--lora_alpha 32 \
1111
--learning_rate 1e-4 \
1212
--gradient_accumulation_steps 16 \
13-
--gradient_checkpointing_kwargs '{"use_reentrant": false}' \
1413
--eval_steps 100 \
1514
--save_steps 100 \
1615
--save_total_limit 2 \

examples/train/multi-node/deepspeed/train.sh

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,7 +11,6 @@ deepspeed --hostfile=./examples/train/multi-node-deepspeed/host.txt \
1111
--lora_alpha 32 \
1212
--learning_rate 1e-4 \
1313
--gradient_accumulation_steps 16 \
14-
--gradient_checkpointing_kwargs '{"use_reentrant": false}' \
1514
--eval_steps 100 \
1615
--save_steps 100 \
1716
--save_total_limit 2 \

examples/train/multimodal/dpo.sh

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,18 @@
1-
# --rlhf_type cpo/orpo/simpo are also supported
1+
# 4*32GiB
2+
# You can refer to `https://github.com/QwenLM/Qwen2-VL` for the meaning of the `MAX_PIXELS` parameter.
3+
# --rlhf_type cpo/orpo/simpo/rm/kto are also supported
24
nproc_per_node=4
35

46
CUDA_VISIBLE_DEVICES=0,1,2,3 \
57
NPROC_PER_NODE=$nproc_per_node \
8+
MAX_PIXELS=602112 \
69
swift rlhf \
710
--rlhf_type dpo \
811
--model Qwen/Qwen2-VL-7B-Instruct \
912
--train_type lora \
1013
--dataset swift/RLAIF-V-Dataset \
1114
--num_train_epochs 1 \
1215
--learning_rate 1e-4 \
13-
--gradient_checkpointing_kwargs '{"use_reentrant": false}' \
1416
--lora_rank 8 \
1517
--lora_alpha 32 \
1618
--gradient_accumulation_steps $(expr 16 / $nproc_per_node) \

examples/train/multimodal/train.sh

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,7 @@
11
# 22GiB
2+
# You can refer to `https://github.com/QwenLM/Qwen2-VL` for the meaning of the `MAX_PIXELS` parameter.
23
CUDA_VISIBLE_DEVICES=0 \
4+
MAX_PIXELS=602112 \
35
swift sft \
46
--model Qwen/Qwen2-VL-7B-Instruct \
57
--train_type lora \

examples/train/multimodal/train_grounding.sh

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,6 @@
1+
# You can refer to `https://github.com/QwenLM/Qwen2-VL` for the meaning of the `MAX_PIXELS` parameter.
12
CUDA_VISIBLE_DEVICES=0 \
3+
MAX_PIXELS=602112 \
24
swift sft \
35
--model Qwen/Qwen2-VL-7B-Instruct \
46
--train_type lora \

examples/train/rlhf/simpo.sh

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,6 @@ swift rlhf \
1010
--num_train_epochs 1 \
1111
--learning_rate 1e-5 \
1212
--gradient_accumulation_steps $(expr 16 / $nproc_per_node) \
13-
--gradient_checkpointing_kwargs '{"use_reentrant": false}' \
1413
--warmup_ratio 0.03 \
1514
--eval_steps 100 \
1615
--save_steps 100 \

0 commit comments

Comments
 (0)