Skip to content

Commit 2a29ec8

Browse files
committed
Change default finetune model to the plus version
Use --group_by_length to speed up training
1 parent 470e587 commit 2a29ec8

File tree

4 files changed

+7
-4
lines changed

4 files changed

+7
-4
lines changed

internvl_chat/evaluate.sh

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -35,9 +35,9 @@ if [ ${DATASET} == "caption-coco" ]; then
3535
torchrun \
3636
--nnodes=1 \
3737
--node_rank=0 \
38-
--master_addr=127--master_port=${MASTER_PORT}.0.0.1 \
38+
--master_addr=127.0.0.1 \
3939
--nproc_per_node=${GPUS} \
40-
\
40+
--master_port=${MASTER_PORT} \
4141
eval/caption/evaluate_caption.py --checkpoint ${CHECKPOINT} --datasets coco
4242
fi
4343

internvl_chat/shell/hermes2_yi34b/internvl_chat_v1_2_hermes2_yi34b_448_finetune.sh

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -67,6 +67,7 @@ srun -p ${PARTITION} \
6767
--lr_scheduler_type "cosine" \
6868
--logging_steps 1 \
6969
--max_seq_length 2048 \
70+
--group_by_length True \
7071
--do_train True \
7172
--grad_checkpoint True \
7273
--deepspeed "zero_stage3_config.json" \

internvl_chat/shell/hermes2_yi34b/internvl_chat_v1_2_hermes2_yi34b_448_finetune_continue.sh

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -36,7 +36,7 @@ srun -p ${PARTITION} \
3636
--quotatype=${QUOTA_TYPE} \
3737
${SRUN_ARGS} \
3838
python -u internvl/train/internvl_chat_finetune.py \
39-
--model_name_or_path "./pretrained/InternVL-Chat-Chinese-V1-2" \
39+
--model_name_or_path "./pretrained/InternVL-Chat-Chinese-V1-2-Plus" \
4040
--conv_style "Hermes-2" \
4141
--output_dir ${OUTPUT_DIR} \
4242
--meta_path "./path/to/your/custom/meta/file" \
@@ -65,6 +65,7 @@ srun -p ${PARTITION} \
6565
--lr_scheduler_type "cosine" \
6666
--logging_steps 1 \
6767
--max_seq_length 2048 \
68+
--group_by_length True \
6869
--do_train True \
6970
--grad_checkpoint True \
7071
--deepspeed "zero_stage3_config.json" \

internvl_chat/shell/hermes2_yi34b/internvl_chat_v1_2_hermes2_yi34b_448_finetune_continue_lora.sh

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -29,7 +29,7 @@ torchrun \
2929
--master_port=${MASTER_PORT} \
3030
${SRUN_ARGS} \
3131
internvl/train/internvl_chat_finetune.py \
32-
--model_name_or_path "./pretrained/InternVL-Chat-Chinese-V1-2" \
32+
--model_name_or_path "./pretrained/InternVL-Chat-Chinese-V1-2-Plus" \
3333
--conv_style "Hermes-2" \
3434
--output_dir ${OUTPUT_DIR} \
3535
--meta_path "./path/to/your/custom/meta/file" \
@@ -59,6 +59,7 @@ torchrun \
5959
--lr_scheduler_type "cosine" \
6060
--logging_steps 1 \
6161
--max_seq_length 2048 \
62+
--group_by_length True \
6263
--do_train True \
6364
--grad_checkpoint True \
6465
--deepspeed "zero_stage3_config.json" \

0 commit comments

Comments (0)