update template (#286)

Jintao-Huang · web-flow · commit b441875401f1 · 2024-01-06T14:04:48.000+08:00
diff --git a/README.md b/README.md
@@ -170,7 +170,7 @@ Users can check the [documentation of SWIFT](docs/source/GetStarted/快速使用
   - Custom Dataset
 - Supported Templates:
   - Text Generation: default-generation, default-generation-bos, chatglm-generation
-  - Chat: default, chatml, baichuan, chatglm2, chatglm3, llama, openbuddy, internlm, yi, xverse, ziya, skywork, bluelm, zephyr, sus, deepseek
+  - Chat: default, qwen, baichuan, chatglm2, chatglm3, llama, openbuddy, internlm, yi, xverse, ziya, skywork, bluelm, zephyr, sus, deepseek
 
 ## 🔥SCEdit
 
diff --git a/README_CN.md b/README_CN.md
@@ -168,7 +168,7 @@ SWIFT（Scalable lightWeight Infrastructure for Fine-Tuning）是一个可扩展
   - 自定义数据集
 - 支持的对话模板:
   - 文本生成: default-generation, default-generation-bos, chatglm-generation
-  - 对话: default, chatml, baichuan, chatglm2, chatglm3, llama, openbuddy, internlm, yi, xverse, ziya, skywork, bluelm, zephyr, sus, deepseek
+  - 对话: default, qwen, baichuan, chatglm2, chatglm3, llama, openbuddy, internlm, yi, xverse, ziya, skywork, bluelm, zephyr, sus, deepseek
 
 ## 🔥SCEdit
 
diff --git a/docs/source/LLM/LLM推理文档.md b/docs/source/LLM/LLM推理文档.md
@@ -39,7 +39,7 @@ from swift.utils import seed_everything
 
 model_type = ModelType.qwen_7b_chat
 template_type = get_default_template_type(model_type)
-print(f'template_type: {template_type}')  # template_type: chatml
+print(f'template_type: {template_type}')  # template_type: qwen
 
 
 kwargs = {}
@@ -101,7 +101,7 @@ from swift.utils import seed_everything
 
 model_type = ModelType.qwen_7b_chat_int4
 template_type = get_default_template_type(model_type)
-print(f'template_type: {template_type}')  # template_type: chatml
+print(f'template_type: {template_type}')  # template_type: qwen
 
 model, tokenizer = get_model_tokenizer(model_type, model_kwargs={'device_map': 'auto'})
 
@@ -179,7 +179,7 @@ from swift.utils import seed_everything
 
 model_type = ModelType.qwen_7b_chat
 template_type = get_default_template_type(model_type)
-print(f'template_type: {template_type}')  # template_type: chatml
+print(f'template_type: {template_type}')  # template_type: qwen
 
 model, tokenizer = get_model_tokenizer(model_type, model_kwargs={'device_map': 'auto'})
 
@@ -220,7 +220,7 @@ from swift.utils import seed_everything
 
 model_type = ModelType.qwen_vl_chat
 template_type = get_default_template_type(model_type)
-print(f'template_type: {template_type}')  # template_type: chatml
+print(f'template_type: {template_type}')  # template_type: qwen
 
 model, tokenizer = get_model_tokenizer(model_type, model_kwargs={'device_map': 'auto'})
 
@@ -262,7 +262,7 @@ from swift.utils import seed_everything
 
 model_type = ModelType.qwen_audio_chat
 template_type = get_default_template_type(model_type)
-print(f'template_type: {template_type}')  # template_type: chatml
+print(f'template_type: {template_type}')  # template_type: qwen
 
 model, tokenizer = get_model_tokenizer(model_type, model_kwargs={'device_map': 'auto'})
 
diff --git a/docs/source/LLM/支持的模型和数据集.md b/docs/source/LLM/支持的模型和数据集.md
@@ -15,26 +15,26 @@
 | Model Type | Model ID | Default Lora Target Modules | Default Template | Support Flash Attn | Support VLLM | Requires |
 | ---------  | -------- | --------------------------- | ---------------- | ------------------ | ------------ | -------- |
 |qwen-1_8b|[qwen/Qwen-1_8B](https://modelscope.cn/models/qwen/Qwen-1_8B/summary)|c_attn|default-generation|&#x2714;|&#x2714;||
-|qwen-1_8b-chat|[qwen/Qwen-1_8B-Chat](https://modelscope.cn/models/qwen/Qwen-1_8B-Chat/summary)|c_attn|chatml|&#x2714;|&#x2714;||
-|qwen-1_8b-chat-int4|[qwen/Qwen-1_8B-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-1_8B-Chat-Int4/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
-|qwen-1_8b-chat-int8|[qwen/Qwen-1_8B-Chat-Int8](https://modelscope.cn/models/qwen/Qwen-1_8B-Chat-Int8/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|qwen-1_8b-chat|[qwen/Qwen-1_8B-Chat](https://modelscope.cn/models/qwen/Qwen-1_8B-Chat/summary)|c_attn|qwen|&#x2714;|&#x2714;||
+|qwen-1_8b-chat-int4|[qwen/Qwen-1_8B-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-1_8B-Chat-Int4/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|qwen-1_8b-chat-int8|[qwen/Qwen-1_8B-Chat-Int8](https://modelscope.cn/models/qwen/Qwen-1_8B-Chat-Int8/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
 |qwen-7b|[qwen/Qwen-7B](https://modelscope.cn/models/qwen/Qwen-7B/summary)|c_attn|default-generation|&#x2714;|&#x2714;||
-|qwen-7b-chat|[qwen/Qwen-7B-Chat](https://modelscope.cn/models/qwen/Qwen-7B-Chat/summary)|c_attn|chatml|&#x2714;|&#x2714;||
-|qwen-7b-chat-int4|[qwen/Qwen-7B-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-7B-Chat-Int4/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
-|qwen-7b-chat-int8|[qwen/Qwen-7B-Chat-Int8](https://modelscope.cn/models/qwen/Qwen-7B-Chat-Int8/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|qwen-7b-chat|[qwen/Qwen-7B-Chat](https://modelscope.cn/models/qwen/Qwen-7B-Chat/summary)|c_attn|qwen|&#x2714;|&#x2714;||
+|qwen-7b-chat-int4|[qwen/Qwen-7B-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-7B-Chat-Int4/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|qwen-7b-chat-int8|[qwen/Qwen-7B-Chat-Int8](https://modelscope.cn/models/qwen/Qwen-7B-Chat-Int8/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
 |qwen-14b|[qwen/Qwen-14B](https://modelscope.cn/models/qwen/Qwen-14B/summary)|c_attn|default-generation|&#x2714;|&#x2714;||
-|qwen-14b-chat|[qwen/Qwen-14B-Chat](https://modelscope.cn/models/qwen/Qwen-14B-Chat/summary)|c_attn|chatml|&#x2714;|&#x2714;||
-|qwen-14b-chat-int4|[qwen/Qwen-14B-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-14B-Chat-Int4/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
-|qwen-14b-chat-int8|[qwen/Qwen-14B-Chat-Int8](https://modelscope.cn/models/qwen/Qwen-14B-Chat-Int8/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|qwen-14b-chat|[qwen/Qwen-14B-Chat](https://modelscope.cn/models/qwen/Qwen-14B-Chat/summary)|c_attn|qwen|&#x2714;|&#x2714;||
+|qwen-14b-chat-int4|[qwen/Qwen-14B-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-14B-Chat-Int4/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|qwen-14b-chat-int8|[qwen/Qwen-14B-Chat-Int8](https://modelscope.cn/models/qwen/Qwen-14B-Chat-Int8/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
 |qwen-72b|[qwen/Qwen-72B](https://modelscope.cn/models/qwen/Qwen-72B/summary)|c_attn|default-generation|&#x2714;|&#x2714;||
-|qwen-72b-chat|[qwen/Qwen-72B-Chat](https://modelscope.cn/models/qwen/Qwen-72B-Chat/summary)|c_attn|chatml|&#x2714;|&#x2714;||
-|qwen-72b-chat-int4|[qwen/Qwen-72B-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-72B-Chat-Int4/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
-|qwen-72b-chat-int8|[qwen/Qwen-72B-Chat-Int8](https://modelscope.cn/models/qwen/Qwen-72B-Chat-Int8/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|qwen-72b-chat|[qwen/Qwen-72B-Chat](https://modelscope.cn/models/qwen/Qwen-72B-Chat/summary)|c_attn|qwen|&#x2714;|&#x2714;||
+|qwen-72b-chat-int4|[qwen/Qwen-72B-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-72B-Chat-Int4/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|qwen-72b-chat-int8|[qwen/Qwen-72B-Chat-Int8](https://modelscope.cn/models/qwen/Qwen-72B-Chat-Int8/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
 |qwen-vl|[qwen/Qwen-VL](https://modelscope.cn/models/qwen/Qwen-VL/summary)|c_attn|default-generation|&#x2714;|&#x2718;||
-|qwen-vl-chat|[qwen/Qwen-VL-Chat](https://modelscope.cn/models/qwen/Qwen-VL-Chat/summary)|c_attn|chatml|&#x2714;|&#x2718;||
-|qwen-vl-chat-int4|[qwen/Qwen-VL-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-VL-Chat-Int4/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|qwen-vl-chat|[qwen/Qwen-VL-Chat](https://modelscope.cn/models/qwen/Qwen-VL-Chat/summary)|c_attn|qwen|&#x2714;|&#x2718;||
+|qwen-vl-chat-int4|[qwen/Qwen-VL-Chat-Int4](https://modelscope.cn/models/qwen/Qwen-VL-Chat-Int4/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
 |qwen-audio|[qwen/Qwen-Audio](https://modelscope.cn/models/qwen/Qwen-Audio/summary)|c_attn|default-generation|&#x2714;|&#x2718;||
-|qwen-audio-chat|[qwen/Qwen-Audio-Chat](https://modelscope.cn/models/qwen/Qwen-Audio-Chat/summary)|c_attn|chatml|&#x2714;|&#x2718;||
+|qwen-audio-chat|[qwen/Qwen-Audio-Chat](https://modelscope.cn/models/qwen/Qwen-Audio-Chat/summary)|c_attn|qwen|&#x2714;|&#x2718;||
 |chatglm2-6b|[ZhipuAI/chatglm2-6b](https://modelscope.cn/models/ZhipuAI/chatglm2-6b/summary)|query_key_value|chatglm2|&#x2718;|&#x2714;||
 |chatglm2-6b-32k|[ZhipuAI/chatglm2-6b-32k](https://modelscope.cn/models/ZhipuAI/chatglm2-6b-32k/summary)|query_key_value|chatglm2|&#x2718;|&#x2714;||
 |chatglm3-6b-base|[ZhipuAI/chatglm3-6b-base](https://modelscope.cn/models/ZhipuAI/chatglm3-6b-base/summary)|query_key_value|chatglm-generation|&#x2718;|&#x2714;||
@@ -100,8 +100,8 @@
 |polylm-13b|[damo/nlp_polylm_13b_text_generation](https://modelscope.cn/models/damo/nlp_polylm_13b_text_generation/summary)|c_attn|default-generation|&#x2718;|&#x2718;||
 |seqgpt-560m|[damo/nlp_seqgpt-560m](https://modelscope.cn/models/damo/nlp_seqgpt-560m/summary)|query_key_value|default-generation|&#x2718;|&#x2714;||
 |tongyi-finance-14b|[TongyiFinance/Tongyi-Finance-14B](https://modelscope.cn/models/TongyiFinance/Tongyi-Finance-14B/summary)|c_attn|default-generation|&#x2714;|&#x2714;||
-|tongyi-finance-14b-chat|[TongyiFinance/Tongyi-Finance-14B-Chat](https://modelscope.cn/models/TongyiFinance/Tongyi-Finance-14B-Chat/summary)|c_attn|chatml|&#x2714;|&#x2714;||
-|tongyi-finance-14b-chat-int4|[TongyiFinance/Tongyi-Finance-14B-Chat-Int4](https://modelscope.cn/models/TongyiFinance/Tongyi-Finance-14B-Chat-Int4/summary)|c_attn|chatml|&#x2714;|&#x2718;|auto_gptq>=0.5|
+|tongyi-finance-14b-chat|[TongyiFinance/Tongyi-Finance-14B-Chat](https://modelscope.cn/models/TongyiFinance/Tongyi-Finance-14B-Chat/summary)|c_attn|qwen|&#x2714;|&#x2714;||
+|tongyi-finance-14b-chat-int4|[TongyiFinance/Tongyi-Finance-14B-Chat-Int4](https://modelscope.cn/models/TongyiFinance/Tongyi-Finance-14B-Chat-Int4/summary)|c_attn|qwen|&#x2714;|&#x2718;|auto_gptq>=0.5|
 |codefuse-codellama-34b-chat|[codefuse-ai/CodeFuse-CodeLlama-34B](https://modelscope.cn/models/codefuse-ai/CodeFuse-CodeLlama-34B/summary)|q_proj, k_proj, v_proj|codefuse-codellama|&#x2714;|&#x2714;||
 |deepseek-coder-1_3b|[deepseek-ai/deepseek-coder-1.3b-base](https://modelscope.cn/models/deepseek-ai/deepseek-coder-1.3b-base/summary)|q_proj, k_proj, v_proj|default-generation-bos|&#x2714;|&#x2714;||
 |deepseek-coder-1_3b-chat|[deepseek-ai/deepseek-coder-1.3b-instruct](https://modelscope.cn/models/deepseek-ai/deepseek-coder-1.3b-instruct/summary)|q_proj, k_proj, v_proj|deepseek-coder|&#x2714;|&#x2714;||
diff --git a/examples/pytorch/llm/scripts/qwen_14b_chat/lora_ddp_ds/sft.sh b/examples/pytorch/llm/scripts/qwen_14b_chat/lora_ddp_ds/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_14b_chat/qlora/sft.sh b/examples/pytorch/llm/scripts/qwen_14b_chat/qlora/sft.sh
@@ -8,7 +8,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --dataset blossom-math-zh \
diff --git a/examples/pytorch/llm/scripts/qwen_14b_chat/qlora_ddp_ds/sft.sh b/examples/pytorch/llm/scripts/qwen_14b_chat/qlora_ddp_ds/sft.sh
@@ -13,7 +13,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_14b_chat_int4/qlora/sft.sh b/examples/pytorch/llm/scripts/qwen_14b_chat_int4/qlora/sft.sh
@@ -7,7 +7,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --dataset leetcode-python-en \
diff --git a/examples/pytorch/llm/scripts/qwen_14b_chat_int4/qlora_ddp_ds/sft.sh b/examples/pytorch/llm/scripts/qwen_14b_chat_int4/qlora_ddp_ds/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_14b_chat_int8/qlora/sft.sh b/examples/pytorch/llm/scripts/qwen_14b_chat_int8/qlora/sft.sh
@@ -7,7 +7,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --dataset blossom-math-zh \
diff --git a/examples/pytorch/llm/scripts/qwen_14b_chat_int8/qlora_ddp_ds/sft.sh b/examples/pytorch/llm/scripts/qwen_14b_chat_int8/qlora_ddp_ds/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_72b_chat/lora_mp/sft.sh b/examples/pytorch/llm/scripts/qwen_72b_chat/lora_mp/sft.sh
@@ -7,7 +7,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --dataset leetcode-python-en \
diff --git a/examples/pytorch/llm/scripts/qwen_72b_chat/lora_mp_ddp/sft.sh b/examples/pytorch/llm/scripts/qwen_72b_chat/lora_mp_ddp/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_72b_chat/qlora/sft.sh b/examples/pytorch/llm/scripts/qwen_72b_chat/qlora/sft.sh
@@ -8,7 +8,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --dataset blossom-math-zh \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat/full_mp/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat/full_mp/sft.sh
@@ -6,7 +6,7 @@ python llm_sft.py \
     --model_id_or_path qwen/Qwen-7B-Chat \
     --model_revision master \
     --sft_type full \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --dataset damo-agent-zh \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat/full_mp_ddp/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat/full_mp_ddp/sft.sh
@@ -11,7 +11,7 @@ torchrun \
     --model_id_or_path qwen/Qwen-7B-Chat \
     --model_revision master \
     --sft_type full \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --dataset medical-en medical-zh \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat/lora/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat/lora/sft.sh
@@ -7,7 +7,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --dataset blossom-math-zh \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat/lora_ddp/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat/lora_ddp/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat/lora_ddp_ds/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat/lora_ddp_ds/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat/lora_mp_ddp/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat/lora_mp_ddp/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat/qlora/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat/qlora/sft.sh
@@ -8,7 +8,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --dataset damo-agent-mini-zh \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat/qlora_ddp/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat/qlora_ddp/sft.sh
@@ -13,7 +13,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat/qlora_ddp_ds/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat/qlora_ddp_ds/sft.sh
@@ -13,7 +13,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat_int4/qlora/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat_int4/qlora/sft.sh
@@ -7,7 +7,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --dataset leetcode-python-en \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat_int4/qlora_ddp_ds/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat_int4/qlora_ddp_ds/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat_int8/qlora/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat_int8/qlora/sft.sh
@@ -7,7 +7,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --dataset leetcode-python-en \
diff --git a/examples/pytorch/llm/scripts/qwen_7b_chat_int8/qlora_ddp_ds/sft.sh b/examples/pytorch/llm/scripts/qwen_7b_chat_int8/qlora_ddp_ds/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/qwen_vl_chat/qlora/sft.sh b/examples/pytorch/llm/scripts/qwen_vl_chat/qlora/sft.sh
@@ -8,7 +8,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype AUTO \
     --output_dir output \
     --dataset coco-mini-en \
diff --git a/examples/pytorch/llm/scripts/qwen_vl_chat_int4/qlora/sft.sh b/examples/pytorch/llm/scripts/qwen_vl_chat_int4/qlora/sft.sh
@@ -7,7 +7,7 @@ python llm_sft.py \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --dataset coco-mini-en \
diff --git a/examples/pytorch/llm/scripts/qwen_vl_chat_int4/qlora_ddp_ds/sft.sh b/examples/pytorch/llm/scripts/qwen_vl_chat_int4/qlora_ddp_ds/sft.sh
@@ -12,7 +12,7 @@ torchrun \
     --model_revision master \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --ddp_backend nccl \
diff --git a/examples/pytorch/llm/scripts/tongyi_finance_14b_chat_int4/qlora/sft.sh b/examples/pytorch/llm/scripts/tongyi_finance_14b_chat_int4/qlora/sft.sh
@@ -6,7 +6,7 @@ python llm_sft.py \
     --model_type tongyi-finance-14b-chat-int4 \
     --sft_type lora \
     --tuner_backend swift \
-    --template_type chatml \
+    --template_type qwen \
     --dtype fp16 \
     --output_dir output \
     --custom_train_dataset_path xxx.jsonl \
diff --git a/swift/llm/utils/argument.py b/swift/llm/utils/argument.py
@@ -589,8 +589,8 @@ def handle_compatibility(args: Union[SftArguments, InferArguments]) -> None:
         args.dataset = args.dataset[0].split(',')
     if args.template_type == 'chatglm2-generation':
         args.template_type = 'chatglm-generation'
-    if args.template_type == 'qwen':
-        args.template_type = TemplateType.chatml
+    if args.template_type == 'chatml':
+        args.template_type = TemplateType.qwen
     if (isinstance(args, InferArguments) and args.show_dataset_sample != 10
             and args.val_dataset_sample == 10):
         # args.val_dataset_sample is the default value and args.show_dataset_sample is not the default value.
diff --git a/swift/llm/utils/model.py b/swift/llm/utils/model.py
diff --git a/swift/llm/utils/template.py b/swift/llm/utils/template.py
diff --git a/swift/llm/utils/vllm_utils.py b/swift/llm/utils/vllm_utils.py
diff --git a/tests/llm/test_template.py b/tests/llm/test_template.py