fix qwen 2.5 vl

DylanChen-NV · DylanChen-NV · commit 44cecced81dc · 2025-09-17T02:24:53.000Z
Signed-off-by: Dylan Chen <191843203+DylanChen-NV@users.noreply.github.com>
diff --git a/examples/llm_ptq/example_utils.py b/examples/llm_ptq/example_utils.py
@@ -56,7 +56,7 @@ def get_tokenizer(ckpt_path, trust_remote_code=False, **kwargs):
         ckpt_path, trust_remote_code=trust_remote_code, **kwargs
     )
 
-    if "qwen" in type(tokenizer).__name__.lower():
+    if "qwen" in type(tokenizer).__name__.lower() and "vl" not in ckpt_path.lower():
         # qwen use token id 151643 as pad and eos tokens
         tokenizer.pad_token = tokenizer.convert_ids_to_tokens(151643)
         tokenizer.eos_token = tokenizer.convert_ids_to_tokens(151643)
diff --git a/examples/vlm_ptq/scripts/huggingface_example.sh b/examples/vlm_ptq/scripts/huggingface_example.sh
@@ -145,6 +145,10 @@ case "${MODEL_TYPE}" in
         VISUAL_FEATURE=576
         VLM_ARGS=" --max_multimodal_len=$((BUILD_MAX_BATCH_SIZE * VISUAL_FEATURE)) "
         ;;
+    "qwen")
+        VISUAL_FEATURE=1280
+        VLM_ARGS=" --max_multimodal_len=$((BUILD_MAX_BATCH_SIZE * VISUAL_FEATURE)) "
+        ;;
     "mllama")
         PTQ_ARGS+=" --kv_cache_qformat none "
         VLM_ARGS=" --max_encoder_input_len=6404 --skip_run"

Original file line number	Diff line number	Diff line change
`@@ -56,7 +56,7 @@ def get_tokenizer(ckpt_path, trust_remote_code=False, **kwargs):`
`56`	`56`	`ckpt_path, trust_remote_code=trust_remote_code, **kwargs`
`57`	`57`	`)`
`58`	`58`
`59`		`- if "qwen" in type(tokenizer).__name__.lower():`
	`59`	`+ if "qwen" in type(tokenizer).__name__.lower() and "vl" not in ckpt_path.lower():`
`60`	`60`	`# qwen use token id 151643 as pad and eos tokens`
`61`	`61`	`tokenizer.pad_token = tokenizer.convert_ids_to_tokens(151643)`
`62`	`62`	`tokenizer.eos_token = tokenizer.convert_ids_to_tokens(151643)`