[MUSA] add qwen-image i2i example (#683)

yeahdongcn · web-flow · commit 0a125cbfcc28 · 2025-12-29T12:09:22.000+08:00
diff --git a/configs/platforms/mthreads_musa/qwen_image_i2i_2511.json b/configs/platforms/mthreads_musa/qwen_image_i2i_2511.json
@@ -0,0 +1,21 @@
+{
+    "vae_scale_factor": 8,
+    "infer_steps": 40,
+    "transformer_in_channels": 64,
+    "prompt_template_encode": "<|im_start|>system\nDescribe the key features of the input image (color, shape, size, texture, objects, background), then explain how the user's text instruction should alter or modify the image. Generate a new image that meets the user's requirements while maintaining consistency with the original input where appropriate.<|im_end|>\n<|im_start|>user\n{}<|im_end|>\n<|im_start|>assistant\n",
+    "prompt_template_encode_start_idx": 64,
+    "_auto_resize": true,
+    "num_layers": 60,
+    "attention_out_dim": 3072,
+    "attention_dim_head": 128,
+    "attn_type": "torch_sdpa",
+    "enable_cfg": true,
+    "sample_guide_scale": 4.0,
+    "CONDITION_IMAGE_SIZE": 147456,
+    "USE_IMAGE_ID_IN_PROMPT": true,
+    "zero_cond_t": true,
+    "modulate_type": "torch",
+    "rope_type": "torch",
+    "ln_type": "Default",
+    "rms_type": "Default"
+}
diff --git a/configs/platforms/mthreads_musa/wan_t2v.json b/configs/platforms/mthreads_musa/wan_t2v.json
@@ -11,5 +11,8 @@
     "sample_shift": 8,
     "enable_cfg": true,
     "cpu_offload": false,
-    "rope_type": "torch"
+    "modulate_type": "torch",
+    "rope_type": "torch",
+    "ln_type": "Default",
+    "rms_type": "Default"
 }
diff --git a/scripts/platforms/mthreads_musa/qwen_image_i2i_2511.sh b/scripts/platforms/mthreads_musa/qwen_image_i2i_2511.sh
@@ -0,0 +1,24 @@
+#!/bin/bash
+
+# System management interface: mx-smi
+
+# set path and first
+lightx2v_path=
+model_path=
+
+export PLATFORM=musa
+export MUSA_VISIBLE_DEVICES=0
+
+# set environment variables
+source ${lightx2v_path}/scripts/base/base.sh
+
+python -m lightx2v.infer \
+    --model_cls qwen_image \
+    --task i2i \
+    --model_path $model_path \
+    --config_json ${lightx2v_path}/configs/platforms/mthreads_musa/qwen_image_i2i_2511.json \
+    --prompt "Make the girl from Image 1 wear the black dress from Image 2 and sit in the pose from Image 3." \
+    --negative_prompt " " \
+    --image_path "1.png,2.png,3.png" \
+    --save_result_path ${lightx2v_path}/save_results/qwen_image_i2i_2511.png \
+    --seed 0