Add more comments on embedding deployment (#4929)

tastelikefeet · web-flow · commit 26eb2079e369 · 2025-07-13T00:10:07.000+08:00
diff --git a/examples/deploy/embedding/client.py b/examples/deploy/embedding/client.py
@@ -49,7 +49,7 @@ def run_client(host: str = '127.0.0.1', port: int = 8000):
     from swift.llm import run_deploy, DeployArguments
     with run_deploy(
             DeployArguments(
-                model='Qwen/Qwen3-Embedding-0.6B',
+                model='Qwen/Qwen3-Embedding-0.6B',  # GME/GTE models or your checkpoints are also supported
                 task_type='embedding',
                 infer_backend='vllm',
                 verbose=False,
diff --git a/examples/deploy/embedding/server.sh b/examples/deploy/embedding/server.sh
@@ -1,3 +1,5 @@
+# GME/GTE models or your checkpoints are also supported
+# pt/vllm/sglang supported
 CUDA_VISIBLE_DEVICES=0 swift deploy \
     --host 0.0.0.0 \
     --port 8000 \

Original file line number	Diff line number	Diff line change
`@@ -1,3 +1,5 @@`
	`1`	`+# GME/GTE models or your checkpoints are also supported`
	`2`	`+# pt/vllm/sglang supported`
`1`	`3`	`CUDA_VISIBLE_DEVICES=0 swift deploy \`
`2`	`4`	`--host 0.0.0.0 \`
`3`	`5`	`--port 8000 \`