vllm-project
diff --git a/‎docs/assets/sample-output1.png‎
-75.6 KB b/‎docs/assets/sample-output1.png‎
-75.6 KB
diff --git a/‎docs/assets/sample-output2.png‎
30.6 KB b/‎docs/assets/sample-output2.png‎
30.6 KB
diff --git a/‎docs/assets/sample-output3.png‎
17.2 KB b/‎docs/assets/sample-output3.png‎
17.2 KB
diff --git a/‎docs/examples/practice_on_vllm_simulator.md‎
Lines changed: 6 additions & 3 deletions b/‎docs/examples/practice_on_vllm_simulator.md‎
Lines changed: 6 additions & 3 deletions
@@ -80,8 +80,11 @@ curl --request POST 'http://localhost:8000/v1/completions' \
 
 #### 1.5 Download Tokenizer
 
-Download Qwen/Qwen3-0.6B tokenizer.json from [Qwen/Qwen3-0.6B](https://modelscope.cn/models/Qwen/Qwen3-0.6B/files) save to local path.
-
+Download the Qwen/Qwen2.5-1.5B-Instruct tokenizer files from [Qwen/Qwen2.5-1.5B-Instruct](https://modelscope.cn/models/Qwen/Qwen2.5-1.5B-Instruct/files) and save them to a local path such as `${local_path}/Qwen2.5-1.5B-Instruct`. The directory should then contain the following files:
+```bash
+ls "${local_path}/Qwen2.5-1.5B-Instruct"
+merges.txt              tokenizer.json          tokenizer_config.json   vocab.json
+```
 ______________________________________________________________________
 
 ## 🚀 2. Running Benchmarks
@@ -90,7 +93,7 @@ ______________________________________________________________________
 guidellm benchmark \
 --target "http://localhost:8000/" \
 --model "tweet-summary-0" \
---processor "${local_path}/Qwen3-0.6B" \
+--processor "${local_path}/Qwen2.5-1.5B-Instruct" \
 --rate-type sweep \
 --max-seconds 10 \
 --max-requests 10 \