File tree Expand file tree Collapse file tree 3 files changed +0
-6
lines changed
docs/source/user-guide/pd-disaggregation Expand file tree Collapse file tree 3 files changed +0
-6
lines changed Original file line number Diff line number Diff line change @@ -20,7 +20,6 @@ vllm serve /home/models/Qwen2.5-7B-Instruct \
2020--tensor-parallel-size 1 \
2121--gpu_memory_utilization 0.87 \
2222--trust-remote-code \
23- --enforce-eager \
2423--no-enable-prefix-caching \
2524--port 7800 \
2625--block-size 128 \
@@ -49,7 +48,6 @@ vllm serve /home/models/Qwen2.5-7B-Instruct \
4948--tensor-parallel-size 1 \
5049--gpu_memory_utilization 0.87 \
5150--trust-remote-code \
52- --enforce-eager \
5351--no-enable-prefix-caching \
5452--port 7801 \
5553--block-size 128 \
Original file line number Diff line number Diff line change @@ -26,7 +26,6 @@ vllm serve /home/models/Qwen2.5-7B-Instruct \
2626--tensor-parallel-size 1 \
2727--gpu_memory_utilization 0.87 \
2828--trust-remote-code \
29- --enforce-eager \
3029--no-enable-prefix-caching \
3130--port 7800 \
3231--block-size 128 \
@@ -56,7 +55,6 @@ vllm serve /home/models/Qwen2.5-7B-Instruct \
5655--tensor-parallel-size 1 \
5756--gpu_memory_utilization 0.87 \
5857--trust-remote-code \
59- --enforce-eager \
6058--no-enable-prefix-caching \
6159--port 7801 \
6260--block-size 128 \
Original file line number Diff line number Diff line change @@ -20,7 +20,6 @@ vllm serve /home/models/Qwen2.5-7B-Instruct \
2020--tensor-parallel-size 1 \
2121--gpu_memory_utilization 0.87 \
2222--trust-remote-code \
23- --enforce-eager \
2423--no-enable-prefix-caching \
2524--port 7800 \
2625--block-size 128 \
@@ -48,7 +47,6 @@ vllm serve /home/models/Qwen2.5-7B-Instruct \
4847--tensor-parallel-size 1 \
4948--gpu_memory_utilization 0.87 \
5049--trust-remote-code \
51- --enforce-eager \
5250--no-enable-prefix-caching \
5351--port 7801 \
5452--block-size 128 \
You can’t perform that action at this time.
0 commit comments