We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9010b45 commit 17ef2d1 · Copy full SHA for 17ef2d1
scripts/quickstart/start_vllm.sh
@@ -31,7 +31,7 @@ max_num_seqs=128
31
host=0.0.0.0
32
max_model_len=16384
33
34
-KV_CACHE_DTYPE=auto
+KV_CACHE_DTYPE=fp8_inc
35
36
while getopts hw:u:p:l:b:c:sq flag; do
37
case $flag in
0 commit comments