File tree Expand file tree Collapse file tree 3 files changed +4
-4
lines changed
Expand file tree Collapse file tree 3 files changed +4
-4
lines changed Original file line number Diff line number Diff line change 3434 description : " vLLM version"
3535 required : false
3636 type : string
37- default: "0.12.0"
37+ default: "0.17.0"
3838 sglangVersion :
3939 description : " SGLang version"
4040 required : false
@@ -230,7 +230,7 @@ jobs:
230230 env :
231231 RELEASE_TAG : ${{ needs.prepare.outputs.release_tag }}
232232 LLAMA_SERVER_VERSION : ${{ inputs.llamaServerVersion || 'latest' }}
233- VLLM_VERSION : ${{ inputs.vllmVersion || '0.12.0' }}
233+ VLLM_VERSION : ${{ inputs.vllmVersion }}
234234 SGLANG_VERSION : ${{ inputs.sglangVersion || '0.4.0' }}
235235 PUSH_LATEST : ${{ inputs.pushLatest || 'false' }}
236236 BUILD_MUSA_CANN : ${{ inputs.buildMusaCann || 'false' }}
Original file line number Diff line number Diff line change @@ -90,7 +90,7 @@ ENTRYPOINT ["/app/model-runner"]
9090# --- vLLM variant ---
9191FROM llamacpp AS vllm
9292
93- ARG VLLM_VERSION=0.12.0
93+ ARG VLLM_VERSION=0.17.0
9494ARG VLLM_CUDA_VERSION=cu130
9595ARG VLLM_PYTHON_TAG=cp38-abi3
9696ARG TARGETARCH
Original file line number Diff line number Diff line change @@ -5,7 +5,7 @@ LLAMA_SERVER_VERSION := latest
55LLAMA_SERVER_VARIANT := cpu
66BASE_IMAGE := ubuntu:24.04
77VLLM_BASE_IMAGE := nvidia/cuda:13.0.2-runtime-ubuntu24.04
8- VLLM_VERSION ?= 0.12.0
8+ VLLM_VERSION ?= 0.17.0
99DOCKER_IMAGE := docker/model-runner:latest
1010DOCKER_IMAGE_VLLM := docker/model-runner:latest-vllm-cuda
1111DOCKER_IMAGE_SGLANG := docker/model-runner:latest-sglang
You can’t perform that action at this time.
0 commit comments