We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 32bb10d · commit 6acccf0 · Copy full SHA for 6acccf0
Dockerfile.ubi
@@ -195,6 +195,10 @@ RUN --mount=type=cache,target=/root/.cache/uv \
195
"$(echo /workspace/dist/*.whl)[audio,video,tensorizer]" \
196
vllm-tgis-adapter==${VLLM_TGIS_ADAPTER_VERSION}
197
198
+# Upgrade NCCL back to required version after vllm-tgis-adapter installation
199
+RUN --mount=type=cache,target=/root/.cache/uv \
200
+ HOME=/root uv pip install -U nvidia-nccl-cu12==2.26.5
201
+
202
ENV GRPC_PORT=8033 \
203
PORT=8000 \
204
# As an optimization, vLLM disables logprobs when using spec decoding by
@@ -204,4 +208,3 @@ ENV GRPC_PORT=8033 \
208
DISABLE_LOGPROBS_DURING_SPEC_DECODING=false
205
209
206
210
USER 2000
207
-ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"]
0 commit comments