|
1 |
| -# Please update any changes made here to |
2 |
| -# docs/source/dev/dockerfile-ubi/dockerfile-ubi.rst |
3 |
| - |
4 | 1 | ## Global Args #################################################################
|
5 | 2 | ARG BASE_UBI_IMAGE_TAG=9.4
|
6 | 3 | ARG PYTHON_VERSION=3.11
|
@@ -120,21 +117,6 @@ RUN --mount=type=cache,target=/root/.cache/pip \
|
120 | 117 | -r requirements-cuda.txt \
|
121 | 118 | -r requirements-dev.txt
|
122 | 119 |
|
123 |
| -## Proto Compilation ########################################################### |
124 |
| -FROM python-install AS gen-protos |
125 |
| - |
126 |
| -ENV PATH=/opt/vllm/bin/:$PATH |
127 |
| - |
128 |
| -RUN microdnf install -y \ |
129 |
| - make \ |
130 |
| - findutils \ |
131 |
| - && microdnf clean all |
132 |
| - |
133 |
| -RUN --mount=type=cache,target=/root/.cache/pip \ |
134 |
| - --mount=type=bind,source=Makefile,target=Makefile \ |
135 |
| - --mount=type=bind,source=proto,target=proto \ |
136 |
| - make gen-protos |
137 |
| - |
138 | 120 | ## Builder #####################################################################
|
139 | 121 | FROM dev AS build
|
140 | 122 |
|
@@ -175,9 +157,6 @@ ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64:$LD_LIBRARY_PATH
|
175 | 157 | # Copy the entire directory before building wheel
|
176 | 158 | COPY vllm vllm
|
177 | 159 |
|
178 |
| -# Copy over the generated *.pb2 files |
179 |
| -COPY --from=gen-protos /workspace/vllm/entrypoints/grpc/pb vllm/entrypoints/grpc/pb |
180 |
| - |
181 | 160 | ENV CCACHE_DIR=/root/.cache/ccache
|
182 | 161 | RUN --mount=type=cache,target=/root/.cache/ccache \
|
183 | 162 | --mount=type=cache,target=/root/.cache/pip \
|
@@ -216,18 +195,8 @@ RUN pip install \
|
216 | 195 | chmod 0755 /opt/vllm/lib/libnccl.so.2.18.1
|
217 | 196 |
|
218 | 197 |
|
219 |
| -RUN --mount=type=cache,target=/root/.cache/pip \ |
220 |
| - pip install \ |
221 |
| - # additional dependencies for the TGIS gRPC server |
222 |
| - grpcio-tools==1.63.0 \ |
223 |
| - # additional dependencies for openai api_server |
224 |
| - accelerate==0.30.0 \ |
225 |
| - # hf_transfer for faster HF hub downloads |
226 |
| - hf_transfer==0.1.6 |
227 |
| - |
228 | 198 | ENV HF_HUB_OFFLINE=1 \
|
229 | 199 | PORT=8000 \
|
230 |
| - GRPC_PORT=8033 \ |
231 | 200 | HOME=/home/vllm \
|
232 | 201 | VLLM_NCCL_SO_PATH=/opt/vllm/lib/libnccl.so.2.18.1 \
|
233 | 202 | VLLM_USAGE_SOURCE=production-docker-image \
|
|
0 commit comments