@@ -32,7 +32,7 @@ ENV CUDA_VERSION=11.8.0 \
32
32
NV_CUDA_COMPAT_VERSION=520.61.05-1
33
33
34
34
RUN dnf config-manager \
35
- --add-repo https://developer.download.nvidia.com/compute/cuda/repos/rhel8/x86_64/cuda-rhel8.repo \
35
+ --add-repo https://developer.download.nvidia.com/compute/cuda/repos/rhel9/x86_64/cuda-rhel9.repo \
36
36
&& dnf install -y \
37
37
cuda-cudart-11-8-${NV_CUDA_CUDART_VERSION} \
38
38
cuda-compat-11-8-${NV_CUDA_COMPAT_VERSION} \
@@ -53,7 +53,7 @@ ENV NV_NVTX_VERSION=11.8.86-1 \
53
53
NV_LIBNCCL_PACKAGE_VERSION=2.15.5-1+cuda11.8
54
54
55
55
RUN dnf config-manager \
56
- --add-repo https://developer.download.nvidia.com/compute/cuda/repos/rhel8/x86_64/cuda-rhel8.repo \
56
+ --add-repo https://developer.download.nvidia.com/compute/cuda/repos/rhel9/x86_64/cuda-rhel9.repo \
57
57
&& dnf install -y \
58
58
cuda-libraries-11-8-${NV_CUDA_LIB_VERSION} \
59
59
cuda-nvtx-11-8-${NV_NVTX_VERSION} \
@@ -72,7 +72,7 @@ ENV NV_CUDA_CUDART_DEV_VERSION=11.8.89-1 \
72
72
NV_LIBNCCL_DEV_PACKAGE_VERSION=2.15.5-1+cuda11.8
73
73
74
74
RUN dnf config-manager \
75
- --add-repo https://developer.download.nvidia.com/compute/cuda/repos/rhel8/x86_64/cuda-rhel8.repo \
75
+ --add-repo https://developer.download.nvidia.com/compute/cuda/repos/rhel9/x86_64/cuda-rhel9.repo \
76
76
&& dnf install -y \
77
77
cuda-command-line-tools-11-8-${NV_CUDA_LIB_VERSION} \
78
78
cuda-libraries-devel-11-8-${NV_CUDA_LIB_VERSION} \
@@ -158,7 +158,7 @@ RUN cd server && \
158
158
make gen-server && \
159
159
pip install ".[accelerate]" --no-cache-dir
160
160
161
- # Patch codegen model changes into transformers 4.34
161
+ # Patch codegen model changes into transformers 4.35
162
162
# Copies server/transformers_patch/modeling_codegen.py over the file of the same name
# under ${SITE_PACKAGES}/transformers/models/codegen/.
# NOTE(review): SITE_PACKAGES is defined outside this excerpt — presumably the Python
# site-packages directory of this stage; confirm before changing the path.
RUN cp server/transformers_patch/modeling_codegen.py ${SITE_PACKAGES}/transformers/models/codegen/modeling_codegen.py
163
163
164
164
# Install router
@@ -277,7 +277,7 @@ COPY proto proto
277
277
COPY server server
278
278
# Inside server/: run the gen-server make target, then pip-install the local package
# with the accelerate, onnx-gpu and quantize extras, without keeping pip's cache.
RUN cd server \
    && make gen-server \
    && pip install ".[accelerate, onnx-gpu, quantize]" --no-cache-dir
279
279
280
- # Patch codegen model changes into transformers 4.34.0
280
+ # Patch codegen model changes into transformers 4.35
281
281
# Copies server/transformers_patch/modeling_codegen.py over the file of the same name
# under ${SITE_PACKAGES}/transformers/models/codegen/.
# NOTE(review): SITE_PACKAGES is defined outside this excerpt — presumably the Python
# site-packages directory of this stage; confirm before changing the path.
RUN cp server/transformers_patch/modeling_codegen.py ${SITE_PACKAGES}/transformers/models/codegen/modeling_codegen.py
282
282
283
283
# Install router
0 commit comments