File tree Expand file tree Collapse file tree 1 file changed +5
-2
lines changed Expand file tree Collapse file tree 1 file changed +5
-2
lines changed Original file line number Diff line number Diff line change @@ -183,6 +183,9 @@ ARG PYTORCH_VERSION
183
183
ARG PYTHON_VERSION
184
184
ARG MINIFORGE_VERSION=23.3.1-1
185
185
186
+ # consistent arch support anywhere we compile CUDA code
187
+ ENV TORCH_CUDA_ARCH_LIST="8.0;8.6+PTX;8.9"
188
+
186
189
RUN dnf install -y unzip git ninja-build && dnf clean all
187
190
188
191
RUN curl -fsSL -v -o ~/miniforge3.sh -O "https://github.com/conda-forge/miniforge/releases/download/${MINIFORGE_VERSION}/Miniforge3-$(uname)-$(uname -m).sh" && \
@@ -231,15 +234,15 @@ FROM python-builder as exllama-kernels-builder
231
234
WORKDIR /usr/src
232
235
233
236
COPY server/exllama_kernels/ .
234
- RUN TORCH_CUDA_ARCH_LIST="8.0;8.6+PTX;8.9" python setup.py build
237
+ RUN python setup.py build
235
238
236
239
## Build transformers exllamav2 kernels ########################################
237
240
FROM python-builder as exllamav2-kernels-builder
238
241
239
242
WORKDIR /usr/src
240
243
241
244
COPY server/exllamav2_kernels/ .
242
- RUN TORCH_CUDA_ARCH_LIST="8.0;8.6+PTX;8.9" python setup.py build
245
+ RUN python setup.py build
243
246
244
247
## Flash attention cached build image ##########################################
245
248
FROM base as flash-att-cache
You can’t perform that action at this time.
0 commit comments