1- FROM nvidia/cuda:12.6.3-devel-ubuntu24.04 AS base-builder
1+ FROM nvidia/cuda:12.9.1-devel-ubuntu24.04 AS base-builder
22
33ENV SCCACHE=0.10.0
44ENV RUSTC_WRAPPER=/usr/local/bin/sccache
@@ -64,6 +64,14 @@ RUN --mount=type=secret,id=actions_results_url,env=ACTIONS_RESULTS_URL \
6464 --mount=type=secret,id=actions_runtime_token,env=ACTIONS_RUNTIME_TOKEN \
6565 CUDA_COMPUTE_CAP=90 cargo chef cook --release --features candle-cuda --recipe-path recipe.json && sccache -s;
6666
67+ RUN --mount=type=secret,id=actions_results_url,env=ACTIONS_RESULTS_URL \
68+ --mount=type=secret,id=actions_runtime_token,env=ACTIONS_RUNTIME_TOKEN \
69+ CUDA_COMPUTE_CAP=100 cargo chef cook --release --features candle-cuda --recipe-path recipe.json && sccache -s;
70+
71+ RUN --mount=type=secret,id=actions_results_url,env=ACTIONS_RESULTS_URL \
72+ --mount=type=secret,id=actions_runtime_token,env=ACTIONS_RUNTIME_TOKEN \
73+ CUDA_COMPUTE_CAP=120 cargo chef cook --release --features candle-cuda --recipe-path recipe.json && sccache -s;
74+
6775COPY backends backends
6876COPY core core
6977COPY router router
@@ -88,7 +96,19 @@ RUN --mount=type=secret,id=actions_results_url,env=ACTIONS_RESULTS_URL \
8896
8997RUN mv /usr/src/target/release/text-embeddings-router /usr/src/target/release/text-embeddings-router-90
9098
91- FROM nvidia/cuda:12.6.3-base-ubuntu24.04 AS base
99+ RUN --mount=type=secret,id=actions_results_url,env=ACTIONS_RESULTS_URL \
100+ --mount=type=secret,id=actions_runtime_token,env=ACTIONS_RUNTIME_TOKEN \
101+ CUDA_COMPUTE_CAP=100 cargo build --release --bin text-embeddings-router -F candle-cuda && sccache -s;
102+
103+ RUN mv /usr/src/target/release/text-embeddings-router /usr/src/target/release/text-embeddings-router-100
104+
105+ RUN --mount=type=secret,id=actions_results_url,env=ACTIONS_RESULTS_URL \
106+ --mount=type=secret,id=actions_runtime_token,env=ACTIONS_RUNTIME_TOKEN \
107+ CUDA_COMPUTE_CAP=120 cargo build --release --bin text-embeddings-router -F candle-cuda && sccache -s;
108+
109+ RUN mv /usr/src/target/release/text-embeddings-router /usr/src/target/release/text-embeddings-router-120
110+
111+ FROM nvidia/cuda:12.9.1-runtime-ubuntu24.04 AS base
92112
93113ARG DEFAULT_USE_FLASH_ATTENTION=True
94114
@@ -101,12 +121,14 @@ RUN apt-get update && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-ins
101121 ca-certificates \
102122 libssl-dev \
103123 curl \
104- cuda-compat-12-6 \
124+ cuda-compat-12-9 \
105125 && rm -rf /var/lib/apt/lists/*
106126
107127COPY --from=builder /usr/src/target/release/text-embeddings-router-75 /usr/local/bin/text-embeddings-router-75
108128COPY --from=builder /usr/src/target/release/text-embeddings-router-80 /usr/local/bin/text-embeddings-router-80
109129COPY --from=builder /usr/src/target/release/text-embeddings-router-90 /usr/local/bin/text-embeddings-router-90
130+ COPY --from=builder /usr/src/target/release/text-embeddings-router-100 /usr/local/bin/text-embeddings-router-100
131+ COPY --from=builder /usr/src/target/release/text-embeddings-router-120 /usr/local/bin/text-embeddings-router-120
110132
111133COPY --chmod=775 cuda-all-entrypoint.sh entrypoint.sh
112134
0 commit comments