-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathDockerfile
More file actions
33 lines (27 loc) · 828 Bytes
/
Dockerfile
File metadata and controls
33 lines (27 loc) · 828 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
# Build stage: compiles the embeddings-server crate with the "cuda" feature on
# top of the CUDA development image. The resulting binary is installed by
# `cargo install` under /root/.cargo/bin.
FROM nvidia/cuda:12.8.0-devel-ubuntu24.04 AS builder

# Run every RUN in this stage under bash with pipefail, so that a failed
# download in the `curl | sh` pipeline below fails the build instead of being
# masked by the exit status of `sh`.
SHELL ["/bin/bash", "-o", "pipefail", "-c"]

WORKDIR /src

# All OS-level build dependencies are installed in a single layer, together
# with `apt-get update`, and the package lists are removed in that same layer.
# pkg-config is installed here (not in a later RUN) because the package lists
# no longer exist once this layer finishes.
# ca-certificates is listed explicitly so the HTTPS download of rustup does not
# depend on it being pulled in indirectly.
RUN apt-get update && \
    DEBIAN_FRONTEND=noninteractive apt-get install -y \
        ca-certificates \
        curl \
        libssl-dev \
        pkg-config \
    && \
    rm -rf /var/lib/apt/lists/*

# Rust toolchain passed to rustup. Defaults to "stable" so that building
# without `--build-arg RUST_VERSION=...` does not hand rustup an empty
# --default-toolchain value. Declared after the apt layer so changing it does
# not invalidate that layer's cache.
ARG RUST_VERSION=stable

# Install rustup and the requested toolchain as its own step.
RUN curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- -y \
        --default-toolchain "$RUST_VERSION" \
        --component cargo,rustc,rust-std

COPY . .

# Target GPU compute capability, overridable with
# `--build-arg CUDA_COMPUTE_CAP=...`; the default of 75 is the value that was
# previously fixed in this file. Exported as an environment variable for the
# cargo build below (presumably read by the crate's CUDA build scripts --
# confirm against the embeddings-server sources).
ARG CUDA_COMPUTE_CAP=75
ENV CUDA_COMPUTE_CAP=${CUDA_COMPUTE_CAP}

# Load the cargo environment written by rustup, then build and install the
# server binary with CUDA support.
RUN . /root/.cargo/env && \
    cargo install --path embeddings-server --features cuda
# Runtime stage: starts from the CUDA runtime image and adds only the compiled
# server binary taken from the builder stage.
FROM nvidia/cuda:12.8.0-runtime-ubuntu24.04 AS runtime

# Template for installing additional runtime packages. It is disabled because
# the package name below is only a placeholder; substitute real package names
# before enabling it.
#RUN apt-get update && \
#    apt-get install -y \
#        extra-runtime-dependencies \
#    && \
#    rm -rf /var/lib/apt/lists/*

# Copy the executable produced by `cargo install` in the builder stage into
# /usr/local/bin; the entrypoint below looks the binary up by name, so it
# relies on that directory being on PATH.
COPY --from=builder /root/.cargo/bin/embeddings-server /usr/local/bin/embeddings-server

# Exec-form entrypoint: the server is started directly, without a wrapping shell.
ENTRYPOINT ["embeddings-server"]