|
# Hardware flavour of the runtime image. The value is used as the base of the
# two final stages (`FROM ${PLATFORM}`); this file defines the cpu, hpu and xpu
# stages it can point at.
ARG PLATFORM=cpu

# Shared Rust toolchain stage: cargo-chef image with sccache installed and
# registered as the rustc wrapper for every stage derived from it.
FROM lukemathwalker/cargo-chef:latest-rust-1.75-bookworm AS chef
WORKDIR /usr/src
ENV SCCACHE=0.5.4
ENV RUSTC_WRAPPER=/usr/local/bin/sccache

# Download and configure sccache.
# The archive is written to disk and extracted in a second step rather than
# piped into tar: the default shell has no pipefail, so the exit status of a
# failed download on the left side of a pipe would be discarded. The temporary
# archive is removed in the same layer so it never reaches the image.
RUN curl -fsSL -o /tmp/sccache.tar.gz https://github.com/mozilla/sccache/releases/download/v$SCCACHE/sccache-v$SCCACHE-x86_64-unknown-linux-musl.tar.gz && \
    tar -xzvf /tmp/sccache.tar.gz --strip-components=1 -C /usr/local/bin sccache-v$SCCACHE-x86_64-unknown-linux-musl/sccache && \
    rm -f /tmp/sccache.tar.gz && \
    chmod +x /usr/local/bin/sccache

# Planner stage: produces recipe.json, the cargo-chef description of the
# workspace that the builder stage later cooks.
FROM chef AS planner

# Manifest and lockfile go into the working directory (/usr/src).
COPY Cargo.toml Cargo.lock ./

# Source directories read by `cargo chef prepare`.
COPY router router
COPY core core
COPY backends backends

RUN cargo chef prepare --recipe-path recipe.json

# Builder stage: cooks the dependency recipe, then adds the real sources.
# The http-builder and grpc-builder stages derive from it.
FROM chef AS builder

# Install protoc 21.12 (compiler binary plus its bundled include files) into
# /usr/local. This runs before any build ARG is declared and before any source
# is copied, so the layer is reused across source and build-arg changes
# instead of being downloaded again on every build.
# `-f` makes curl fail on an HTTP error instead of saving the error page as
# the zip file.
RUN PROTOC_ZIP=protoc-21.12-linux-x86_64.zip && \
    curl -fsSLO https://github.com/protocolbuffers/protobuf/releases/download/v21.12/$PROTOC_ZIP && \
    unzip -o $PROTOC_ZIP -d /usr/local bin/protoc && \
    unzip -o $PROTOC_ZIP -d /usr/local 'include/*' && \
    rm -f $PROTOC_ZIP

ARG GIT_SHA
ARG DOCKER_LABEL

# sccache specific variables
# NOTE(review): ACTIONS_RUNTIME_TOKEN looks like a credential; values passed
# with --build-arg are recorded in the image history. Confirm this is
# acceptable or move it to a BuildKit secret mount.
ARG ACTIONS_CACHE_URL
ARG ACTIONS_RUNTIME_TOKEN
ARG SCCACHE_GHA_ENABLED

COPY --from=planner /usr/src/recipe.json recipe.json

# Build dependencies only (from the recipe), then print sccache statistics.
RUN cargo chef cook --release --features python --no-default-features --recipe-path recipe.json && sccache -s

COPY backends backends
COPY core core
COPY router router
COPY Cargo.toml ./
COPY Cargo.lock ./

# Builds the router binary with the `python` and `http` features enabled and
# prints sccache statistics afterwards.
# `AS` is upper-case to match the other stages in this file and to satisfy
# BuildKit's FromAsCasing check.
FROM builder AS http-builder

RUN cargo build --release --bin text-embeddings-router -F python -F http --no-default-features && sccache -s

# Builds the router binary with the `grpc` and `python` features enabled and
# prints sccache statistics afterwards.
# `AS` is upper-case to match the other stages in this file and to satisfy
# BuildKit's FromAsCasing check.
FROM builder AS grpc-builder

# Protocol definitions are only copied into this flavour of the build.
COPY proto proto

RUN cargo build --release --bin text-embeddings-router -F grpc -F python --no-default-features && sccache -s

# CPU runtime base: Intel-optimized PyTorch image plus the Python backend.
FROM intel/intel-optimized-pytorch:2.4.0-pip-base AS cpu
ENV HUGGINGFACE_HUB_CACHE=/data \
    PORT=80

# Native build tooling; apt lists are removed in the same layer.
RUN apt-get update && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
    build-essential \
    git \
    cmake \
    ninja-build \
    python3-dev &&\
    rm -rf /var/lib/apt/lists/*

WORKDIR /usr/src
COPY backends backends
# NOTE(review): the next two files sit inside the backends tree copied above,
# so these COPY lines look redundant. Confirm before removing them.
COPY backends/python/server/text_embeddings_server/models/__init__.py backends/python/server/text_embeddings_server/models/__init__.py
COPY backends/python/server/pyproject.toml backends/python/server/pyproject.toml
# The Intel requirements file replaces the default requirements.txt.
COPY backends/python/server/requirements-intel.txt backends/python/server/requirements.txt

# torchvision is pinned to 0.19.0, the release paired with torch 2.4.0, so
# rebuilds resolve the same set of wheels. --no-cache-dir keeps pip's download
# cache out of the image layer.
RUN python -m pip install --no-cache-dir torch==2.4.0 torchvision==0.19.0 torchaudio==2.4.0 --index-url https://download.pytorch.org/whl/cpu

RUN cd backends/python/server && \
    make install

# HPU runtime base: Habana Gaudi PyTorch installer image plus the Python
# backend installed from the HPU requirements file.
FROM vault.habana.ai/gaudi-docker/1.17.1/ubuntu22.04/habanalabs/pytorch-installer-2.3.1:latest AS hpu

ENV HUGGINGFACE_HUB_CACHE=/data
ENV PORT=80

# Native build tooling (alphabetical); apt lists are dropped in the same layer.
RUN apt-get update \
 && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
      build-essential \
      cmake \
      git \
      ninja-build \
      python3-dev \
 && rm -rf /var/lib/apt/lists/*

WORKDIR /usr/src

# Whole backends tree first, then the individual server files.
COPY backends backends
COPY backends/python/server/text_embeddings_server/models/__init__.py backends/python/server/text_embeddings_server/models/__init__.py
COPY backends/python/server/pyproject.toml backends/python/server/pyproject.toml
# The HPU requirements file is installed under the name requirements.txt.
COPY backends/python/server/requirements-hpu.txt backends/python/server/requirements.txt

# Run the server's `install` make target from its own directory.
RUN cd backends/python/server && make install

# XPU runtime base: Intel Extension for PyTorch (XPU) image plus the oneAPI
# base kit and the Python backend.
FROM intel/intel-extension-for-pytorch:2.3.110-xpu AS xpu

ENV HUGGINGFACE_HUB_CACHE=/data \
    PORT=80

# Install libssl1.1 from a downloaded .deb and delete the package file in the
# same layer so it is not left behind in the image.
# NOTE(review): the download uses plain HTTP and is not checksum-verified.
RUN wget http://nz2.archive.ubuntu.com/ubuntu/pool/main/o/openssl/libssl1.1_1.1.1f-1ubuntu2_amd64.deb && \
    dpkg -i ./libssl1.1_1.1.1f-1ubuntu2_amd64.deb && \
    rm -f ./libssl1.1_1.1.1f-1ubuntu2_amd64.deb

# Keyring for the Intel graphics repository.
RUN wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | gpg --dearmor | tee /usr/share/keyrings/intel-graphics.gpg > /dev/null

# Keyring and apt source entry for the oneAPI repository.
RUN wget -O- https://apt.repos.intel.com/intel-gpg-keys/GPG-PUB-KEY-INTEL-SW-PRODUCTS.PUB \
    | gpg --dearmor | tee /usr/share/keyrings/oneapi-archive-keyring.gpg > /dev/null && echo "deb [signed-by=/usr/share/keyrings/oneapi-archive-keyring.gpg] https://apt.repos.intel.com/oneapi all main" | tee /etc/apt/sources.list.d/oneAPI.list

# apt-get (the script-stable CLI) replaces `apt`, and the package lists are
# removed in the same layer, as the cpu and hpu stages already do.
RUN apt-get update && \
    DEBIAN_FRONTEND=noninteractive apt-get install -y intel-basekit xpu-smi cmake python3-dev ninja-build pciutils && \
    rm -rf /var/lib/apt/lists/*

WORKDIR /usr/src
RUN pip install torch==2.3.1+cxx11.abi torchvision==0.18.1+cxx11.abi torchaudio==2.3.1+cxx11.abi intel-extension-for-pytorch==2.3.110+xpu oneccl_bind_pt==2.3.100+xpu --extra-index-url https://pytorch-extension.intel.com/release-whl/stable/xpu/us/ --no-cache-dir

# oneAPI locations (CCL, MPI, MKL, compiler) exported for build and run time.
ENV CCL_ROOT=/opt/intel/oneapi/ccl/latest
ENV I_MPI_ROOT=/opt/intel/oneapi/mpi/latest
ENV FI_PROVIDER_PATH=/opt/intel/oneapi/mpi/latest/opt/mpi/libfabric/lib/prov:/usr/lib/x86_64-linux-gnu/libfabric
ENV LIBRARY_PATH=/opt/intel/oneapi/mpi/latest/lib:/opt/intel/oneapi/ccl/latest/lib/:/opt/intel/oneapi/mkl/latest/lib/:/opt/intel/oneapi/compiler/latest/lib
# No trailing ':' here: an empty entry is resolved by the dynamic loader as
# the current working directory, which would let libraries load from wherever
# the process happens to run.
ENV LD_LIBRARY_PATH=/opt/intel/oneapi/ccl/latest/lib/:/opt/intel/oneapi/mpi/latest/opt/mpi/libfabric/lib:/opt/intel/oneapi/mpi/latest/lib:/opt/intel/oneapi/mkl/latest/lib:/opt/intel/oneapi/compiler/latest/opt/compiler/lib:/opt/intel/oneapi/compiler/latest/lib:/opt/intel/oneapi/lib:/opt/intel/oneapi/lib/intel64
ENV PATH=/opt/intel/oneapi/mpi/latest/opt/mpi/libfabric/bin:/opt/intel/oneapi/mpi/latest/bin:/opt/intel/oneapi/mpi/latest/opt/mpi/libfabric/bin:/opt/intel/oneapi/mkl/latest/bin/:/opt/intel/oneapi/compiler/latest/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
ENV CCL_ZE_IPC_EXCHANGE=sockets
ENV CMAKE_PREFIX_PATH=/opt/intel/oneapi/mkl/latest/lib/cmake:/opt/intel/oneapi/compiler/latest
ENV CPATH=/opt/intel/oneapi/mpi/latest/include:/opt/intel/oneapi/ccl/latest/include:/opt/intel/oneapi/mkl/latest/include

COPY backends backends
COPY backends/python/server/text_embeddings_server/models/__init__.py backends/python/server/text_embeddings_server/models/__init__.py
COPY backends/python/server/pyproject.toml backends/python/server/pyproject.toml
# The Intel requirements file replaces the default requirements.txt.
COPY backends/python/server/requirements-intel.txt backends/python/server/requirements.txt
RUN cd backends/python/server && \
    make install

# gRPC image: the runtime stage named by PLATFORM plus the router binary
# produced by the grpc-builder stage.
FROM $PLATFORM AS grpc

COPY --from=grpc-builder \
     /usr/src/target/release/text-embeddings-router \
     /usr/local/bin/text-embeddings-router

# Exec form: the router is started directly; CMD supplies its default argument.
ENTRYPOINT ["text-embeddings-router"]
CMD ["--json-output"]

# Unnamed last stage (the default build target): the runtime stage named by
# PLATFORM plus the router binary produced by the http-builder stage.
FROM $PLATFORM

COPY --from=http-builder \
     /usr/src/target/release/text-embeddings-router \
     /usr/local/bin/text-embeddings-router

# Exec form: the router is started directly; CMD supplies its default argument.
ENTRYPOINT ["text-embeddings-router"]
CMD ["--json-output"]
0 commit comments