@@ -20,6 +20,8 @@ FROM quay.io/ascend/cann:8.5.1-910b-ubuntu22.04-py3.11
# Python package index URL; defaults to the TUNA mirror.
# NOTE(review): the consumer of this value is not visible in this section - confirm.
ARG PIP_INDEX_URL="https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple"
# Git tag passed to `git clone --branch` when the Mooncake sources are fetched.
ARG MOONCAKE_TAG="v0.3.8.post1"
# Ascend SoC identifier.
# NOTE(review): the consumer of this value is not visible in this section - confirm.
ARG SOC_VERSION="ascend910b1"
# Re-exported as the SCCACHE_GHA_ENABLED environment variable by the build steps.
# No default: the value is empty unless supplied with --build-arg.
ARG SCCACHE_GHA_ENABLED
# NOTE(review): no use of MATRIX_ARCH is visible in this section - confirm it is consumed elsewhere.
ARG MATRIX_ARCH
2325
2426# Define environments
2527ENV DEBIAN_FRONTEND=noninteractive
@@ -31,17 +33,28 @@ WORKDIR /workspace
3133
# Copy the whole build context into the image.
COPY . /vllm-workspace/vllm-ascend/

# Run the repository's sccache installer script.
# Both GitHub Actions secrets are optional (required=false), so the step also
# runs when they are not supplied to the build.
RUN --mount=type=secret,id=ACTIONS_RUNTIME_TOKEN,required=false \
    --mount=type=secret,id=ACTIONS_RESULTS_URL,required=false \
    bash /vllm-workspace/vllm-ascend/tools/sccache_installer.sh
39+
# Build and install Mooncake: apt prerequisites, source checkout at
# ${MOONCAKE_TAG}, the bundled installer script, then a CMake/make build.
# The build is configured with -DENABLE_SCCACHE=ON. The optional ACTIONS_*
# secrets are read from /run/secrets for this RUN only and fall back to an
# empty string when a secret is not provided.
# The build tree and the apt caches are removed in the same layer.
RUN --mount=type=secret,id=ACTIONS_RUNTIME_TOKEN,required=false \
    --mount=type=secret,id=ACTIONS_RESULTS_URL,required=false \
    apt-get update -y && \
    apt-get install -y \
        cmake \
        g++ \
        gcc \
        git \
        libjemalloc2 \
        libnuma-dev \
        net-tools \
        vim \
        wget && \
    git clone --depth 1 --branch ${MOONCAKE_TAG} https://github.com/kvcache-ai/Mooncake /vllm-workspace/Mooncake && \
    cp /vllm-workspace/vllm-ascend/tools/mooncake_installer.sh /vllm-workspace/Mooncake/ && \
    cd /vllm-workspace/Mooncake && \
    bash mooncake_installer.sh -y && \
    ARCH=$(uname -m) && \
    source /usr/local/Ascend/ascend-toolkit/set_env.sh && \
    export ACTIONS_CACHE_SERVICE_V2=on && \
    export SCCACHE_GHA_ENABLED=${SCCACHE_GHA_ENABLED} && \
    export ACTIONS_RESULTS_URL=$(cat /run/secrets/ACTIONS_RESULTS_URL 2>/dev/null || echo "" ) && \
    export ACTIONS_RUNTIME_TOKEN=$(cat /run/secrets/ACTIONS_RUNTIME_TOKEN 2>/dev/null || echo "" ) && \
    export LD_LIBRARY_PATH=/usr/local/Ascend/ascend-toolkit/latest/${ARCH}-linux/devlib:/usr/local/Ascend/ascend-toolkit/latest/${ARCH}-linux/lib64:$LD_LIBRARY_PATH && \
    mkdir -p build && \
    cd build && \
    cmake .. -DUSE_ASCEND_DIRECT=ON -DENABLE_SCCACHE=ON && \
    make -j$(nproc) && \
    make install && \
    sccache --show-stats && \
    rm -fr /vllm-workspace/Mooncake/build && \
    rm -rf /var/cache/apt/* /var/lib/apt/lists/*
@@ -60,11 +73,19 @@ RUN VLLM_TARGET_DEVICE="empty" python3 -m pip install -v -e /vllm-workspace/vllm
# Install vllm-ascend
# Append `libascend_hal.so` path (devlib) to LD_LIBRARY_PATH
# The optional ACTIONS_* BuildKit secrets are read from /run/secrets and exported
# for this RUN only; each falls back to an empty string when it is not supplied.
# The architecture comes from `uname -m`, as in the Mooncake build step,
# because `uname -i` is non-portable and can print "unknown".
# pip is given the documented `--extra-index-url` flag rather than the
# abbreviated `--extra-index`, which only works through option-prefix matching.
# sccache statistics are printed, then the binary is deleted from /usr/bin.
# Installing vllm-ascend on x86 can pull upstream triton back in alongside triton-ascend. Remove it immediately after this step.
RUN --mount=type=secret,id=ACTIONS_RESULTS_URL,required=false \
    --mount=type=secret,id=ACTIONS_RUNTIME_TOKEN,required=false \
    export PIP_EXTRA_INDEX_URL=https://mirrors.huaweicloud.com/ascend/repos/pypi && \
    source /usr/local/Ascend/ascend-toolkit/set_env.sh && \
    source /usr/local/Ascend/nnal/atb/set_env.sh && \
    export ACTIONS_RESULTS_URL=$(cat /run/secrets/ACTIONS_RESULTS_URL 2>/dev/null || echo "" ) && \
    export ACTIONS_RUNTIME_TOKEN=$(cat /run/secrets/ACTIONS_RUNTIME_TOKEN 2>/dev/null || echo "" ) && \
    export ACTIONS_CACHE_SERVICE_V2=on && \
    export SCCACHE_GHA_ENABLED=${SCCACHE_GHA_ENABLED} && \
    export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/Ascend/ascend-toolkit/latest/$(uname -m)-linux/devlib && \
    python3 -m pip install -v -e /vllm-workspace/vllm-ascend/ --extra-index-url https://download.pytorch.org/whl/cpu/ && \
    sccache --show-stats && \
    rm -f /usr/bin/sccache && \
    if [ "$(uname -m)" = "x86_64" ]; then python3 -m pip uninstall -y triton; fi && \
    python3 -m pip cache purge
7091
0 commit comments