File tree Expand file tree Collapse file tree 1 file changed +7
-5
lines changed
Expand file tree Collapse file tree 1 file changed +7
-5
lines changed Original file line number Diff line number Diff line change @@ -7,20 +7,22 @@ RUN apt-get update -y \
77
88RUN ldconfig /usr/local/cuda-12.1/compat/
99
10- # install sglang's dependencies
10+ # update pip
11+ RUN --mount=type=cache,target=/root/.cache/pip python3 -m pip install --upgrade pip
1112
13+ # install sglang's dependencies
1214# EFRON:
1315# these guys are unbelievably huge - >80GiB. Took well over ten minutes to install on my machine and used 28GiB(!) of RAM.
1416# we should consider having a base image with them pre-installed or seeing if we can knock it down a little bit.
1517RUN --mount=type=cache,target=/root/.cache/pip python3 -m pip install "sglang[all]"
1618RUN --mount=type=cache,target=/root/.cache/pip python3 -m pip install flashinfer -i https://flashinfer.ai/whl/cu121/torch2.3
19+
20+ # install our own python dependencies
1721COPY requirements.txt ./requirements.txt
18- RUN --mount=type=cache,target=/root/.cache/pip \
19- python3 -m pip install --upgrade pip && \
20- python3 -m pip install --upgrade -r app/requirements.txt
22+ RUN --mount=type=cache,target=/root/.cache/pip python3 -m pip install --upgrade -r ./requirements.txt
2123
2224# not sure why this is here: is a vllm-workspace even in our image?
23- ENV PYTHONPATH="/:/vllm-workspace"
25+ # ENV PYTHONPATH="/:/vllm-workspace"
2426COPY ./src/handler.py ./handler.py
2527
2628# run the serverless worker
You can’t perform that action at this time.
0 commit comments