Skip to content

Commit c221240

Browse files
authored
BLD: fix cu128 Dockerfile (#4145)
1 parent 8f92d04 commit c221240

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

xinference/deploy/docker/Dockerfile.cu128

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -43,14 +43,14 @@ RUN pip install --upgrade -i "$PIP_INDEX" pip setuptools wheel && \
43 43
pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements_12.8/requirements-cu128-base.txt && \
44 44
pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements_12.8/requirements-cu128-ml.txt && \
45 45
pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements_12.8/requirements-cu128-models.txt && \
46-
pip install -i "$PIP_INDEX" transformers>=4.51.3 && \
47-
pip install -i "$PIP_INDEX" --no-deps sglang==0.4.6.post5 && \
48-
pip install https://github.com/sgl-project/whl/releases/download/v0.2.6/sgl_kernel-0.2.6+cu128-cp39-abi3-manylinux2014_x86_64.whl && \
46+
pip install -i "$PIP_INDEX" transformers>=4.55.2 && \
47+
pip install -i "$PIP_INDEX" --no-deps sglang==0.4.9.post5 && \
48+
pip install -i "$PIP_INDEX" sgl-kernel==0.3.15 && \
49 49
pip install -i "$PIP_INDEX" wetext && \
50 50
pip uninstall flashinfer -y && \
51-
pip install -i "$PIP_INDEX" flashinfer-python && \
51+
pip install -i "$PIP_INDEX" flashinfer-python==0.4.0rc3 && \
52 52
pip install -i "$PIP_INDEX" SQLAlchemy==1.4.54 && \
53-
pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.7-cp312-cp312-linux_x86_64.whl && \
53+
pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.2+cu128torch2.8-cp312-cp312-linux_x86_64.whl && \
54 54
cd /opt/inference && \
55 55
python3 setup.py build_web && \
56 56
git restore . && \

0 commit comments

Comments
 (0)