Skip to content

Commit ae840bb

Browse files
committed
update to run from release script, as intended
1 parent 7a76fc3 commit ae840bb

File tree

3 files changed

+20
-34
lines changed

3 files changed

+20
-34
lines changed

Dockerfile.ubi

Lines changed: 7 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,6 @@ ENV PYTHON_VERSION=${PYTHON_VERSION}
3232
RUN microdnf install -y --nodocs \
3333
python${PYTHON_VERSION}-devel && \
3434
python${PYTHON_VERSION} -m venv $VIRTUAL_ENV && \
35-
pip install --no-cache -U pip wheel uv && \
3635
microdnf clean all
3736

3837

@@ -113,17 +112,14 @@ COPY examples/*.jinja /app/data/template/
113112

114113
# install vllm by running the payload script and then install flashinfer
115114

116-
ARG VLLM_WHEEL_VERSION
117-
ARG VLLM_WHEEL_INDEX
118-
ARG FLASHINFER_VERSION
115+
ARG WHEEL_RELEASE
119116
RUN --mount=type=cache,target=/root/.cache/uv \
120117
--mount=type=bind,src=payload,target=/workspace/payload \
121118
--mount=type=secret,id=rhel-ai-private-index-auth/BOT_PAT \
119+
source ${VIRTUAL_ENV}/bin/activate && \
122120
env BOT_PAT=$(cat /run/secrets/rhel-ai-private-index-auth/BOT_PAT) \
123-
VLLM_WHEEL_VERSION=${VLLM_VERSION} \
124-
VLLM_WHEEL_INDEX=${VLLM_WHEEL_INDEX} \
125-
./payload/run.sh && \
126-
uv pip install "${FLASHINFER_VERSION}"
121+
WHEEL_RELEASE=${WHEEL_RELEASE} \
122+
./payload/run.sh
127123

128124
ENV HF_HUB_OFFLINE=1 \
129125
HOME=/home/vllm \
@@ -161,17 +157,15 @@ FROM vllm-openai AS vllm-grpc-adapter
161157

162158
USER root
163159

164-
ARG VLLM_TGIS_ADAPTER_VERSION
160+
ARG WHEEL_RELEASE
165161
RUN --mount=type=cache,target=/root/.cache/uv \
166162
--mount=type=bind,src=payload,target=/workspace/payload \
167163
--mount=type=secret,id=rhel-ai-private-index-auth/BOT_PAT \
168164
cd /workspace && \
169-
ls && \
165+
source ${VIRTUAL_ENV}/bin/activate && \
170166
env HOME=/root \
171167
BOT_PAT=$(cat /run/secrets/rhel-ai-private-index-auth/BOT_PAT) \
172-
VLLM_WHEEL_VERSION=${VLLM_VERSION} \
173-
VLLM_TGIS_ADAPTER_VERSION=${VLLM_TGIS_ADAPTER_VERSION} \
174-
VLLM_WHEEL_INDEX=${VLLM_WHEEL_INDEX} \
168+
WHEEL_RELEASE=${WHEEL_RELEASE} \
175169
./payload/run.sh
176170

177171

argfile.konflux

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,5 @@
11
BASE_UBI_IMAGE_TAG=9.5-1739420147
22
PYTHON_VERSION=3.11
33
LIBSODIUM_VERSION=1.0.20
4-
VLLM_TGIS_ADAPTER_VERSION=0.6.3
5-
FLASHINFER_VERSION=https://github.com/flashinfer-ai/flashinfer/releases/download/v0.2.1.post1/flashinfer_python-0.2.1.post1+cu124torch2.5-cp38-abi3-linux_x86_64.whl
6-
VLLM_WHEEL_VERSION=0.7.2
7-
VLLM_WHEEL_INDEX=https://gitlab.com/api/v4/projects/66664052/packages/pypi/simple
4+
WHEEL_RELEASE=2.20.55+vllm-cuda-ubi9-x86_64
5+
# can view releases at https://gitlab.com/redhat/rhel-ai/rhoai/pipeline/-/releases

payload/run.sh

Lines changed: 11 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,9 @@
11
#!/bin/bash
2+
# Script assumes python venv is already properly configured
23
# required env vars:
34
# $BOT_PAT
4-
# $WHEEL_RELEASE_ARTIFACTS
5-
# optional:
6-
# $VLLM_TGIS_ADAPTER_VERSION
7-
# $VLLM_WHEEL_VERSION
5+
# $WHEEL_RELEASE
6+
# $WHEEL_BASEURL
87
set -ex
98

109
cat <<EOF > ${HOME}/.netrc
@@ -13,22 +12,17 @@ login rhel-ai-wheels-prefetch-token-rhoai
1312
password $BOT_PAT
1413
EOF
1514

16-
trap "rm ${HOME}/.netrc" EXIT
15+
trap "rm -rf ${HOME}/.netrc release release.tar.gz" EXIT
1716

18-
# https://docs.astral.sh/uv/configuration/indexes/#searching-across-multiple-indexes
19-
# This will prefer to use the custom index, and fall back to pypi if needed
20-
export UV_EXTRA_INDEX_URL=${VLLM_WHEEL_INDEX}
21-
export UV_INDEX_STRATEGY=unsafe-first-match
17+
# WHEEL_RELEASE="2.20.55+vllm-cuda-ubi9-x86_64"
2218

23-
vllm="vllm[tensorizer,audio,video]"
19+
# GitLab project ID, etc., should be static
20+
WHEEL_RELEASE_ARTIFACTS="https://gitlab.com/api/v4/projects/68045055/packages/generic/rhelai-wheels/${WHEEL_RELEASE}/wheels-${WHEEL_RELEASE}.tar.gz"
2421

25-
if [[ -n "$VLLM_TGIS_ADAPTER_VERSION" ]]; then
26-
vllm_tgis_adapter="vllm-tgis-adapter==${VLLM_TGIS_ADAPTER_VERSION}"
27-
fi
2822

29-
if [[ -n "$VLLM_WHEEL_VERSION" ]]; then
30-
vllm="${vllm}==${$VLLM_WHEEL_VERSION}"
31-
fi
23+
# NOTE: ensure that flashinfer is included in the wheel release tarball
3224

33-
uv pip install $vllm $vllm_tgis_adapter
25+
curl --netrc -o release.tar.gz ${WHEEL_RELEASE_ARTIFACTS}
26+
tar zxvf release.tar.gz
27+
./release/install_wheels.sh
3428

0 commit comments

Comments
 (0)