|
29 | 29 | RELEASE_TAG="v${MAJOR}.${MINOR}.0-rc.${RC}"
|
30 | 30 | fi
|
31 | 31 |
|
32 |
| -# vLLM image version (default to 0.7.2 if not defined) |
33 |
| -VLLM="${VLLM:-0.7.2}" |
| 32 | +# The vLLM image versions |
| 33 | +# The GPU image is from https://hub.docker.com/layers/vllm/vllm-openai |
| 34 | +VLLM_GPU="${VLLM_GPU:-0.9.1}" |
| 35 | +# The CPU image is from https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo |
| 36 | +VLLM_CPU="${VLLM_CPU:-0.9.1}" |
| 37 | +# The sim image is from https://github.com/llm-d/llm-d-inference-sim/pkgs/container/llm-d-inference-sim |
| 38 | +VLLM_SIM="${VLLM_SIM:-0.1.1}" |
34 | 39 |
|
35 | 40 | echo "Using release tag: ${RELEASE_TAG}"
|
36 |
| -echo "Using vLLM image version: ${VLLM}" |
| 41 | +echo "Using vLLM GPU image version: ${VLLM_GPU}" |
| 42 | +echo "Using vLLM CPU image version: ${VLLM_CPU}" |
| 43 | +echo "Using vLLM Simulator image version: ${VLLM_SIM}" |
37 | 44 |
|
38 | 45 | # -----------------------------------------------------------------------------
|
39 | 46 | # Update pkg/README.md
|
@@ -64,30 +71,48 @@ sed -i.bak -E "s|(tag: )[^\"[:space:]]+|\1${RELEASE_TAG}|g" "$EPP_HELM"
|
64 | 71 | sed -i.bak -E "s|(tag: )[^\"[:space:]]+|\1${RELEASE_TAG}|g" "$BBR_HELM"
|
65 | 72 |
|
66 | 73 | # Update the container image pull policy.
|
67 |
| -sed -i.bak '/us-central1-docker.pkg.dev\/k8s-staging-images\/gateway-api-inference-extension\/epp/ { n; s/Always/IfNotPresent/ }' "$EPP" |
| 74 | +sed -i.bak '/us-central1-docker.pkg.dev\/k8s-staging-images\/gateway-api-inference-extension\/epp/{n;s/Always/IfNotPresent/;}' "$EPP" |
68 | 75 |
|
69 | 76 | # Update the container registry.
|
70 | 77 | sed -i.bak -E "s|us-central1-docker\.pkg\.dev/k8s-staging-images|registry.k8s.io|g" "$EPP"
|
71 | 78 | sed -i.bak -E "s|us-central1-docker\.pkg\.dev/k8s-staging-images|registry.k8s.io|g" "$EPP_HELM"
|
72 | 79 | sed -i.bak -E "s|us-central1-docker\.pkg\.dev/k8s-staging-images|registry.k8s.io|g" "$BBR_HELM"
|
73 | 80 |
|
74 | 81 | # -----------------------------------------------------------------------------
|
75 |
| -# Update config/manifests/vllm/gpu-deployment.yaml |
| 82 | +# Update vLLM deployment manifests |
76 | 83 | # -----------------------------------------------------------------------------
|
77 |
| -VLLM_DEPLOY="config/manifests/vllm/gpu-deployment.yaml" |
78 |
| -echo "Updating ${VLLM_DEPLOY} ..." |
| 84 | +VLLM_GPU_DEPLOY="config/manifests/vllm/gpu-deployment.yaml" |
| 85 | +echo "Updating ${VLLM_GPU_DEPLOY} ..." |
79 | 86 |
|
80 |
| -# Update the vLLM image version |
81 |
| -sed -i.bak -E "s|(vllm/vllm-openai:)[^\"[:space:]]+|\1v${VLLM}|g" "$VLLM_DEPLOY" |
| 87 | +# Update the vLLM GPU image version |
| 88 | +sed -i.bak -E "s|(vllm/vllm-openai:)[^\"[:space:]]+|\1v${VLLM_GPU}|g" "$VLLM_GPU_DEPLOY" |
82 | 89 |
|
83 | 90 | # Also change the imagePullPolicy from Always to IfNotPresent on the line following the vLLM GPU image.
|
84 |
| -sed -i.bak '/vllm\/vllm-openai/ { n; s/Always/IfNotPresent/ }' "$VLLM_DEPLOY" |
| 91 | +sed -i.bak '/vllm\/vllm-openai/{n;s/Always/IfNotPresent/;}' "$VLLM_GPU_DEPLOY" |
| 92 | + |
| 93 | +VLLM_CPU_DEPLOY="config/manifests/vllm/cpu-deployment.yaml" |
| 94 | +echo "Updating ${VLLM_CPU_DEPLOY} ..." |
| 95 | + |
| 96 | +# Update the vLLM CPU image version |
| 97 | +sed -i.bak -E "s|(q9t5s3a7/vllm-cpu-release-repo:)[^\"[:space:]]+|\1v${VLLM_CPU}|g" "$VLLM_CPU_DEPLOY" |
| 98 | + |
| 99 | +# Also change the imagePullPolicy from Always to IfNotPresent on the line following the vLLM CPU image. |
| 100 | +sed -i.bak '/q9t5s3a7\/vllm-cpu-release-repo/{n;s/Always/IfNotPresent/;}' "$VLLM_CPU_DEPLOY" |
| 101 | + |
| 102 | +VLLM_SIM_DEPLOY="config/manifests/vllm/sim-deployment.yaml" |
| 103 | +echo "Updating ${VLLM_SIM_DEPLOY} ..." |
| 104 | + |
| 105 | +# Update the vLLM Simulator image version |
| 106 | +sed -i.bak -E "s|(llm-d/llm-d-inference-sim:)[^\"[:space:]]+|\1v${VLLM_SIM}|g" "$VLLM_SIM_DEPLOY" |
| 107 | + |
| 108 | +# Also change the imagePullPolicy from Always to IfNotPresent on the line following the vLLM Simulator image. |
| 109 | +sed -i.bak '/llm-d\/llm-d-inference-sim/{n;s/Always/IfNotPresent/;}' "$VLLM_SIM_DEPLOY" |
85 | 110 |
|
86 | 111 | # -----------------------------------------------------------------------------
|
87 | 112 | # Stage the changes
|
88 | 113 | # -----------------------------------------------------------------------------
|
89 |
| -echo "Staging $README $EPP $EPP_HELM $BBR_HELM $VLLM_DEPLOY files..." |
90 |
| -git add $README $EPP $EPP_HELM $BBR_HELM $VLLM_DEPLOY |
| 114 | +echo "Staging $README $EPP $EPP_HELM $BBR_HELM $VLLM_GPU_DEPLOY $VLLM_CPU_DEPLOY $VLLM_SIM_DEPLOY files..." |
| 115 | +git add $README $EPP $EPP_HELM $BBR_HELM $VLLM_GPU_DEPLOY $VLLM_CPU_DEPLOY $VLLM_SIM_DEPLOY |
91 | 116 |
|
92 | 117 | # -----------------------------------------------------------------------------
|
93 | 118 | # Cleanup backup files and finish
|
|
0 commit comments