Skip to content

Commit 392a8cc

Browse files
committed
Updates artifacts for v0.5.0-rc.1 release
Signed-off-by: Nir Rozenbaum <[email protected]>
1 parent c46a7e7 commit 392a8cc

File tree

6 files changed

+11
-11
lines changed

6 files changed

+11
-11
lines changed

config/charts/body-based-routing/values.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -3,8 +3,8 @@ bbr:
33
replicas: 1
44
image:
55
name: bbr
6-
hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension
7-
tag: main
6+
hub: registry.k8s.io/gateway-api-inference-extension
7+
tag: v0.5.0-rc.1
88
pullPolicy: Always
99
port: 9004
1010
healthCheckPort: 9005

config/charts/inferencepool/values.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2,8 +2,8 @@ inferenceExtension:
22
replicas: 1
33
image:
44
name: epp
5-
hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension
6-
tag: main
5+
hub: registry.k8s.io/gateway-api-inference-extension
6+
tag: v0.5.0-rc.1
77
pullPolicy: Always
88
extProcPort: 9002
99
env: {}

config/manifests/inferencepool-resources.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -48,8 +48,8 @@ spec:
4848
terminationGracePeriodSeconds: 130
4949
containers:
5050
- name: epp
51-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:main
52-
imagePullPolicy: Always
51+
image: registry.k8s.io/gateway-api-inference-extension/epp:v0.5.0-rc.1
52+
imagePullPolicy: IfNotPresent
5353
args:
5454
- -poolName
5555
- "vllm-llama3-8b-instruct"

config/manifests/vllm/cpu-deployment.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -14,8 +14,8 @@ spec:
1414
spec:
1515
containers:
1616
- name: lora
17-
image: "public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.9.1" # formal images can be found in https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo
18-
imagePullPolicy: Always
17+
image: "public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.9.2" # formal images can be found in https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo
18+
imagePullPolicy: IfNotPresent
1919
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
2020
args:
2121
- "--model"

config/manifests/vllm/gpu-deployment.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -14,8 +14,8 @@ spec:
1414
spec:
1515
containers:
1616
- name: vllm
17-
image: "vllm/vllm-openai:latest"
18-
imagePullPolicy: Always
17+
image: "vllm/vllm-openai:v0.9.2"
18+
imagePullPolicy: IfNotPresent
1919
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
2020
args:
2121
- "--model"

config/manifests/vllm/sim-deployment.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@ spec:
1515
containers:
1616
- name: vllm-sim
1717
image: ghcr.io/llm-d/llm-d-inference-sim:v0.1.2
18-
imagePullPolicy: Always
18+
imagePullPolicy: IfNotPresent
1919
args:
2020
- --model
2121
- meta-llama/Llama-3.1-8B-Instruct

0 commit comments

Comments
 (0)