Skip to content

Commit 318cd7c

Browse files
committed
Updates artifacts for v1.2.0-rc.1 release
Signed-off-by: Nir Rozenbaum <[email protected]>
1 parent f357ece commit 318cd7c

13 files changed

+47
-47
lines changed

config/charts/body-based-routing/values.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -3,8 +3,8 @@ bbr:
33
replicas: 1
44
image:
55
name: bbr
6-
hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension
7-
tag: main
6+
hub: registry.k8s.io/gateway-api-inference-extension
7+
tag: v1.2.0-rc.1
88
pullPolicy: Always
99
port: 9004
1010
healthCheckPort: 9005

config/charts/inferencepool/values.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2,8 +2,8 @@ inferenceExtension:
22
replicas: 1
33
image:
44
name: epp
5-
hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension
6-
tag: main
5+
hub: registry.k8s.io/gateway-api-inference-extension
6+
tag: v1.2.0-rc.1
77
pullPolicy: Always
88
extProcPort: 9002
99
env: []

config/crd/bases/inference.networking.k8s.io_inferencepools.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@ kind: CustomResourceDefinition
33
metadata:
44
annotations:
55
api-approved.kubernetes.io: https://github.com/kubernetes-sigs/gateway-api-inference-extension/pull/1173
6-
inference.networking.k8s.io/bundle-version: main-dev
6+
inference.networking.k8s.io/bundle-version: v1.2.0-rc.1
77
name: inferencepools.inference.networking.k8s.io
88
spec:
99
group: inference.networking.k8s.io

config/crd/bases/inference.networking.x-k8s.io_inferencemodelrewrites.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@ apiVersion: apiextensions.k8s.io/v1
22
kind: CustomResourceDefinition
33
metadata:
44
annotations:
5-
inference.networking.k8s.io/bundle-version: main-dev
5+
inference.networking.k8s.io/bundle-version: v1.2.0-rc.1
66
name: inferencemodelrewrites.inference.networking.x-k8s.io
77
spec:
88
group: inference.networking.x-k8s.io

config/crd/bases/inference.networking.x-k8s.io_inferenceobjectives.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@ apiVersion: apiextensions.k8s.io/v1
22
kind: CustomResourceDefinition
33
metadata:
44
annotations:
5-
inference.networking.k8s.io/bundle-version: main-dev
5+
inference.networking.k8s.io/bundle-version: v1.2.0-rc.1
66
name: inferenceobjectives.inference.networking.x-k8s.io
77
spec:
88
group: inference.networking.x-k8s.io

config/crd/bases/inference.networking.x-k8s.io_inferencepoolimports.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@ apiVersion: apiextensions.k8s.io/v1
22
kind: CustomResourceDefinition
33
metadata:
44
annotations:
5-
inference.networking.k8s.io/bundle-version: main-dev
5+
inference.networking.k8s.io/bundle-version: v1.2.0-rc.1
66
name: inferencepoolimports.inference.networking.x-k8s.io
77
spec:
88
group: inference.networking.x-k8s.io

config/crd/bases/inference.networking.x-k8s.io_inferencepools.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@ kind: CustomResourceDefinition
33
metadata:
44
annotations:
55
api-approved.kubernetes.io: unapproved, experimental-only
6-
inference.networking.k8s.io/bundle-version: main-dev
6+
inference.networking.k8s.io/bundle-version: v1.2.0-rc.1
77
name: inferencepools.inference.networking.x-k8s.io
88
spec:
99
group: inference.networking.x-k8s.io

config/manifests/vllm/cpu-deployment.yaml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -14,8 +14,8 @@ spec:
1414
spec:
1515
containers:
1616
- name: lora
17-
image: "public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.8.5" # formal images can be found in https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo
18-
imagePullPolicy: Always
17+
image: "public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.9.3" # formal images can be found in https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo
18+
imagePullPolicy: IfNotPresent
1919
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
2020
args:
2121
- "--model"
@@ -77,8 +77,8 @@ spec:
7777
- name: lora-adapter-syncer
7878
tty: true
7979
stdin: true
80-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/lora-syncer:main
81-
restartPolicy: Always
80+
image: registry.k8s.io/gateway-api-inference-extension/lora-syncer:v1.2.0-rc.1
81+
restartPolicy: Always
8282
imagePullPolicy: Always
8383
env:
8484
- name: DYNAMIC_LORA_ROLLOUT_CONFIG

config/manifests/vllm/gpu-deployment.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@ spec:
1515
containers:
1616
- name: vllm
1717
image: "vllm/vllm-openai:v0.8.5"
18-
imagePullPolicy: Always
18+
imagePullPolicy: IfNotPresent
1919
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
2020
args:
2121
- "--model"
@@ -155,8 +155,8 @@ spec:
155155
- name: lora-adapter-syncer
156156
tty: true
157157
stdin: true
158-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/lora-syncer:main
159-
restartPolicy: Always
158+
image: registry.k8s.io/gateway-api-inference-extension/lora-syncer:v1.2.0-rc.1
159+
restartPolicy: Always
160160
imagePullPolicy: Always
161161
env:
162162
- name: DYNAMIC_LORA_ROLLOUT_CONFIG

config/manifests/vllm/sim-deployment.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@ spec:
1515
containers:
1616
- name: vllm-sim
1717
image: ghcr.io/llm-d/llm-d-inference-sim:v0.5.0
18-
imagePullPolicy: Always
18+
imagePullPolicy: IfNotPresent
1919
args:
2020
- --model
2121
- meta-llama/Llama-3.1-8B-Instruct

0 commit comments

Comments
 (0)