diff --git a/config/charts/inferencepool/templates/inferencepool.yaml b/config/charts/inferencepool/templates/inferencepool.yaml
index f9d04df0f..435014679 100644
--- a/config/charts/inferencepool/templates/inferencepool.yaml
+++ b/config/charts/inferencepool/templates/inferencepool.yaml
@@ -16,3 +16,25 @@ spec:
     {{- end }}
   extensionRef:
     name: {{ include "gateway-api-inference-extension.name" . }}
+---
+# Compatibility workaround: mirror the InferencePool under the v1alpha2 API version.
+# The reference EPP implementation uses v1, but most Gateway API providers have not
+# transitioned to v1 yet, so this duplicate keeps the chart usable across provider versions.
+# TODO: Remove this mirror once all providers have migrated to v1.
+apiVersion: inference.networking.x-k8s.io/v1alpha2
+kind: InferencePool
+metadata:
+  name: {{ .Release.Name }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    {{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
+spec:
+  targetPortNumber: {{ .Values.inferencePool.targetPortNumber }}
+  selector:
+    {{- if .Values.inferencePool.modelServers.matchLabels }}
+    {{- range $key, $value := .Values.inferencePool.modelServers.matchLabels }}
+    {{ $key }}: {{ quote $value }}
+    {{- end }}
+    {{- end }}
+  extensionRef:
+    name: {{ include "gateway-api-inference-extension.name" . }}
diff --git a/config/charts/inferencepool/templates/rbac.yaml b/config/charts/inferencepool/templates/rbac.yaml
index 0c432f4b9..dc14332a7 100644
--- a/config/charts/inferencepool/templates/rbac.yaml
+++ b/config/charts/inferencepool/templates/rbac.yaml
@@ -42,6 +42,9 @@ rules:
 - apiGroups: ["inference.networking.x-k8s.io"]
   resources: ["inferencemodels", "inferencepools"]
   verbs: ["get", "watch", "list"]
+- apiGroups: ["inference.networking.k8s.io"]
+  resources: ["inferencepools"]
+  verbs: ["get", "watch", "list"]
 - apiGroups: [""]
   resources: ["pods"]
   verbs: ["get", "watch", "list"]