Skip to content

Commit 503b050

Browse files
committed
update chart
1 parent cce635d commit 503b050

File tree

6 files changed

+25
-20
lines changed

6 files changed

+25
-20
lines changed

config/charts/inferencepool/templates/epp-deployment.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -62,6 +62,9 @@ spec:
6262
- "--{{ .name }}"
6363
- "{{ .value }}"
6464
{{- end }}
65+
{{- if not .Values.inferenceExtension.serviceMonitor.auth.enabled }}
66+
- --metrics-endpoint-auth=false
67+
{{- end }}
6568
ports:
6669
- name: grpc
6770
containerPort: 9002

config/charts/inferencepool/templates/epp-sa-token-secret.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,8 @@
1-
{{- if .Values.inferenceExtension.monitoring.prometheus.enabled }}
1+
{{- if and .Values.inferenceExtension.serviceMonitor.enabled .Values.inferenceExtension.serviceMonitor.auth.enabled (ne (lower .Values.provider.name) "gke") }}
22
apiVersion: v1
33
kind: Secret
44
metadata:
5-
name: {{ .Values.inferenceExtension.monitoring.secret.name }}
5+
name: {{ .Values.inferenceExtension.serviceMonitor.auth.secretName }}
66
namespace: {{ .Release.Namespace }}
77
labels:
88
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}

config/charts/inferencepool/templates/epp-servicemonitor.yaml

Lines changed: 8 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,20 +1,25 @@
1-
{{- if .Values.inferenceExtension.monitoring.prometheus.enabled }}
1+
{{- if and .Values.inferenceExtension.serviceMonitor.enabled (ne (lower .Values.provider.name) "gke") }}
22
apiVersion: monitoring.coreos.com/v1
33
kind: ServiceMonitor
44
metadata:
55
name: {{ include "gateway-api-inference-extension.name" . }}-monitor
66
namespace: {{ .Release.Namespace }}
77
labels:
88
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
9+
{{- with .Values.inferenceExtension.serviceMonitor.extraLabels }}
10+
{{- toYaml . | nindent 4 }}
11+
{{- end }}
912
spec:
1013
endpoints:
11-
- interval: {{ .Values.inferenceExtension.monitoring.interval }}
14+
- interval: {{ .Values.inferenceExtension.serviceMonitor.interval }}
1215
port: "http-metrics"
1316
path: "/metrics"
17+
{{- if .Values.inferenceExtension.serviceMonitor.auth.enabled }}
1418
authorization:
1519
credentials:
1620
key: token
17-
name: {{ .Values.inferenceExtension.monitoring.secret.name }}
21+
name: {{ .Values.inferenceExtension.serviceMonitor.auth.secretName }}
22+
{{- end }}
1823
jobLabel: {{ include "gateway-api-inference-extension.name" . }}
1924
namespaceSelector:
2025
matchNames:

config/charts/inferencepool/templates/gke.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,7 @@ spec:
4040
logging:
4141
enabled: true # log all requests by default
4242
---
43-
{{- if .Values.inferenceExtension.monitoring.gke.enabled }}
43+
{{- if and .Values.inferenceExtension.serviceMonitor.enabled .Values.inferenceExtension.serviceMonitor.auth.enabled }}
4444
{{- $metricsReadSA := printf "%s-metrics-reader-sa" .Release.Name -}}
4545
{{- $metricsReadSecretName := printf "%s-metrics-reader-secret" .Release.Name -}}
4646
{{- $metricsReadRoleName := printf "%s-%s-metrics-reader" .Release.Namespace .Release.Name -}}
@@ -83,7 +83,7 @@ spec:
8383
endpoints:
8484
- port: metrics
8585
scheme: http
86-
interval: {{ .Values.inferenceExtension.monitoring.interval }}
86+
interval: {{ .Values.inferenceExtension.serviceMonitor.interval }}
8787
path: /metrics
8888
authorization:
8989
type: Bearer

config/charts/inferencepool/templates/rbac.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@ rules:
1717
- subjectaccessreviews
1818
verbs:
1919
- create
20-
{{- if .Values.inferenceExtension.monitoring.prometheus.enabled }}
20+
{{- if .Values.inferenceExtension.serviceMonitor.enabled }}
2121
- nonResourceURLs:
2222
- "/metrics"
2323
verbs:

config/charts/inferencepool/values.yaml

Lines changed: 9 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -40,19 +40,16 @@ inferenceExtension:
4040

4141
tolerations: []
4242

43-
# Monitoring configuration for EPP
44-
monitoring:
43+
# When enabled, a Prometheus ServiceMonitor is created to collect EPP metrics
44+
serviceMonitor:
45+
enabled: true
4546
interval: "10s"
46-
# Service account token secret for authentication
47-
secret:
48-
name: inference-gateway-sa-metrics-reader-secret
49-
50-
# Prometheus ServiceMonitor will be created when enabled for EPP metrics collection
51-
prometheus:
52-
enabled: false
53-
54-
gke:
55-
enabled: false
47+
auth:
48+
enabled: true
49+
# Name of the Secret holding the service account token used for authentication
50+
secretName: inference-gateway-sa-metrics-reader-secret
51+
# Additional labels to add to the ServiceMonitor
52+
extraLabels: {}
5653

5754
inferencePool:
5855
targetPorts:

0 commit comments

Comments
 (0)