File tree Expand file tree Collapse file tree 6 files changed +23
-21
lines changed
config/charts/inferencepool Expand file tree Collapse file tree 6 files changed +23
-21
lines changed Original file line number Diff line number Diff line change 62
62
- " --{{ .name }}"
63
63
- " {{ .value }}"
64
64
{{- end }}
65
- {{- if not .Values.inferenceExtension.serviceMonitor.auth.enabled }}
65
+ {{- if not .Values.inferenceExtension.monitoring.prometheus.enabled }}
66
66
- --metrics-endpoint-auth=false
67
67
{{- end }}
68
68
ports :
Original file line number Diff line number Diff line change 1
- {{- if and .Values.inferenceExtension.serviceMonitor.enabled .Values.inferenceExtension.serviceMonitor.auth.enabled (ne (lower .Values.provider.name) "gke") }}
1
+ {{- if and .Values.inferenceExtension.monitoring.prometheus.enabled .Values.inferenceExtension.monitoring.prometheus.auth.enabled (ne (lower .Values.provider.name) "gke") }}
2
2
apiVersion : v1
3
3
kind : Secret
4
4
metadata :
5
- name: {{ .Values.inferenceExtension.serviceMonitor.auth.secretName }}
5
+ name: {{ .Values.inferenceExtension.monitoring.prometheus.auth.secretName }}
6
6
namespace : {{ .Release.Namespace }}
7
7
labels :
8
8
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
Original file line number Diff line number Diff line change 1
- {{- if and .Values.inferenceExtension.serviceMonitor.enabled (ne (lower .Values.provider.name) "gke") }}
1
+ {{- if and .Values.inferenceExtension.monitoring.prometheus.enabled (ne (lower .Values.provider.name) "gke") }}
2
2
apiVersion : monitoring.coreos.com/v1
3
3
kind : ServiceMonitor
4
4
metadata :
5
5
name : {{ include "gateway-api-inference-extension.name" . }}-monitor
6
6
namespace : {{ .Release.Namespace }}
7
7
labels :
8
8
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
9
- {{- with .Values.inferenceExtension.serviceMonitor.extraLabels }}
9
+ {{- with .Values.inferenceExtension.monitoring.prometheus.extraLabels }}
10
10
{{- toYaml . | nindent 4 }}
11
11
{{- end }}
12
12
spec :
13
13
endpoints :
14
- - interval: {{ .Values.inferenceExtension.serviceMonitor.interval }}
14
+ - interval: {{ .Values.inferenceExtension.monitoring.prometheus.interval }}
15
15
port: "http-metrics"
16
16
path: "/metrics"
17
- {{- if .Values.inferenceExtension.serviceMonitor.auth.enabled }}
17
+ {{- if .Values.inferenceExtension.monitoring.prometheus.auth.enabled }}
18
18
authorization :
19
19
credentials :
20
20
key : token
21
- name: {{ .Values.inferenceExtension.serviceMonitor.auth.secretName }}
21
+ name: {{ .Values.inferenceExtension.monitoring.prometheus.auth.secretName }}
22
22
{{- end }}
23
23
jobLabel : {{ include "gateway-api-inference-extension.name" . }}
24
24
namespaceSelector :
Original file line number Diff line number Diff line change 40
40
logging :
41
41
enabled : true # log all requests by default
42
42
---
43
- {{- if and .Values.inferenceExtension.serviceMonitor.enabled .Values.inferenceExtension.serviceMonitor.auth.enabled }}
43
+ {{- if and .Values.inferenceExtension.monitoring.prometheus.enabled .Values.inferenceExtension.monitoring.prometheus.auth.enabled }}
44
44
{{- $metricsReadSA := printf "%s-metrics-reader-sa" .Release.Name -}}
45
45
{{- $metricsReadSecretName := printf "%s-metrics-reader-secret" .Release.Name -}}
46
46
{{- $metricsReadRoleName := printf "%s-%s-metrics-reader" .Release.Namespace .Release.Name -}}
83
83
endpoints :
84
84
- port : metrics
85
85
scheme : http
86
- interval: {{ .Values.inferenceExtension.serviceMonitor.interval }}
86
+ interval: {{ .Values.inferenceExtension.monitoring.prometheus.interval }}
87
87
path : /metrics
88
88
authorization :
89
89
type : Bearer
Original file line number Diff line number Diff line change 17
17
- subjectaccessreviews
18
18
verbs :
19
19
- create
20
- {{- if .Values.inferenceExtension.serviceMonitor.enabled }}
20
+ {{- if .Values.inferenceExtension.monitoring.prometheus.enabled }}
21
21
- nonResourceURLs :
22
22
- " /metrics"
23
23
verbs :
Original file line number Diff line number Diff line change @@ -40,16 +40,18 @@ inferenceExtension:
40
40
41
41
tolerations : []
42
42
43
- # Prometheus ServiceMonitor will be created when enabled for EPP metrics collection
44
- serviceMonitor :
45
- enabled : true
46
- interval: "10s"
47
- auth :
48
- enabled : true
49
- # Service account token secret for authentication
50
- secretName : inference-gateway-sa-metrics-reader-secret
51
- # additional labels for the ServiceMonitor
52
- extraLabels : {}
43
+ # Monitoring configuration for EPP
44
+ monitoring :
45
+ # Prometheus ServiceMonitor will be created when enabled for EPP metrics collection
46
+ prometheus :
47
+ enabled : false
48
+ interval: "10s"
49
+ auth :
50
+ enabled : true
51
+ # Service account token secret for authentication
52
+ secretName : inference-gateway-sa-metrics-reader-secret
53
+ # additional labels for the ServiceMonitor
54
+ extraLabels : {}
53
55
54
56
inferencePool :
55
57
targetPorts :
You can’t perform that action at this time.
0 commit comments