File tree Expand file tree Collapse file tree 6 files changed +25
-20
lines changed
config/charts/inferencepool Expand file tree Collapse file tree 6 files changed +25
-20
lines changed Original file line number Diff line number Diff line change 62
62
- " --{{ .name }}"
63
63
- " {{ .value }}"
64
64
{{- end }}
65
+ {{- if not .Values.inferenceExtension.serviceMonitor.auth.enabled }}
66
+ - --metrics-endpoint-auth=false
67
+ {{- end }}
65
68
ports :
66
69
- name : grpc
67
70
containerPort : 9002
Original file line number Diff line number Diff line change 1
- {{- if .Values.inferenceExtension.monitoring.prometheus. enabled }}
1
+ {{- if and .Values.inferenceExtension.serviceMonitor.enabled .Values.inferenceExtension.serviceMonitor.auth. enabled (ne (lower .Values.provider.name) "gke") }}
2
2
apiVersion : v1
3
3
kind : Secret
4
4
metadata :
5
- name : {{ .Values.inferenceExtension.monitoring.secret.name }}
5
+ name : {{ .Values.inferenceExtension.serviceMonitor.auth.secretName }}
6
6
namespace : {{ .Release.Namespace }}
7
7
labels :
8
8
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
Original file line number Diff line number Diff line change 1
- {{- if .Values.inferenceExtension.monitoring.prometheus. enabled }}
1
+ {{- if and .Values.inferenceExtension.serviceMonitor. enabled (ne (lower .Values.provider.name) "gke") }}
2
2
apiVersion : monitoring.coreos.com/v1
3
3
kind : ServiceMonitor
4
4
metadata :
5
5
name : {{ include "gateway-api-inference-extension.name" . }}-monitor
6
6
namespace : {{ .Release.Namespace }}
7
7
labels :
8
8
{{- include "gateway-api-inference-extension.labels" . | nindent 4 }}
9
+ {{- with .Values.inferenceExtension.serviceMonitor.extraLabels }}
10
+ {{- toYaml . | nindent 4 }}
11
+ {{- end }}
9
12
spec :
10
13
endpoints :
11
- - interval : {{ .Values.inferenceExtension.monitoring .interval }}
14
+ - interval : {{ .Values.inferenceExtension.serviceMonitor .interval }}
12
15
port : " http-metrics"
13
16
path : " /metrics"
17
+ {{- if .Values.inferenceExtension.serviceMonitor.auth.enabled }}
14
18
authorization :
15
19
credentials :
16
20
key : token
17
- name : {{ .Values.inferenceExtension.monitoring.secret.name }}
21
+ name : {{ .Values.inferenceExtension.serviceMonitor.auth.secretName }}
22
+ {{- end }}
18
23
jobLabel : {{ include "gateway-api-inference-extension.name" . }}
19
24
namespaceSelector :
20
25
matchNames :
Original file line number Diff line number Diff line change 40
40
logging :
41
41
enabled : true # log all requests by default
42
42
---
43
- {{- if .Values.inferenceExtension.monitoring.gke .enabled }}
43
+ {{- if and .Values.inferenceExtension.serviceMonitor.enabled .Values.inferenceExtension.serviceMonitor.auth .enabled }}
44
44
{{- $metricsReadSA := printf "%s-metrics-reader-sa" .Release.Name -}}
45
45
{{- $metricsReadSecretName := printf "%s-metrics-reader-secret" .Release.Name -}}
46
46
{{- $metricsReadRoleName := printf "%s-%s-metrics-reader" .Release.Namespace .Release.Name -}}
83
83
endpoints :
84
84
- port : metrics
85
85
scheme : http
86
- interval : {{ .Values.inferenceExtension.monitoring .interval }}
86
+ interval : {{ .Values.inferenceExtension.serviceMonitor .interval }}
87
87
path : /metrics
88
88
authorization :
89
89
type : Bearer
Original file line number Diff line number Diff line change 17
17
- subjectaccessreviews
18
18
verbs :
19
19
- create
20
- {{- if .Values.inferenceExtension.monitoring.prometheus .enabled }}
20
+ {{- if .Values.inferenceExtension.serviceMonitor .enabled }}
21
21
- nonResourceURLs :
22
22
- " /metrics"
23
23
verbs :
Original file line number Diff line number Diff line change @@ -40,19 +40,16 @@ inferenceExtension:
40
40
41
41
tolerations : []
42
42
43
- # Monitoring configuration for EPP
44
- monitoring :
43
+ # Prometheus ServiceMonitor will be created when enabled for EPP metrics collection
44
+ serviceMonitor :
45
+ enabled : true
45
46
interval : " 10s"
46
- # Service account token secret for authentication
47
- secret :
48
- name : inference-gateway-sa-metrics-reader-secret
49
-
50
- # Prometheus ServiceMonitor will be created when enabled for EPP metrics collection
51
- prometheus :
52
- enabled : false
53
-
54
- gke :
55
- enabled : false
47
+ auth :
48
+ enabled : true
49
+ # Service account token secret for authentication
50
+ secretName : inference-gateway-sa-metrics-reader-secret
51
+ # additional labels for the ServiceMonitor
52
+ extraLabels : {}
56
53
57
54
inferencePool :
58
55
targetPorts :
You can’t perform that action at this time.
0 commit comments