|
| 1 | +{{- $functionNs := default .Release.Namespace .Values.functionNamespace }} |
| 2 | + |
| 3 | +# License: OpenFaaS Pro EULA |
| 4 | +# Any use, modification or copying without an OpenFaaS Pro license is prohibited |
| 5 | +# All rights reserved OpenFaaS Ltd 2023 |
| 6 | + |
| 7 | +{{- if .Values.prometheus.create }} |
| 8 | +{{- if .Values.openfaasPro }} |
| 9 | +--- |
| 10 | +kind: ConfigMap |
| 11 | +apiVersion: v1 |
| 12 | +metadata: |
| 13 | + labels: |
| 14 | + app: {{ template "openfaas.name" . }} |
| 15 | + chart: {{ .Chart.Name }}-{{ .Chart.Version }} |
| 16 | + component: prometheus-config |
| 17 | + heritage: {{ .Release.Service }} |
| 18 | + release: {{ .Release.Name }} |
| 19 | + name: prometheus-config |
| 20 | + namespace: {{ .Release.Namespace | quote }} |
| 21 | +data: |
| 22 | + prometheus.yml: | |
| 23 | + global: |
| 24 | + scrape_interval: 15s |
| 25 | + evaluation_interval: 15s |
| 26 | + external_labels: |
| 27 | + monitor: 'faas-monitor' |
| 28 | +
|
| 29 | + rule_files: |
| 30 | + - 'prometheus-rules.yml' |
| 31 | +
|
| 32 | + scrape_configs: |
| 33 | + - job_name: 'prometheus' |
| 34 | + scrape_interval: 10s |
| 35 | + static_configs: |
| 36 | + - targets: ['localhost:9090'] |
| 37 | +
|
| 38 | + # Capture endpoints in the release namespace whose Service carries the |
| 39 | + # prometheus.io/scrape: "true" annotation, such as the gateway-provider service. |
| 40 | + - job_name: 'openfaas-endpoints' |
| 41 | + kubernetes_sd_configs: |
| 42 | + - role: endpoints |
| 43 | + namespaces: |
| 44 | + names: |
| 45 | + - {{ .Release.Namespace }} |
| 46 | + relabel_configs: |
| 47 | + - action: labelmap |
| 48 | + regex: __meta_kubernetes_service_label_(.+) |
| 49 | + - source_labels: [__meta_kubernetes_namespace] |
| 50 | + action: replace |
| 51 | + target_label: kubernetes_namespace |
| 52 | + - source_labels: [__meta_kubernetes_service_name] |
| 53 | + action: replace |
| 54 | + target_label: kubernetes_name |
| 55 | +
|
| 56 | + - source_labels: [__address__, __meta_kubernetes_service_annotation_prometheus_io_port] |
| 57 | + separator: ; |
| 58 | + regex: ([^:]+)(?::\d+)?;(\d+) |
| 59 | + target_label: __address__ |
| 60 | + replacement: $1:$2 |
| 61 | + action: replace |
| 62 | +
|
| 63 | + - source_labels: [__meta_kubernetes_service_annotation_prometheus_io_scrape] |
| 64 | + action: keep |
| 65 | + regex: true |
| 66 | +
|
| 67 | + - job_name: 'kubernetes-pods' |
| 68 | + scrape_interval: 5s |
| 69 | + honor_labels: false |
| 70 | + kubernetes_sd_configs: |
| 71 | + - role: pod |
| 72 | + namespaces: |
| 73 | + names: |
| 74 | + - {{ .Release.Namespace }} |
| 75 | +{{- if ne $functionNs (.Release.Namespace | toString) }} |
| 76 | + - {{ $functionNs }} |
| 77 | +{{- end }} |
| 78 | + relabel_configs: |
| 79 | + - action: labelmap |
| 80 | + regex: __meta_kubernetes_pod_label_(.+) |
| 81 | + - source_labels: [__meta_kubernetes_namespace] |
| 82 | + action: replace |
| 83 | + target_label: kubernetes_namespace |
| 84 | + - source_labels: [__meta_kubernetes_pod_name] |
| 85 | + action: replace |
| 86 | + target_label: kubernetes_pod_name |
| 87 | + - source_labels: [__meta_kubernetes_pod_annotation_prometheus_io_scrape] |
| 88 | + action: keep |
| 89 | + regex: true |
| 90 | + - source_labels: [__address__, __meta_kubernetes_pod_annotation_prometheus_io_port] |
| 91 | + action: replace |
| 92 | + regex: ([^:]+)(?::\d+)?;(\d+) |
| 93 | + replacement: $1:$2 |
| 94 | + target_label: __address__ |
| 95 | + - action: replace |
| 96 | + regex: (.+) |
| 97 | + source_labels: |
| 98 | + - __meta_kubernetes_pod_annotation_prometheus_io_path |
| 99 | + target_label: __metrics_path__ |
| 100 | + |
| 101 | + - job_name: 'kubernetes-resource-metrics' |
| 102 | + scrape_interval: 10s |
| 103 | + scheme: https |
| 104 | + tls_config: |
| 105 | + ca_file: /var/run/secrets/kubernetes.io/serviceaccount/ca.crt |
| 106 | + insecure_skip_verify: true |
| 107 | + bearer_token_file: /var/run/secrets/kubernetes.io/serviceaccount/token |
| 108 | + kubernetes_sd_configs: |
| 109 | + - role: node |
| 110 | + relabel_configs: |
| 111 | + - action: labelmap |
| 112 | + regex: __meta_kubernetes_node_label_(.+) |
| 113 | + - target_label: __address__ |
| 114 | + replacement: kubernetes.default.svc:443 |
| 115 | + - source_labels: [__meta_kubernetes_node_name] |
| 116 | + regex: (.+) |
| 117 | + target_label: __metrics_path__ |
| 118 | + replacement: /api/v1/nodes/${1}/proxy/metrics/resource |
| 119 | + metric_relabel_configs: |
| 120 | + - source_labels: [__name__] |
| 121 | + regex: (pod)_(cpu|memory)_(.+) |
| 122 | + action: keep |
| 123 | + # Exclude container metrics (defensive: the keep rule above already discards every series not named pod_cpu_* or pod_memory_*) |
| 124 | + - source_labels: [__name__] |
| 125 | + regex: container_(.+) |
| 126 | + action: drop |
| 127 | + - action: replace |
| 128 | + source_labels: |
| 129 | + - namespace |
| 130 | + regex: '(.*)' |
| 131 | + replacement: '$1' |
| 132 | + target_label: kubernetes_namespace |
| 133 | + # Derive the deployment name by stripping the last two dash-separated segments of the pod name |
| 134 | + - action: replace |
| 135 | + source_labels: |
| 136 | + - pod |
| 137 | + regex: '^([0-9a-zA-Z-]+)+(-[0-9a-zA-Z]+-[0-9a-zA-Z]+)$' |
| 138 | + replacement: '$1' |
| 139 | + target_label: deployment_name |
| 140 | + # Output fully-qualified function name fn.ns |
| 141 | + - source_labels: [deployment_name, kubernetes_namespace] |
| 142 | + separator: ";" |
| 143 | + regex: '(.*);(.*)' |
| 144 | + replacement: '${1}.${2}' |
| 145 | + target_label: "function_name" |
| 146 | + |
| 147 | + prometheus-rules.yml: | |
| 148 | + groups: |
| 149 | + - name: load |
| 150 | + rules: |
| 151 | + - record: job:function_current_load:sum |
| 152 | + expr: sum by (function_name) ( rate( gateway_function_invocation_total{}[30s] ) ) and avg by (function_name) (gateway_service_target_load{scaling_type="rps"}) > 1 |
| 153 | + labels: |
| 154 | + scaling_type: rps |
| 155 | +
|
| 156 | + - record: job:function_current_load:sum |
| 157 | + expr: sum by (function_name) ( max_over_time( gateway_function_invocation_inflight[45s:5s])) and on (function_name) avg by(function_name) (gateway_service_target_load{scaling_type="capacity"}) > bool 1 |
| 158 | + labels: |
| 159 | + scaling_type: capacity |
| 160 | +
|
| 161 | + - record: job:function_current_load:sum |
| 162 | + expr: sum(irate ( pod_cpu_usage_seconds_total{}[1m])*1000) by (function_name) * on (function_name) avg by (function_name) (gateway_service_target_load{scaling_type="cpu"} > bool 1 ) |
| 163 | + labels: |
| 164 | + scaling_type: cpu |
| 165 | +
|
| 166 | + - name: recently_started_1m |
| 167 | + interval: 10s |
| 168 | + rules: |
| 169 | + - record: job:function_current_started:max_sum |
| 170 | + expr: max_over_time(sum by (function_name) (rate( gateway_function_invocation_started{}[1m]))[1m:5s]) > 0 |
| 171 | +
|
| 172 | +{{- end }} |
| 173 | +{{- end }} |
0 commit comments