Skip to content

Commit 5106e5a

Browse files
committed
Add cluster label to resource alerts
1 parent b8f44bb commit 5106e5a

File tree

1 file changed

+12
-12
lines changed

1 file changed

+12
-12
lines changed

alerts/resource_alerts.libsonnet

Lines changed: 12 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -25,65 +25,65 @@
2525
{
2626
alert: 'KubeCPUOvercommit',
2727
expr: |||
28-
sum(namespace_cpu:kube_pod_container_resource_requests:sum{%(ignoringOverprovisionedWorkloadSelector)s}) - (sum(kube_node_status_allocatable{resource="cpu"}) - max(kube_node_status_allocatable{resource="cpu"})) > 0
28+
sum(namespace_cpu:kube_pod_container_resource_requests:sum{%(ignoringOverprovisionedWorkloadSelector)s}) by (%(clusterLabel)s) - (sum(kube_node_status_allocatable{resource="cpu"}) by (%(clusterLabel)s) - max(kube_node_status_allocatable{resource="cpu"}) by (%(clusterLabel)s)) > 0
2929
and
30-
(sum(kube_node_status_allocatable{resource="cpu"}) - max(kube_node_status_allocatable{resource="cpu"})) > 0
30+
(sum(kube_node_status_allocatable{resource="cpu"}) by (%(clusterLabel)s) - max(kube_node_status_allocatable{resource="cpu"}) by (%(clusterLabel)s)) > 0
3131
||| % $._config,
3232
labels: {
3333
severity: 'warning',
3434
},
3535
annotations: {
36-
description: 'Cluster has overcommitted CPU resource requests for Pods by {{ $value }} CPU shares and cannot tolerate node failure.',
36+
// Reference the configured cluster label rather than a hard-coded `cluster`, so the annotation resolves to the same label the expr aggregates by.
description: 'Cluster {{ $labels.%(clusterLabel)s }} has overcommitted CPU resource requests for Pods by {{ $value }} CPU shares and cannot tolerate node failure.' % $._config,
3737
summary: 'Cluster has overcommitted CPU resource requests.',
3838
},
3939
'for': '10m',
4040
},
4141
{
4242
alert: 'KubeMemoryOvercommit',
4343
expr: |||
44-
sum(namespace_memory:kube_pod_container_resource_requests:sum{%(ignoringOverprovisionedWorkloadSelector)s}) - (sum(kube_node_status_allocatable{resource="memory"}) - max(kube_node_status_allocatable{resource="memory"})) > 0
44+
sum(namespace_memory:kube_pod_container_resource_requests:sum{%(ignoringOverprovisionedWorkloadSelector)s}) by (%(clusterLabel)s) - (sum(kube_node_status_allocatable{resource="memory"}) by (%(clusterLabel)s) - max(kube_node_status_allocatable{resource="memory"}) by (%(clusterLabel)s)) > 0
4545
and
46-
(sum(kube_node_status_allocatable{resource="memory"}) - max(kube_node_status_allocatable{resource="memory"})) > 0
46+
(sum(kube_node_status_allocatable{resource="memory"}) by (%(clusterLabel)s) - max(kube_node_status_allocatable{resource="memory"}) by (%(clusterLabel)s)) > 0
4747
||| % $._config,
4848
labels: {
4949
severity: 'warning',
5050
},
5151
annotations: {
52-
description: 'Cluster has overcommitted memory resource requests for Pods by {{ $value | humanize }} bytes and cannot tolerate node failure.',
52+
// Reference the configured cluster label rather than a hard-coded `cluster`, so the annotation resolves to the same label the expr aggregates by.
description: 'Cluster {{ $labels.%(clusterLabel)s }} has overcommitted memory resource requests for Pods by {{ $value | humanize }} bytes and cannot tolerate node failure.' % $._config,
5353
summary: 'Cluster has overcommitted memory resource requests.',
5454
},
5555
'for': '10m',
5656
},
5757
{
5858
alert: 'KubeCPUQuotaOvercommit',
5959
expr: |||
60-
sum(min without(resource) (kube_resourcequota{%(prefixedNamespaceSelector)s%(kubeStateMetricsSelector)s, type="hard", resource=~"(cpu|requests.cpu)"}))
60+
sum(min without(resource) (kube_resourcequota{%(prefixedNamespaceSelector)s%(kubeStateMetricsSelector)s, type="hard", resource=~"(cpu|requests.cpu)"})) by (%(clusterLabel)s)
6161
/
62-
sum(kube_node_status_allocatable{resource="cpu", %(kubeStateMetricsSelector)s})
62+
sum(kube_node_status_allocatable{resource="cpu", %(kubeStateMetricsSelector)s}) by (%(clusterLabel)s)
6363
> %(namespaceOvercommitFactor)s
6464
||| % $._config,
6565
labels: {
6666
severity: 'warning',
6767
},
6868
annotations: {
69-
description: 'Cluster has overcommitted CPU resource requests for Namespaces.',
69+
// Reference the configured cluster label rather than a hard-coded `cluster`, so the annotation resolves to the same label the expr aggregates by.
description: 'Cluster {{ $labels.%(clusterLabel)s }} has overcommitted CPU resource requests for Namespaces.' % $._config,
7070
summary: 'Cluster has overcommitted CPU resource requests.',
7171
},
7272
'for': '5m',
7373
},
7474
{
7575
alert: 'KubeMemoryQuotaOvercommit',
7676
expr: |||
77-
sum(min without(resource) (kube_resourcequota{%(prefixedNamespaceSelector)s%(kubeStateMetricsSelector)s, type="hard", resource=~"(memory|requests.memory)"}))
77+
sum(min without(resource) (kube_resourcequota{%(prefixedNamespaceSelector)s%(kubeStateMetricsSelector)s, type="hard", resource=~"(memory|requests.memory)"})) by (%(clusterLabel)s)
7878
/
79-
sum(kube_node_status_allocatable{resource="memory", %(kubeStateMetricsSelector)s})
79+
sum(kube_node_status_allocatable{resource="memory", %(kubeStateMetricsSelector)s}) by (%(clusterLabel)s)
8080
> %(namespaceOvercommitFactor)s
8181
||| % $._config,
8282
labels: {
8383
severity: 'warning',
8484
},
8585
annotations: {
86-
description: 'Cluster has overcommitted memory resource requests for Namespaces.',
86+
// Reference the configured cluster label rather than a hard-coded `cluster`, so the annotation resolves to the same label the expr aggregates by.
description: 'Cluster {{ $labels.%(clusterLabel)s }} has overcommitted memory resource requests for Namespaces.' % $._config,
8787
summary: 'Cluster has overcommitted memory resource requests.',
8888
},
8989
'for': '5m',

0 commit comments

Comments
 (0)