Skip to content

Commit b9b9443

Browse files
authored
Merge pull request #754 from phillebaba/more/multicluster
Fix multicluster labels
2 parents a2196d1 + 64aa572 commit b9b9443

File tree

3 files changed

+9
-9
lines changed

3 files changed

+9
-9
lines changed

alerts/kubelet.libsonnet

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -52,11 +52,11 @@
5252
// Some nodes have a capacity of 1, like AWS Fargate nodes, and only exist while a pod is running on them.
5353
// We have to ignore these special nodes in the KubeletTooManyPods alert.
5454
expr: |||
55-
count by(node) (
56-
(kube_pod_status_phase{%(kubeStateMetricsSelector)s,phase="Running"} == 1) * on(instance,pod,namespace,cluster) group_left(node) topk by(instance,pod,namespace,cluster) (1, kube_pod_info{%(kubeStateMetricsSelector)s})
55+
count by(%(clusterLabel)s, node) (
56+
(kube_pod_status_phase{%(kubeStateMetricsSelector)s,phase="Running"} == 1) * on(instance,pod,namespace,%(clusterLabel)s) group_left(node) topk by(instance,pod,namespace,%(clusterLabel)s) (1, kube_pod_info{%(kubeStateMetricsSelector)s})
5757
)
5858
/
59-
max by(node) (
59+
max by(%(clusterLabel)s, node) (
6060
kube_node_status_capacity{%(kubeStateMetricsSelector)s,resource="pods"} != 1
6161
) > 0.95
6262
||| % $._config,
@@ -72,7 +72,7 @@
7272
{
7373
alert: 'KubeNodeReadinessFlapping',
7474
expr: |||
75-
sum(changes(kube_node_status_condition{status="true",condition="Ready"}[15m])) by (node) > 2
75+
sum(changes(kube_node_status_condition{status="true",condition="Ready"}[15m])) by (%(clusterLabel)s, node) > 2
7676
||| % $._config,
7777
'for': '15m',
7878
labels: {

alerts/system_alerts.libsonnet

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -28,11 +28,11 @@
2828
// this is normal and an expected error, therefore it should be
2929
// ignored in this alert.
3030
expr: |||
31-
(sum(rate(rest_client_requests_total{code=~"5.."}[5m])) by (instance, job, namespace)
31+
(sum(rate(rest_client_requests_total{code=~"5.."}[5m])) by (%(clusterLabel)s, instance, job, namespace)
3232
/
33-
sum(rate(rest_client_requests_total[5m])) by (instance, job, namespace))
33+
sum(rate(rest_client_requests_total[5m])) by (%(clusterLabel)s, instance, job, namespace))
3434
> 0.01
35-
|||,
35+
||| % $._config,
3636
'for': '15m',
3737
labels: {
3838
severity: 'warning',

rules/node.libsonnet

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -20,8 +20,8 @@
2020
// below for instance.
2121
record: 'node_namespace_pod:kube_pod_info:',
2222
expr: |||
23-
topk by(namespace, %(podLabel)s) (1,
24-
max by (node, namespace, %(podLabel)s) (
23+
topk by(%(clusterLabel)s, namespace, %(podLabel)s) (1,
24+
max by (%(clusterLabel)s, node, namespace, %(podLabel)s) (
2525
label_replace(kube_pod_info{%(kubeStateMetricsSelector)s,node!=""}, "%(podLabel)s", "$1", "pod", "(.*)")
2626
))
2727
||| % $._config,

0 commit comments

Comments
 (0)