# Rule files loaded by these unit tests.
rule_files:
- ../prometheus_rules.yaml
- ../prometheus_alerts.yaml

# Interval at which the loaded rules are evaluated while the tests run.
evaluation_interval: 1m
@@ -26,3 +27,38 @@ tests:
26
27
labels : ' node_quantile:kubelet_pleg_relist_duration_seconds:histogram_quantile{cluster="cluster",instance="ip-172-0-0-1", node="ip-172-0-0-1", quantile="0.9"}'
27
28
- value : 0.99
28
29
labels : ' node_quantile:kubelet_pleg_relist_duration_seconds:histogram_quantile{cluster="cluster",instance="ip-172-0-0-1", node="ip-172-0-0-1", quantile="0.99"}'
# Unit test for the KubeletPodStartUpLatencyHigh alert. Every input series is
# supplied twice, once with an extra dupe="dupe" label, so that (per the test
# name) the alert is also exercised against duplicate series.
- name: "KubeletPodStartUpLatencyHigh alert test, including duplicate series check"
  interval: 1m
  input_series:
  # Histogram buckets: le="99" and le="+Inf" grow at the same rate, i.e. every
  # observation lands in the le="99" bucket.
  - series: 'kubelet_pod_worker_duration_seconds_bucket{cluster="cluster",instance="ip-172-0-0-1",job="kubelet",le="+Inf"}'
    values: '0+1x16'
  - series: 'kubelet_pod_worker_duration_seconds_bucket{cluster="cluster",instance="ip-172-0-0-1",job="kubelet",le="+Inf",dupe="dupe"}'
    values: '0+1x16'
  - series: 'kubelet_pod_worker_duration_seconds_bucket{cluster="cluster",instance="ip-172-0-0-1",job="kubelet",le="99"}'
    values: '0+1x16'
  - series: 'kubelet_pod_worker_duration_seconds_bucket{cluster="cluster",instance="ip-172-0-0-1",job="kubelet",le="99",dupe="dupe"}'
    values: '0+1x16'
  # Observation counters, increasing in step with the buckets.
  - series: 'kubelet_pod_worker_duration_seconds_count{cluster="cluster",instance="ip-172-0-0-1",job="kubelet"}'
    values: '0+1x16'
  - series: 'kubelet_pod_worker_duration_seconds_count{cluster="cluster",instance="ip-172-0-0-1",job="kubelet",dupe="dupe"}'
    values: '0+1x16'
  # Constant series carrying the `node` label expected on the fired alert.
  - series: 'kubelet_node_name{cluster="cluster",node="ip-172-0-0-1",instance="ip-172-0-0-1",job="kubelet"}'
    values: '1x16'
  - series: 'kubelet_node_name{cluster="cluster",node="ip-172-0-0-1",instance="ip-172-0-0-1",job="kubelet",dupe="dupe"}'
    values: '1x16'
  alert_rule_test:
  # No exp_alerts listed: the alert must not be firing yet at 15m.
  # NOTE(review): presumably the rule's `for` duration has not elapsed here;
  # confirm against ../prometheus_alerts.yaml.
  - eval_time: 15m
    alertname: KubeletPodStartUpLatencyHigh
  # One minute later exactly one alert is expected, with these labels and
  # annotations.
  - eval_time: 16m
    alertname: KubeletPodStartUpLatencyHigh
    exp_alerts:
    - exp_labels:
        severity: warning
        cluster: cluster
        instance: ip-172-0-0-1
        node: ip-172-0-0-1
      exp_annotations:
        summary: "Kubelet Pod startup latency is too high."
        # NOTE(review): 98.01 presumably is the 99th percentile interpolated
        # inside the le="99" bucket (0.99 * 99); confirm against the rule.
        description: "Kubelet Pod startup 99th percentile latency is 98.01 seconds on node ip-172-0-0-1."
        runbook_url: "https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeletpodstartuplatencyhigh"
0 commit comments