@@ -1323,3 +1323,107 @@ tests:
13231323 description : ' Cluster has overcommitted memory resource requests for Namespaces.'
13241324 runbook_url : " https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubememoryquotaovercommit"
13251325 summary : " Cluster has overcommitted memory resource requests."
1326+
1327+ - name : KubeCPUOvercommit alert (single-node)
1328+ interval : 1m # key of the named test group above (previously started a separate, unnamed list item)
1329+ input_series : # two namespace request series (1 each, 2 in total) against a single node
1330+ - series : ' namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
1331+ values : ' 1x10'
1332+ - series : ' namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
1333+ values : ' 1x10'
1334+ - series : ' kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="cpu", job="kube-state-metrics"}'
1335+ values : ' 1.9x10' # This value was seen on a 2x vCPU node
1336+ - series : ' kube_node_info{cluster="kubernetes", node="n1", job="kube-state-metrics"}'
1337+ values : ' 1x10'
1338+ alert_rule_test :
1339+ - eval_time : 9m # no exp_alerts listed: the alert must not be firing at this time
1340+ alertname : KubeCPUOvercommit
1341+ - eval_time : 10m # the alert is expected to be firing at this time
1342+ alertname : KubeCPUOvercommit
1343+ exp_alerts :
1344+ - exp_labels :
1345+ severity : warning
1346+ exp_annotations : # NOTE(review): 0.385 presumably = 2 requested - 0.85 * 1.9 allocatable; confirm against the alert expression
1347+ description : Cluster has overcommitted CPU resource requests for Pods by 0.385 CPU shares and cannot tolerate node failure.
1348+ runbook_url : https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubecpuovercommit
1349+ summary : Cluster has overcommitted CPU resource requests.
1350+
1351+ - name : KubeCPUOvercommit alert (multi-node)
1352+ interval : 1m # key of the named test group above (previously started a separate, unnamed list item)
1353+ input_series : # two namespace request series (2 each, 4 in total) against two nodes of 1.9 allocatable each
1354+ - series : ' namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
1355+ values : ' 2x10'
1356+ - series : ' namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
1357+ values : ' 2x10'
1358+ - series : ' kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="cpu", job="kube-state-metrics"}'
1359+ values : ' 1.9x10' # This value was seen on a 2x vCPU node
1360+ - series : ' kube_node_status_allocatable{cluster="kubernetes", node="n2", resource="cpu", job="kube-state-metrics"}'
1361+ values : ' 1.9x10'
1362+ - series : ' kube_node_info{cluster="kubernetes", node="n1", job="kube-state-metrics"}'
1363+ values : ' 1x10'
1364+ - series : ' kube_node_info{cluster="kubernetes", node="n2", job="kube-state-metrics"}'
1365+ values : ' 1x10'
1366+ alert_rule_test :
1367+ - eval_time : 9m # no exp_alerts listed: the alert must not be firing at this time
1368+ alertname : KubeCPUOvercommit
1369+ - eval_time : 10m # the alert is expected to be firing at this time
1370+ alertname : KubeCPUOvercommit
1371+ exp_alerts :
1372+ - exp_labels :
1373+ severity : warning
1374+ exp_annotations : # NOTE(review): 2.1 presumably = 4 requested - (3.8 total allocatable - 1.9 largest node); confirm against the alert expression
1375+ description : Cluster has overcommitted CPU resource requests for Pods by 2.1 CPU shares and cannot tolerate node failure.
1376+ runbook_url : https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubecpuovercommit
1377+ summary : Cluster has overcommitted CPU resource requests.
1378+
1379+ - name : KubeMemoryOvercommit alert (single-node)
1380+ interval : 1m # key of the named test group above (previously started a separate, unnamed list item)
1381+ input_series : # two namespace request series (1e9 each, 2e9 in total) against a single node with 1e9 allocatable
1382+ - series : ' namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
1383+ values : ' 1000000000x10' # 1 GB
1384+ - series : ' namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
1385+ values : ' 1000000000x10'
1386+ - series : ' kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="memory", job="kube-state-metrics"}'
1387+ values : ' 1000000000x10'
1388+ - series : ' kube_node_info{cluster="kubernetes", node="n1", job="kube-state-metrics"}'
1389+ values : ' 1x10'
1390+ alert_rule_test :
1391+ - eval_time : 9m # no exp_alerts listed: the alert must not be firing at this time
1392+ alertname : KubeMemoryOvercommit
1393+ - eval_time : 10m # the alert is expected to be firing at this time
1394+ alertname : KubeMemoryOvercommit
1395+ exp_alerts :
1396+ - exp_labels :
1397+ severity : warning
1398+ exp_annotations : # NOTE(review): 1.15G presumably = 2e9 requested - 0.85 * 1e9 allocatable; confirm against the alert expression
1399+ description : Cluster has overcommitted memory resource requests for Pods by 1.15G bytes and cannot tolerate node failure.
1400+ runbook_url : https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubememoryovercommit
1401+ summary : Cluster has overcommitted memory resource requests.
1402+
1403+ - name : KubeMemoryOvercommit alert (multi-node)
1404+ interval : 1m # key of the named test group above (previously started a separate, unnamed list item)
1405+ input_series : # two namespace request series (2e9 each, 4e9 in total) against two nodes of 1e9 allocatable each
1406+ - series : ' namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
1407+ values : ' 2000000000x10' # 2 GB
1408+ - series : ' namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
1409+ values : ' 2000000000x10'
1410+ - series : ' kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="memory", job="kube-state-metrics"}'
1411+ values : ' 1000000000x10'
1412+ - series : ' kube_node_status_allocatable{cluster="kubernetes", node="n2", resource="memory", job="kube-state-metrics"}'
1413+ values : ' 1000000000x10'
1414+ - series : ' kube_node_info{cluster="kubernetes", node="n1", job="kube-state-metrics"}'
1415+ values : ' 1x10'
1416+ - series : ' kube_node_info{cluster="kubernetes", node="n2", job="kube-state-metrics"}'
1417+ values : ' 1x10'
1418+ alert_rule_test :
1419+ - eval_time : 9m # no exp_alerts listed: the alert must not be firing at this time
1420+ alertname : KubeMemoryOvercommit
1421+ - eval_time : 10m # the alert is expected to be firing at this time
1422+ alertname : KubeMemoryOvercommit
1423+ exp_alerts :
1424+ - exp_labels :
1425+ severity : warning
1426+ exp_annotations : # NOTE(review): 3G presumably = 4e9 requested - (2e9 total allocatable - 1e9 largest node); confirm against the alert expression
1427+ description : Cluster has overcommitted memory resource requests for Pods by 3G bytes and cannot tolerate node failure.
1428+ runbook_url : https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubememoryovercommit
1429+ summary : Cluster has overcommitted memory resource requests.
0 commit comments