Skip to content

Commit 41645e2

Browse files
sklrexagod
authored and committed
test: Add tests for KubeCPUOvercommit and KubeMemoryOvercommit
1 parent 5788ff9 commit 41645e2

File tree

1 file changed

+104
-0
lines changed

1 file changed

+104
-0
lines changed

tests/tests.yaml

Lines changed: 104 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1323,3 +1323,107 @@ tests:
13231323
description: 'Cluster has overcommitted memory resource requests for Namespaces.'
13241324
runbook_url: "https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubememoryquotaovercommit"
13251325
summary: "Cluster has overcommitted memory resource requests."
1326+
1327+
# KubeCPUOvercommit on a single-node cluster.
# Inputs: two namespaces request 1 CPU each (2 in total) while the only
# node, n1, reports 1.9 allocatable CPU.
# `name` and `interval` belong to the same test group so that the name
# labels this test instead of forming a separate, empty group.
# NOTE(review): 0.385 is consistent with 2 - 0.85 * 1.9 — confirm the
# factor against the alert rule expression.
- name: KubeCPUOvercommit alert (single-node)
  interval: 1m
  input_series:
  - series: 'namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
    values: '1x10'
  - series: 'namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
    values: '1x10'
  - series: 'kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="cpu", job="kube-state-metrics"}'
    values: '1.9x10'  # This value was seen on a 2x vCPU node
  - series: 'kube_node_info{cluster="kubernetes", node="n1", job="kube-state-metrics"}'
    values: '1x10'
  alert_rule_test:
  # The 9m check lists no exp_alerts, i.e. nothing may be firing yet.
  - eval_time: 9m
    alertname: KubeCPUOvercommit
  # At 10m exactly one warning is expected.
  - eval_time: 10m
    alertname: KubeCPUOvercommit
    exp_alerts:
    - exp_labels:
        severity: warning
      exp_annotations:
        description: 'Cluster has overcommitted CPU resource requests for Pods by 0.385 CPU shares and cannot tolerate node failure.'
        runbook_url: 'https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubecpuovercommit'
        summary: 'Cluster has overcommitted CPU resource requests.'
1350+
1351+
# KubeCPUOvercommit on a two-node cluster.
# Inputs: two namespaces request 2 CPU each (4 in total); nodes n1 and n2
# each report 1.9 allocatable CPU.
# `name` and `interval` belong to the same test group so that the name
# labels this test instead of forming a separate, empty group.
# NOTE(review): 2.1 is consistent with 4 - (3.8 - 1.9), i.e. requests minus
# the capacity left after losing one node — confirm against the alert rule.
- name: KubeCPUOvercommit alert (multi-node)
  interval: 1m
  input_series:
  - series: 'namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
    values: '2x10'
  - series: 'namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
    values: '2x10'
  - series: 'kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="cpu", job="kube-state-metrics"}'
    values: '1.9x10'  # This value was seen on a 2x vCPU node
  - series: 'kube_node_status_allocatable{cluster="kubernetes", node="n2", resource="cpu", job="kube-state-metrics"}'
    values: '1.9x10'
  - series: 'kube_node_info{cluster="kubernetes", node="n1", job="kube-state-metrics"}'
    values: '1x10'
  - series: 'kube_node_info{cluster="kubernetes", node="n2", job="kube-state-metrics"}'
    values: '1x10'
  alert_rule_test:
  # The 9m check lists no exp_alerts, i.e. nothing may be firing yet.
  - eval_time: 9m
    alertname: KubeCPUOvercommit
  # At 10m exactly one warning is expected.
  - eval_time: 10m
    alertname: KubeCPUOvercommit
    exp_alerts:
    - exp_labels:
        severity: warning
      exp_annotations:
        description: 'Cluster has overcommitted CPU resource requests for Pods by 2.1 CPU shares and cannot tolerate node failure.'
        runbook_url: 'https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubecpuovercommit'
        summary: 'Cluster has overcommitted CPU resource requests.'
1378+
1379+
# KubeMemoryOvercommit on a single-node cluster.
# Inputs: two namespaces request 1 GB each (2 GB in total) while the only
# node, n1, reports 1 GB of allocatable memory.
# `name` and `interval` belong to the same test group so that the name
# labels this test instead of forming a separate, empty group.
# NOTE(review): 1.15G is consistent with 2e9 - 0.85 * 1e9 — confirm the
# factor against the alert rule expression.
- name: KubeMemoryOvercommit alert (single-node)
  interval: 1m
  input_series:
  - series: 'namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
    values: '1000000000x10'  # 1 GB
  - series: 'namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
    values: '1000000000x10'
  - series: 'kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="memory", job="kube-state-metrics"}'
    values: '1000000000x10'
  - series: 'kube_node_info{cluster="kubernetes", node="n1", job="kube-state-metrics"}'
    values: '1x10'
  alert_rule_test:
  # The 9m check lists no exp_alerts, i.e. nothing may be firing yet.
  - eval_time: 9m
    alertname: KubeMemoryOvercommit
  # At 10m exactly one warning is expected.
  - eval_time: 10m
    alertname: KubeMemoryOvercommit
    exp_alerts:
    - exp_labels:
        severity: warning
      exp_annotations:
        description: 'Cluster has overcommitted memory resource requests for Pods by 1.15G bytes and cannot tolerate node failure.'
        runbook_url: 'https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubememoryovercommit'
        summary: 'Cluster has overcommitted memory resource requests.'
1402+
1403+
# KubeMemoryOvercommit on a two-node cluster.
# Inputs: two namespaces request 2 GB each (4 GB in total); nodes n1 and n2
# each report 1 GB of allocatable memory.
# `name` and `interval` belong to the same test group so that the name
# labels this test instead of forming a separate, empty group.
# NOTE(review): 3G is consistent with 4e9 - (2e9 - 1e9), i.e. requests minus
# the capacity left after losing one node — confirm against the alert rule.
- name: KubeMemoryOvercommit alert (multi-node)
  interval: 1m
  input_series:
  - series: 'namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
    values: '2000000000x10'  # 2 GB
  - series: 'namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
    values: '2000000000x10'
  - series: 'kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="memory", job="kube-state-metrics"}'
    values: '1000000000x10'
  - series: 'kube_node_status_allocatable{cluster="kubernetes", node="n2", resource="memory", job="kube-state-metrics"}'
    values: '1000000000x10'
  - series: 'kube_node_info{cluster="kubernetes", node="n1", job="kube-state-metrics"}'
    values: '1x10'
  - series: 'kube_node_info{cluster="kubernetes", node="n2", job="kube-state-metrics"}'
    values: '1x10'
  alert_rule_test:
  # The 9m check lists no exp_alerts, i.e. nothing may be firing yet.
  - eval_time: 9m
    alertname: KubeMemoryOvercommit
  # At 10m exactly one warning is expected.
  - eval_time: 10m
    alertname: KubeMemoryOvercommit
    exp_alerts:
    - exp_labels:
        severity: warning
      exp_annotations:
        description: 'Cluster has overcommitted memory resource requests for Pods by 3G bytes and cannot tolerate node failure.'
        runbook_url: 'https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubememoryovercommit'
        summary: 'Cluster has overcommitted memory resource requests.'

0 commit comments

Comments
 (0)