Skip to content

Commit 758d714

Browse files
committed
fixup! Use kube-scheduler's metrics instead of kube-state-metrics
1 parent 9ddfce6 commit 758d714

File tree

7 files changed: 31 additions and 31 deletions.

dashboards/resources/multi-cluster.libsonnet

Lines changed: 12 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -26,23 +26,23 @@ local g = import 'github.com/grafana/jsonnet-libs/grafana-builder/grafana.libson
2626
)
2727
.addPanel(
2828
g.panel('CPU Requests Commitment') +
29-
g.statPanel('sum(kube_pod_resource_requests{%(kubeStateMetricsSelector)s, resource="cpu"}) / sum(kube_node_status_allocatable{%(kubeStateMetricsSelector)s, resource="cpu"})' % $._config)
29+
g.statPanel('sum(kube_pod_resource_requests{%(kubeSchedulerSelector)s, resource="cpu"}) / sum(kube_node_status_allocatable{%(kubeSchedulerSelector)s, resource="cpu"})' % $._config)
3030
)
3131
.addPanel(
3232
g.panel('CPU Limits Commitment') +
33-
g.statPanel('sum(kube_pod_resource_limits{%(kubeStateMetricsSelector)s, resource="cpu"}) / sum(kube_node_status_allocatable{%(kubeStateMetricsSelector)s, resource="cpu"})' % $._config)
33+
g.statPanel('sum(kube_pod_resource_limits{%(kubeSchedulerSelector)s, resource="cpu"}) / sum(kube_node_status_allocatable{%(kubeSchedulerSelector)s, resource="cpu"})' % $._config)
3434
)
3535
.addPanel(
3636
g.panel('Memory Utilisation') +
3737
g.statPanel('1 - sum(:node_memory_MemAvailable_bytes:sum) / sum(node_memory_MemTotal_bytes{%(nodeExporterSelector)s})' % $._config)
3838
)
3939
.addPanel(
4040
g.panel('Memory Requests Commitment') +
41-
g.statPanel('sum(kube_pod_resource_requests{%(kubeStateMetricsSelector)s, resource="memory"}) / sum(kube_node_status_allocatable{%(kubeStateMetricsSelector)s, resource="memory"})' % $._config)
41+
g.statPanel('sum(kube_pod_resource_requests{%(kubeSchedulerSelector)s, resource="memory"}) / sum(kube_node_status_allocatable{%(kubeSchedulerSelector)s, resource="memory"})' % $._config)
4242
)
4343
.addPanel(
4444
g.panel('Memory Limits Commitment') +
45-
g.statPanel('sum(kube_pod_resource_limits{%(kubeStateMetricsSelector)s, resource="memory"}) / sum(kube_node_status_allocatable{%(kubeStateMetricsSelector)s, resource="memory"})' % $._config)
45+
g.statPanel('sum(kube_pod_resource_limits{%(kubeSchedulerSelector)s, resource="memory"}) / sum(kube_node_status_allocatable{%(kubeSchedulerSelector)s, resource="memory"})' % $._config)
4646
)
4747
)
4848
.addRow(
@@ -59,10 +59,10 @@ local g = import 'github.com/grafana/jsonnet-libs/grafana-builder/grafana.libson
5959
g.panel('CPU Quota') +
6060
g.tablePanel([
6161
'sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate) by (%(clusterLabel)s)' % $._config,
62-
'sum(kube_pod_resource_requests{%(kubeStateMetricsSelector)s, resource="cpu"}) by (%(clusterLabel)s)' % $._config,
63-
'sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate) by (%(clusterLabel)s) / sum(kube_pod_resource_requests{%(kubeStateMetricsSelector)s, resource="cpu"}) by (%(clusterLabel)s)' % $._config,
64-
'sum(kube_pod_resource_limits{%(kubeStateMetricsSelector)s, resource="cpu"}) by (%(clusterLabel)s)' % $._config,
65-
'sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate) by (%(clusterLabel)s) / sum(kube_pod_resource_limits{%(kubeStateMetricsSelector)s, resource="cpu"}) by (%(clusterLabel)s)' % $._config,
62+
'sum(kube_pod_resource_requests{%(kubeSchedulerSelector)s, resource="cpu"}) by (%(clusterLabel)s)' % $._config,
63+
'sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate) by (%(clusterLabel)s) / sum(kube_pod_resource_requests{%(kubeSchedulerSelector)s, resource="cpu"}) by (%(clusterLabel)s)' % $._config,
64+
'sum(kube_pod_resource_limits{%(kubeSchedulerSelector)s, resource="cpu"}) by (%(clusterLabel)s)' % $._config,
65+
'sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate) by (%(clusterLabel)s) / sum(kube_pod_resource_limits{%(kubeSchedulerSelector)s, resource="cpu"}) by (%(clusterLabel)s)' % $._config,
6666
], tableStyles {
6767
'Value #A': { alias: 'CPU Usage' },
6868
'Value #B': { alias: 'CPU Requests' },
@@ -88,10 +88,10 @@ local g = import 'github.com/grafana/jsonnet-libs/grafana-builder/grafana.libson
8888
g.tablePanel([
8989
// Not using container_memory_usage_bytes here because that includes page cache
9090
'sum(container_memory_rss{%(cadvisorSelector)s, container!=""}) by (%(clusterLabel)s)' % $._config,
91-
'sum(kube_pod_resource_requests{%(kubeStateMetricsSelector)s, resource="memory"}) by (%(clusterLabel)s)' % $._config,
92-
'sum(container_memory_rss{%(cadvisorSelector)s, container!=""}) by (%(clusterLabel)s) / sum(kube_pod_resource_requests{%(kubeStateMetricsSelector)s, resource="memory"}) by (%(clusterLabel)s)' % $._config,
93-
'sum(kube_pod_resource_limits{%(kubeStateMetricsSelector)s, resource="memory"}) by (%(clusterLabel)s)' % $._config,
94-
'sum(container_memory_rss{%(cadvisorSelector)s, container!=""}) by (%(clusterLabel)s) / sum(kube_pod_resource_limits{%(kubeStateMetricsSelector)s, resource="memory"}) by (%(clusterLabel)s)' % $._config,
91+
'sum(kube_pod_resource_requests{%(kubeSchedulerSelector)s, resource="memory"}) by (%(clusterLabel)s)' % $._config,
92+
'sum(container_memory_rss{%(cadvisorSelector)s, container!=""}) by (%(clusterLabel)s) / sum(kube_pod_resource_requests{%(kubeSchedulerSelector)s, resource="memory"}) by (%(clusterLabel)s)' % $._config,
93+
'sum(kube_pod_resource_limits{%(kubeSchedulerSelector)s, resource="memory"}) by (%(clusterLabel)s)' % $._config,
94+
'sum(container_memory_rss{%(cadvisorSelector)s, container!=""}) by (%(clusterLabel)s) / sum(kube_pod_resource_limits{%(kubeSchedulerSelector)s, resource="memory"}) by (%(clusterLabel)s)' % $._config,
9595
], tableStyles {
9696
'Value #A': { alias: 'Memory Usage', unit: 'bytes' },
9797
'Value #B': { alias: 'Memory Requests', unit: 'bytes' },

dashboards/resources/namespace.libsonnet

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -141,19 +141,19 @@ local template = grafana.template;
141141
})
142142
.addPanel(
143143
g.panel('CPU Utilisation (from requests)') +
144-
g.statPanel('sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{%(clusterLabel)s="$cluster", namespace="$namespace"}) / sum(kube_pod_resource_requests{%(kubeStateMetricsSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="cpu"})' % $._config)
144+
g.statPanel('sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{%(clusterLabel)s="$cluster", namespace="$namespace"}) / sum(kube_pod_resource_requests{%(kubeSchedulerSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="cpu"})' % $._config)
145145
)
146146
.addPanel(
147147
g.panel('CPU Utilisation (from limits)') +
148-
g.statPanel('sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{%(clusterLabel)s="$cluster", namespace="$namespace"}) / sum(kube_pod_resource_limits{%(kubeStateMetricsSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="cpu"})' % $._config)
148+
g.statPanel('sum(node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{%(clusterLabel)s="$cluster", namespace="$namespace"}) / sum(kube_pod_resource_limits{%(kubeSchedulerSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="cpu"})' % $._config)
149149
)
150150
.addPanel(
151151
g.panel('Memory Utilisation (from requests)') +
152-
g.statPanel('sum(container_memory_working_set_bytes{%(cadvisorSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace",container!="", image!=""}) / sum(kube_pod_resource_requests{%(kubeStateMetricsSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="memory"})' % $._config)
152+
g.statPanel('sum(container_memory_working_set_bytes{%(cadvisorSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace",container!="", image!=""}) / sum(kube_pod_resource_requests{%(kubeSchedulerSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="memory"})' % $._config)
153153
)
154154
.addPanel(
155155
g.panel('Memory Utilisation (from limits)') +
156-
g.statPanel('sum(container_memory_working_set_bytes{%(cadvisorSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace",container!="", image!=""}) / sum(kube_pod_resource_limits{%(kubeStateMetricsSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="memory"})' % $._config)
156+
g.statPanel('sum(container_memory_working_set_bytes{%(cadvisorSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace",container!="", image!=""}) / sum(kube_pod_resource_limits{%(kubeSchedulerSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="memory"})' % $._config)
157157
)
158158
)
159159
.addRow(

dashboards/resources/pod.libsonnet

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -50,7 +50,7 @@ local template = grafana.template;
5050

5151
local cpuRequestsQuery = |||
5252
sum(
53-
kube_pod_resource_requests{%(kubeStateMetricsSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", pod="$pod", resource="cpu"}
53+
kube_pod_resource_requests{%(kubeSchedulerSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", pod="$pod", resource="cpu"}
5454
)
5555
||| % $._config;
5656

dashboards/resources/workload-namespace.libsonnet

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -137,7 +137,7 @@ local template = grafana.template;
137137

138138
local cpuRequestsQuery = |||
139139
sum(
140-
kube_pod_resource_requests{%(kubeStateMetricsSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="cpu"}
140+
kube_pod_resource_requests{%(kubeSchedulerSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="cpu"}
141141
* on(namespace,pod)
142142
group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{%(clusterLabel)s="$cluster", namespace="$namespace", workload_type="$type"}
143143
) by (workload, workload_type)

dashboards/resources/workload.libsonnet

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -135,7 +135,7 @@ local template = grafana.template;
135135

136136
local cpuRequestsQuery = |||
137137
sum(
138-
kube_pod_resource_requests{%(kubeStateMetricsSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="cpu"}
138+
kube_pod_resource_requests{%(kubeSchedulerSelector)s, %(clusterLabel)s="$cluster", namespace="$namespace", resource="cpu"}
139139
* on(namespace,pod)
140140
group_left(workload, workload_type) namespace_workload_pod:kube_pod_owner:relabel{%(clusterLabel)s="$cluster", namespace="$namespace", workload="$workload", workload_type="$type"}
141141
) by (pod)

rules/apps.libsonnet

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -61,7 +61,7 @@
6161
{
6262
record: 'cluster:namespace:pod_memory:active:kube_pod_resource_requests',
6363
expr: |||
64-
kube_pod_resource_requests{resource="memory",%(kubeStateMetricsSelector)s} * on (namespace, pod, %(clusterLabel)s)
64+
kube_pod_resource_requests{resource="memory",%(kubeSchedulerSelector)s} * on (namespace, pod, %(clusterLabel)s)
6565
group_left() max by (namespace, pod, %(clusterLabel)s) (
6666
(kube_pod_status_phase{phase=~"Pending|Running"} == 1)
6767
)
@@ -73,7 +73,7 @@
7373
sum by (namespace, %(clusterLabel)s) (
7474
sum by (namespace, pod, %(clusterLabel)s) (
7575
max by (namespace, pod, container, %(clusterLabel)s) (
76-
kube_pod_resource_requests{resource="memory",%(kubeStateMetricsSelector)s}
76+
kube_pod_resource_requests{resource="memory",%(kubeSchedulerSelector)s}
7777
) * on(namespace, pod, %(clusterLabel)s) group_left() max by (namespace, pod, %(clusterLabel)s) (
7878
kube_pod_status_phase{phase=~"Pending|Running"} == 1
7979
)
@@ -84,7 +84,7 @@
8484
{
8585
record: 'cluster:namespace:pod_cpu:active:kube_pod_resource_requests',
8686
expr: |||
87-
kube_pod_resource_requests{resource="cpu",%(kubeStateMetricsSelector)s} * on (namespace, pod, %(clusterLabel)s)
87+
kube_pod_resource_requests{resource="cpu",%(kubeSchedulerSelector)s} * on (namespace, pod, %(clusterLabel)s)
8888
group_left() max by (namespace, pod, %(clusterLabel)s) (
8989
(kube_pod_status_phase{phase=~"Pending|Running"} == 1)
9090
)
@@ -96,7 +96,7 @@
9696
sum by (namespace, %(clusterLabel)s) (
9797
sum by (namespace, pod, %(clusterLabel)s) (
9898
max by (namespace, pod, container, %(clusterLabel)s) (
99-
kube_pod_resource_requests{resource="cpu",%(kubeStateMetricsSelector)s}
99+
kube_pod_resource_requests{resource="cpu",%(kubeSchedulerSelector)s}
100100
) * on(namespace, pod, %(clusterLabel)s) group_left() max by (namespace, pod, %(clusterLabel)s) (
101101
kube_pod_status_phase{phase=~"Pending|Running"} == 1
102102
)
@@ -107,7 +107,7 @@
107107
{
108108
record: 'cluster:namespace:pod_memory:active:kube_pod_resource_limits',
109109
expr: |||
110-
kube_pod_resource_limits{resource="memory",%(kubeStateMetricsSelector)s} * on (namespace, pod, %(clusterLabel)s)
110+
kube_pod_resource_limits{resource="memory",%(kubeSchedulerSelector)s} * on (namespace, pod, %(clusterLabel)s)
111111
group_left() max by (namespace, pod, %(clusterLabel)s) (
112112
(kube_pod_status_phase{phase=~"Pending|Running"} == 1)
113113
)
@@ -119,7 +119,7 @@
119119
sum by (namespace, %(clusterLabel)s) (
120120
sum by (namespace, pod, %(clusterLabel)s) (
121121
max by (namespace, pod, container, %(clusterLabel)s) (
122-
kube_pod_resource_limits{resource="memory",%(kubeStateMetricsSelector)s}
122+
kube_pod_resource_limits{resource="memory",%(kubeSchedulerSelector)s}
123123
) * on(namespace, pod, %(clusterLabel)s) group_left() max by (namespace, pod, %(clusterLabel)s) (
124124
kube_pod_status_phase{phase=~"Pending|Running"} == 1
125125
)
@@ -130,7 +130,7 @@
130130
{
131131
record: 'cluster:namespace:pod_cpu:active:kube_pod_resource_limits',
132132
expr: |||
133-
kube_pod_resource_limits{resource="cpu",%(kubeStateMetricsSelector)s} * on (namespace, pod, %(clusterLabel)s)
133+
kube_pod_resource_limits{resource="cpu",%(kubeSchedulerSelector)s} * on (namespace, pod, %(clusterLabel)s)
134134
group_left() max by (namespace, pod, %(clusterLabel)s) (
135135
(kube_pod_status_phase{phase=~"Pending|Running"} == 1)
136136
)
@@ -142,7 +142,7 @@
142142
sum by (namespace, %(clusterLabel)s) (
143143
sum by (namespace, pod, %(clusterLabel)s) (
144144
max by (namespace, pod, container, %(clusterLabel)s) (
145-
kube_pod_resource_limits{resource="cpu",%(kubeStateMetricsSelector)s}
145+
kube_pod_resource_limits{resource="cpu",%(kubeSchedulerSelector)s}
146146
) * on(namespace, pod, %(clusterLabel)s) group_left() max by (namespace, pod, %(clusterLabel)s) (
147147
kube_pod_status_phase{phase=~"Pending|Running"} == 1
148148
)

rules/windows.libsonnet

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -217,28 +217,28 @@
217217
record: 'kube_pod_windows_container_resource_memory_request',
218218
expr: |||
219219
max by (namespace, pod, container) (
220-
kube_pod_resource_requests{resource="memory",%(kubeStateMetricsSelector)s}
220+
kube_pod_resource_requests{resource="memory",%(kubeSchedulerSelector)s}
221221
) * on(container,pod,namespace) (windows_pod_container_available)
222222
||| % $._config,
223223
},
224224
{
225225
record: 'kube_pod_windows_container_resource_memory_limit',
226226
expr: |||
227-
kube_pod_resource_limits{resource="memory",%(kubeStateMetricsSelector)s} * on(container,pod,namespace) (windows_pod_container_available)
227+
kube_pod_resource_limits{resource="memory",%(kubeSchedulerSelector)s} * on(container,pod,namespace) (windows_pod_container_available)
228228
||| % $._config,
229229
},
230230
{
231231
record: 'kube_pod_windows_container_resource_cpu_cores_request',
232232
expr: |||
233233
max by (namespace, pod, container) (
234-
kube_pod_resource_requests{resource="cpu",%(kubeStateMetricsSelector)s}
234+
kube_pod_resource_requests{resource="cpu",%(kubeSchedulerSelector)s}
235235
) * on(container,pod,namespace) (windows_pod_container_available)
236236
||| % $._config,
237237
},
238238
{
239239
record: 'kube_pod_windows_container_resource_cpu_cores_limit',
240240
expr: |||
241-
kube_pod_resource_limits{resource="cpu",%(kubeStateMetricsSelector)s} * on(container,pod,namespace) (windows_pod_container_available)
241+
kube_pod_resource_limits{resource="cpu",%(kubeSchedulerSelector)s} * on(container,pod,namespace) (windows_pod_container_available)
242242
||| % $._config,
243243
},
244244
{

0 commit comments