Skip to content

Commit 7a3d3b7

Browse files
cluster monitoring components
1 parent 37c562c commit 7a3d3b7

File tree

10 files changed

+3232
-1694
lines changed

10 files changed

+3232
-1694
lines changed

prometheus-monitoring/kubernetes/1.14.8/grafana/grafana.dashboards.configmap.yaml

Lines changed: 2915 additions & 1684 deletions
Large diffs are not rendered by default.
Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,15 @@
---
# Binds the cluster-scoped "kube-state-metrics" ClusterRole to the
# "kube-state-metrics" ServiceAccount that lives in the "monitoring" namespace.
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRoleBinding
metadata:
  name: kube-state-metrics
  labels:
    app.kubernetes.io/name: kube-state-metrics
    app.kubernetes.io/version: v1.8.0
# Who receives the permissions.
subjects:
  - kind: ServiceAccount
    name: kube-state-metrics
    namespace: monitoring
# Which role is granted.
roleRef:
  apiGroup: rbac.authorization.k8s.io
  kind: ClusterRole
  name: kube-state-metrics
Lines changed: 110 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,110 @@
---
# Cluster-wide permissions for kube-state-metrics. Almost every rule is
# read-only (list + watch); the two exceptions are the "create" rules for
# TokenReview and SubjectAccessReview further down.
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRole
metadata:
  name: kube-state-metrics
  labels:
    app.kubernetes.io/name: kube-state-metrics
    app.kubernetes.io/version: v1.8.0
rules:
  # Core ("") API group objects.
  - apiGroups: [""]
    resources:
      - configmaps
      - secrets
      - nodes
      - pods
      - services
      - resourcequotas
      - replicationcontrollers
      - limitranges
      - persistentvolumeclaims
      - persistentvolumes
      - namespaces
      - endpoints
    verbs: [list, watch]

  # Workload and ingress objects served from the "extensions" group.
  - apiGroups: [extensions]
    resources:
      - daemonsets
      - deployments
      - replicasets
      - ingresses
    verbs: [list, watch]

  # Workload objects served from the "apps" group.
  - apiGroups: [apps]
    resources:
      - statefulsets
      - daemonsets
      - deployments
      - replicasets
    verbs: [list, watch]

  - apiGroups: [batch]
    resources:
      - cronjobs
      - jobs
    verbs: [list, watch]

  - apiGroups: [autoscaling]
    resources:
      - horizontalpodautoscalers
    verbs: [list, watch]

  # NOTE(review): the next two rules grant "create", not list/watch. Such
  # rules are typically only needed when an authenticating proxy fronts the
  # metrics endpoint; the Deployment in this commit defines a single
  # kube-state-metrics container and no proxy - confirm they are required.
  - apiGroups: [authentication.k8s.io]
    resources:
      - tokenreviews
    verbs: [create]

  - apiGroups: [authorization.k8s.io]
    resources:
      - subjectaccessreviews
    verbs: [create]

  - apiGroups: [policy]
    resources:
      - poddisruptionbudgets
    verbs: [list, watch]

  - apiGroups: [certificates.k8s.io]
    resources:
      - certificatesigningrequests
    verbs: [list, watch]

  - apiGroups: [storage.k8s.io]
    resources:
      - storageclasses
      - volumeattachments
    verbs: [list, watch]

  - apiGroups: [admissionregistration.k8s.io]
    resources:
      - mutatingwebhookconfigurations
      - validatingwebhookconfigurations
    verbs: [list, watch]

  - apiGroups: [networking.k8s.io]
    resources:
      - networkpolicies
    verbs: [list, watch]
Lines changed: 42 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,42 @@
---
# Runs one replica of kube-state-metrics v1.8.0 under the
# "kube-state-metrics" ServiceAccount.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: kube-state-metrics
  # Pinned explicitly: the ClusterRoleBinding for kube-state-metrics names the
  # ServiceAccount in "monitoring", and the kube-state-metrics ServiceMonitor
  # only discovers Services in "monitoring". Without this field the object
  # lands in whatever namespace the apply command happens to use.
  namespace: monitoring
  labels:
    k8s-app: kube-state-metrics
    app.kubernetes.io/name: kube-state-metrics
    app.kubernetes.io/version: v1.8.0
spec:
  replicas: 1
  selector:
    matchLabels:
      app.kubernetes.io/name: kube-state-metrics
  template:
    metadata:
      labels:
        app.kubernetes.io/name: kube-state-metrics
        app.kubernetes.io/version: v1.8.0
    spec:
      serviceAccountName: kube-state-metrics
      # Schedule only onto Linux nodes.
      nodeSelector:
        kubernetes.io/os: linux
      containers:
        - name: kube-state-metrics
          image: quay.io/coreos/kube-state-metrics:v1.8.0
          ports:
            # Port names are referenced by the Service's targetPort fields.
            - name: http-metrics
              containerPort: 8080
            - name: telemetry
              containerPort: 8081
          # Liveness is checked on the metrics port (8080) ...
          livenessProbe:
            httpGet:
              path: /healthz
              port: 8080
            initialDelaySeconds: 5
            timeoutSeconds: 5
          # ... readiness on the telemetry port (8081).
          readinessProbe:
            httpGet:
              path: /
              port: 8081
            initialDelaySeconds: 5
            timeoutSeconds: 5
Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,7 @@
---
# Identity the kube-state-metrics pod runs as.
apiVersion: v1
kind: ServiceAccount
metadata:
  name: kube-state-metrics
  # Pinned explicitly: the kube-state-metrics ClusterRoleBinding grants its
  # role to the ServiceAccount named "kube-state-metrics" in "monitoring"
  # only, so an account created in any other namespace gets no permissions.
  namespace: monitoring
  labels:
    app.kubernetes.io/name: kube-state-metrics
    app.kubernetes.io/version: v1.8.0
Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,22 @@
---
# Tells the Prometheus Operator to scrape Services labelled
# k8s-app=kube-state-metrics in the "monitoring" namespace.
apiVersion: monitoring.coreos.com/v1
kind: ServiceMonitor
metadata:
  name: kube-state-metrics
  labels:
    prometheus: cluster-monitoring
    k8s-app: kube-state-metrics
spec:
  # jobLabel must name a *label key* on the selected Service. The previous
  # value ("kube-state-metrics") is not a label key on that Service, so the job
  # name was only correct through the operator's fall-back to the Service
  # name. "k8s-app" is a real label on the Service and resolves to the same
  # job value, "kube-state-metrics".
  jobLabel: k8s-app
  # Copy the Service's "cluster" label onto every scraped series.
  targetLabels:
    - cluster
  selector:
    matchLabels:
      k8s-app: kube-state-metrics
  namespaceSelector:
    matchNames:
      - monitoring
  endpoints:
    - port: http-metrics
      scheme: http
      interval: 60s
      # Keep the labels exposed by the target instead of overwriting them
      # with the scrape target's own labels.
      honorLabels: true
Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
---
# Headless Service (clusterIP: None) exposing the kube-state-metrics pod's
# two named ports.
apiVersion: v1
kind: Service
metadata:
  name: kube-state-metrics
  # Pinned explicitly: the kube-state-metrics ServiceMonitor restricts
  # discovery to the "monitoring" namespace, so a Service created anywhere
  # else would never be scraped.
  namespace: monitoring
  labels:
    app.kubernetes.io/name: kube-state-metrics
    app.kubernetes.io/version: v1.8.0
    # Matched by the kube-state-metrics ServiceMonitor's selector.
    k8s-app: kube-state-metrics
    # Propagated to scraped series through the ServiceMonitor's targetLabels.
    # NOTE(review): environment-specific value - confirm per cluster.
    cluster: docker-for-desktop
spec:
  clusterIP: None
  selector:
    app.kubernetes.io/name: kube-state-metrics
  ports:
    - name: http-metrics
      port: 8080
      targetPort: http-metrics
    - name: telemetry
      port: 8081
      targetPort: telemetry
Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
---
# Scrapes the API server through the Service in the "default" namespace that
# is labelled component=apiserver, provider=kubernetes.
apiVersion: monitoring.coreos.com/v1
kind: ServiceMonitor
metadata:
  name: kube-apiserver
  labels:
    prometheus: cluster-monitoring
    k8s-app: apiserver
spec:
  # The job name is taken from the Service's "component" label.
  jobLabel: component
  namespaceSelector:
    matchNames:
      - default
  selector:
    matchLabels:
      component: apiserver
      provider: kubernetes
  endpoints:
    - port: https
      scheme: https
      interval: 60s
      # Authenticate with the mounted service-account token and verify the
      # server certificate against the mounted service-account CA bundle.
      bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
      tlsConfig:
        caFile: /var/run/secrets/kubernetes.io/serviceaccount/ca.crt
        serverName: kubernetes
Lines changed: 77 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,77 @@
---
# Scrapes the kubelet through the Service labelled k8s-app=kubelet in
# "kube-system". Two endpoints share the "https-metrics" port: the first sets
# no path, the second sets /metrics/cadvisor.
apiVersion: monitoring.coreos.com/v1
kind: ServiceMonitor
metadata:
  name: kubelet
  namespace: monitoring
  labels:
    k8s-app: kubelet
spec:
  jobLabel: k8s-app
  namespaceSelector:
    matchNames:
      - kube-system
  selector:
    matchLabels:
      k8s-app: kubelet
  endpoints:
    # --- Endpoint 1: no explicit path ------------------------------------
    - port: https-metrics
      scheme: https
      interval: 30s
      honorLabels: true
      bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
      tlsConfig:
        # The serving certificate is not verified.
        insecureSkipVerify: true
      # Record the scraped path in a "metrics_path" label.
      relabelings:
        - sourceLabels: [__metrics_path__]
          targetLabel: metrics_path
      # Drop the series whose names match the patterns below.
      # Every regex must stay on ONE physical line: a plain YAML scalar that
      # continues on a second line is folded with a space, which would
      # corrupt the alternative at the break.
      metricRelabelings:
        - action: drop
          sourceLabels: [__name__]
          regex: kubelet_(pod_worker_latency_microseconds|pod_start_latency_microseconds|cgroup_manager_latency_microseconds|pod_worker_start_latency_microseconds|pleg_relist_latency_microseconds|pleg_relist_interval_microseconds|runtime_operations|runtime_operations_latency_microseconds|runtime_operations_errors|eviction_stats_age_microseconds|device_plugin_registration_count|device_plugin_alloc_latency_microseconds|network_plugin_operations_latency_microseconds)
        - action: drop
          sourceLabels: [__name__]
          regex: scheduler_(e2e_scheduling_latency_microseconds|scheduling_algorithm_predicate_evaluation|scheduling_algorithm_priority_evaluation|scheduling_algorithm_preemption_evaluation|scheduling_algorithm_latency_microseconds|binding_latency_microseconds|scheduling_latency_seconds)
        - action: drop
          sourceLabels: [__name__]
          regex: apiserver_(request_count|request_latencies|request_latencies_summary|dropped_requests|storage_data_key_generation_latencies_microseconds|storage_transformation_failures_total|storage_transformation_latencies_microseconds|proxy_tunnel_sync_latency_secs)
        - action: drop
          sourceLabels: [__name__]
          regex: kubelet_docker_(operations|operations_latency_microseconds|operations_errors|operations_timeout)
        - action: drop
          sourceLabels: [__name__]
          regex: reflector_(items_per_list|items_per_watch|list_duration_seconds|lists_total|short_watches_total|watch_duration_seconds|watches_total)
        - action: drop
          sourceLabels: [__name__]
          regex: etcd_(helper_cache_hit_count|helper_cache_miss_count|helper_cache_entry_count|request_cache_get_latencies_summary|request_cache_add_latencies_summary|request_latencies_summary)
        - action: drop
          sourceLabels: [__name__]
          regex: transformation_(transformation_latencies_microseconds|failures_total)
        - action: drop
          sourceLabels: [__name__]
          regex: (admission_quota_controller_adds|crd_autoregistration_controller_work_duration|APIServiceOpenAPIAggregationControllerQueue1_adds|AvailableConditionController_retries|crd_openapi_controller_unfinished_work_seconds|APIServiceRegistrationController_retries|admission_quota_controller_longest_running_processor_microseconds|crdEstablishing_longest_running_processor_microseconds|crdEstablishing_unfinished_work_seconds|crd_openapi_controller_adds|crd_autoregistration_controller_retries|crd_finalizer_queue_latency|AvailableConditionController_work_duration|non_structural_schema_condition_controller_depth|crd_autoregistration_controller_unfinished_work_seconds|AvailableConditionController_adds|DiscoveryController_longest_running_processor_microseconds|autoregister_queue_latency|crd_autoregistration_controller_adds|non_structural_schema_condition_controller_work_duration|APIServiceRegistrationController_adds|crd_finalizer_work_duration|crd_naming_condition_controller_unfinished_work_seconds|crd_openapi_controller_longest_running_processor_microseconds|DiscoveryController_adds|crd_autoregistration_controller_longest_running_processor_microseconds|autoregister_unfinished_work_seconds|crd_naming_condition_controller_queue_latency|crd_naming_condition_controller_retries|non_structural_schema_condition_controller_queue_latency|crd_naming_condition_controller_depth|AvailableConditionController_longest_running_processor_microseconds|crdEstablishing_depth|crd_finalizer_longest_running_processor_microseconds|crd_naming_condition_controller_adds|APIServiceOpenAPIAggregationControllerQueue1_longest_running_processor_microseconds|DiscoveryController_queue_latency|DiscoveryController_unfinished_work_seconds|crd_openapi_controller_depth|APIServiceOpenAPIAggregationControllerQueue1_queue_latency|APIServiceOpenAPIAggregationControllerQueue1_unfinished_work_seconds|DiscoveryController_work_duration|autoregister_adds|crd_autoregistration_controller_queue_latency|crd_finalizer_retries|AvailableConditionController_unfinished_work_seconds|autoregister_longest_running_processor_microseconds|non_structural_schema_condition_controller_unfinished_work_seconds|APIServiceOpenAPIAggregationControllerQueue1_depth|AvailableConditionController_depth|DiscoveryController_retries|admission_quota_controller_depth|crdEstablishing_adds|APIServiceOpenAPIAggregationControllerQueue1_retries|crdEstablishing_queue_latency|non_structural_schema_condition_controller_longest_running_processor_microseconds|autoregister_work_duration|crd_openapi_controller_retries|APIServiceRegistrationController_work_duration|crdEstablishing_work_duration|crd_finalizer_adds|crd_finalizer_depth|crd_openapi_controller_queue_latency|APIServiceOpenAPIAggregationControllerQueue1_work_duration|APIServiceRegistrationController_queue_latency|crd_autoregistration_controller_depth|AvailableConditionController_queue_latency|admission_quota_controller_queue_latency|crd_naming_condition_controller_work_duration|crd_openapi_controller_work_duration|DiscoveryController_depth|crd_naming_condition_controller_longest_running_processor_microseconds|APIServiceRegistrationController_depth|APIServiceRegistrationController_longest_running_processor_microseconds|crd_finalizer_unfinished_work_seconds|crdEstablishing_retries|admission_quota_controller_unfinished_work_seconds|non_structural_schema_condition_controller_adds|APIServiceRegistrationController_unfinished_work_seconds|admission_quota_controller_work_duration|autoregister_depth|autoregister_retries|kubeproxy_sync_proxy_rules_latency_microseconds|rest_client_request_latency_seconds|non_structural_schema_condition_controller_retries)

    # --- Endpoint 2: /metrics/cadvisor ------------------------------------
    - port: https-metrics
      path: /metrics/cadvisor
      scheme: https
      interval: 30s
      honorLabels: true
      bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
      tlsConfig:
        # The serving certificate is not verified.
        insecureSkipVerify: true
      # Record the scraped path in a "metrics_path" label.
      relabelings:
        - sourceLabels: [__metrics_path__]
          targetLabel: metrics_path
      metricRelabelings:
        - action: drop
          sourceLabels: [__name__]
          regex: container_(network_tcp_usage_total|network_udp_usage_total|tasks_state|cpu_load_average_10s)

prometheus-monitoring/kubernetes/1.14.8/prometheus-standalone/prometheus.yaml

Lines changed: 0 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -16,16 +16,6 @@ spec:
1616
operator: In
1717
values:
1818
- apps
19-
# - kube-state-metrics
20-
# - apiserver
21-
# - kubelet
22-
# ruleSelector:
23-
# matchLabels:
24-
# role: alert-rules
25-
# prometheus: k8s
26-
# resources:
27-
# requests:
28-
# memory: 400Mi
2919
---
3020
apiVersion: v1
3121
kind: ServiceAccount

0 commit comments

Comments
 (0)