Skip to content

Commit fa75ff9

Browse files
committed
add alert related deadlock / crashloop panels for core tekton controllers
rh-pre-commit.version: 2.3.0 rh-pre-commit.check-secrets: ENABLED
1 parent ccd582e commit fa75ff9

File tree

1 file changed

+209
-14
lines changed

1 file changed

+209
-14
lines changed

operator/gitops/argocd/grafana/dashboards/pipeline-service-dashboard.json

Lines changed: 209 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@
2121
"type": "grafana",
2222
"id": "grafana",
2323
"name": "Grafana",
24-
"version": "9.1.6"
24+
"version": "10.4.3"
2525
},
2626
{
2727
"type": "panel",
@@ -87,6 +87,7 @@
8787
"y": 0
8888
},
8989
"id": 93,
90+
"panels": [],
9091
"repeat": "datasource",
9192
"title": "Alerts",
9293
"type": "row"
@@ -138,10 +139,12 @@
138139
"fields": "",
139140
"values": false
140141
},
142+
"showPercentChange": false,
141143
"text": {},
142-
"textMode": "auto"
144+
"textMode": "auto",
145+
"wideLayout": true
143146
},
144-
"pluginVersion": "9.1.6",
147+
"pluginVersion": "10.4.3",
145148
"targets": [
146149
{
147150
"editorMode": "code",
@@ -206,9 +209,11 @@
206209
"fields": "",
207210
"values": false
208211
},
209-
"textMode": "auto"
212+
"showPercentChange": false,
213+
"textMode": "auto",
214+
"wideLayout": true
210215
},
211-
"pluginVersion": "9.1.6",
216+
"pluginVersion": "10.4.3",
212217
"targets": [
213218
{
214219
"editorMode": "code",
@@ -221,6 +226,198 @@
221226
"title": "Tekton Execution Overhead",
222227
"type": "stat"
223228
},
229+
{
230+
"description": "The number of times the pipelines controller has restarted",
231+
"fieldConfig": {
232+
"defaults": {
233+
"color": {
234+
"mode": "thresholds"
235+
},
236+
"mappings": [],
237+
"max": 1,
238+
"min": 0,
239+
"noValue": "No data",
240+
"thresholds": {
241+
"mode": "absolute",
242+
"steps": [
243+
{
244+
"color": "green",
245+
"value": null
246+
},
247+
{
248+
"color": "red",
249+
"value": 5
250+
}
251+
]
252+
},
253+
"unit": "none"
254+
},
255+
"overrides": []
256+
},
257+
"gridPos": {
258+
"h": 9,
259+
"w": 4,
260+
"x": 8,
261+
"y": 1
262+
},
263+
"id": 480,
264+
"options": {
265+
"colorMode": "value",
266+
"graphMode": "area",
267+
"justifyMode": "auto",
268+
"orientation": "auto",
269+
"reduceOptions": {
270+
"calcs": [
271+
"lastNotNull"
272+
],
273+
"fields": "",
274+
"values": false
275+
},
276+
"showPercentChange": false,
277+
"textMode": "auto",
278+
"wideLayout": true
279+
},
280+
"pluginVersion": "10.4.3",
281+
"targets": [
282+
{
283+
"editorMode": "code",
284+
"expr": "sum(increase(kube_pod_container_status_restarts_total{namespace=\"openshift-pipelines\", pod=~\"tekton-pipelines-controller-.*\"}[30m]))",
285+
"legendFormat": "__auto",
286+
"range": true,
287+
"refId": "A"
288+
}
289+
],
290+
"title": "Pipieline Controller Restarts",
291+
"type": "stat"
292+
},
293+
{
294+
"description": "Number of PipelineRuns outside of Kubernetes Throttling where the Tekton Controller has yet to attempt to process its correctly defined Task specifications for multiple scan iterations.",
295+
"fieldConfig": {
296+
"defaults": {
297+
"color": {
298+
"mode": "thresholds"
299+
},
300+
"mappings": [],
301+
"max": 1,
302+
"min": 0,
303+
"noValue": "No data",
304+
"thresholds": {
305+
"mode": "absolute",
306+
"steps": [
307+
{
308+
"color": "green",
309+
"value": null
310+
},
311+
{
312+
"color": "red",
313+
"value": 30
314+
}
315+
]
316+
},
317+
"unit": "none"
318+
},
319+
"overrides": []
320+
},
321+
"gridPos": {
322+
"h": 9,
323+
"w": 4,
324+
"x": 12,
325+
"y": 1
326+
},
327+
"id": 481,
328+
"options": {
329+
"colorMode": "value",
330+
"graphMode": "area",
331+
"justifyMode": "auto",
332+
"orientation": "auto",
333+
"reduceOptions": {
334+
"calcs": [
335+
"lastNotNull"
336+
],
337+
"fields": "",
338+
"values": false
339+
},
340+
"showPercentChange": false,
341+
"textMode": "auto",
342+
"wideLayout": true
343+
},
344+
"pluginVersion": "10.4.3",
345+
"targets": [
346+
{
347+
"editorMode": "code",
348+
"expr": "sum(increase(pipelinerun_kickoff_not_attempted_count[30m]))",
349+
"legendFormat": "__auto",
350+
"range": true,
351+
"refId": "A"
352+
}
353+
],
354+
"title": "Pipeline Controller Kickoff After Kubernetes scheduling checks pass",
355+
"type": "stat"
356+
},
357+
{
358+
"description": "Number of TaskRuns outside of Kubernetes Throttling where the Tekton Controller has yet to attempt to create its underlying Pod, or the TaskRun is still in Pending state for multiple scan iterations",
359+
"fieldConfig": {
360+
"defaults": {
361+
"color": {
362+
"mode": "thresholds"
363+
},
364+
"mappings": [],
365+
"max": 1,
366+
"min": 0,
367+
"noValue": "No data",
368+
"thresholds": {
369+
"mode": "absolute",
370+
"steps": [
371+
{
372+
"color": "green",
373+
"value": null
374+
},
375+
{
376+
"color": "red",
377+
"value": 30
378+
}
379+
]
380+
},
381+
"unit": "none"
382+
},
383+
"overrides": []
384+
},
385+
"gridPos": {
386+
"h": 9,
387+
"w": 4,
388+
"x": 16,
389+
"y": 1
390+
},
391+
"id": 482,
392+
"options": {
393+
"colorMode": "value",
394+
"graphMode": "area",
395+
"justifyMode": "auto",
396+
"orientation": "auto",
397+
"reduceOptions": {
398+
"calcs": [
399+
"lastNotNull"
400+
],
401+
"fields": "",
402+
"values": false
403+
},
404+
"showPercentChange": false,
405+
"textMode": "auto",
406+
"wideLayout": true
407+
},
408+
"pluginVersion": "10.4.3",
409+
"targets": [
410+
{
411+
"editorMode": "code",
412+
"expr": "sum(increase(taskrun_pod_create_not_attempted_or_pending_count[30m]))",
413+
"legendFormat": "__auto",
414+
"range": true,
415+
"refId": "A"
416+
}
417+
],
418+
"title": "TaskRun Controller kickoff after Kubernetes scheduling checks pass",
419+
"type": "stat"
420+
},
224421
{
225422
"collapsed": true,
226423
"gridPos": {
@@ -1064,7 +1261,7 @@
10641261
"h": 8,
10651262
"w": 12,
10661263
"x": 12,
1067-
"y": 30
1264+
"y": 22
10681265
},
10691266
"hiddenSeries": false,
10701267
"id": 77,
@@ -1190,7 +1387,7 @@
11901387
"h": 8,
11911388
"w": 12,
11921389
"x": 0,
1193-
"y": 38
1390+
"y": 30
11941391
},
11951392
"id": 39,
11961393
"options": {
@@ -1676,7 +1873,7 @@
16761873
"y": 30
16771874
},
16781875
"hiddenSeries": false,
1679-
"id": 77,
1876+
"id": 478,
16801877
"legend": {
16811878
"avg": false,
16821879
"current": false,
@@ -1755,7 +1952,7 @@
17551952
"y": 14
17561953
},
17571954
"hiddenSeries": false,
1758-
"id": 76,
1955+
"id": 479,
17591956
"legend": {
17601957
"avg": false,
17611958
"current": false,
@@ -3979,8 +4176,7 @@
39794176
"mode": "absolute",
39804177
"steps": [
39814178
{
3982-
"color": "green",
3983-
"value": null
4179+
"color": "green"
39844180
},
39854181
{
39864182
"color": "red",
@@ -4063,8 +4259,7 @@
40634259
"mode": "absolute",
40644260
"steps": [
40654261
{
4066-
"color": "green",
4067-
"value": null
4262+
"color": "green"
40684263
},
40694264
{
40704265
"color": "red",
@@ -4391,4 +4586,4 @@
43914586
"uid": "02ebfdefeeed166624895c36b0c1af4ed3006c5d",
43924587
"version": 1,
43934588
"weekStart": ""
4394-
}
4589+
}

0 commit comments

Comments
 (0)