Skip to content

Commit f252c46

Browse files
authored
Add NodeSystemdServiceCrashlooping alert to mixin (#3039)
* Add NodeSystemdServiceCrashlooping alert --------- Signed-off-by: Vitaly Zhuravlev <[email protected]>
1 parent edc40d1 commit f252c46

File tree

1 file changed

+14
-0
lines changed

1 file changed

+14
-0
lines changed

docs/node-mixin/alerts/alerts.libsonnet

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -407,6 +407,20 @@
407407
description: 'Systemd service {{ $labels.name }} has entered failed state at {{ $labels.instance }}',
408408
},
409409
},
410+
{
411+
alert: 'NodeSystemdServiceCrashlooping',
412+
expr: |||
413+
increase(node_systemd_service_restart_total{%(nodeExporterSelector)s}[5m]) > 2
414+
||| % $._config,
415+
'for': '15m',
416+
labels: {
417+
severity: 'warning',
418+
},
419+
annotations: {
420+
summary: 'Systemd service keeps restarting, possibly crash looping.',
421+
description: 'Systemd service {{ $labels.name }} has been restarted too many times at {{ $labels.instance }} for the last 15 minutes. Please check if the service is crash looping.',
422+
},
423+
},
410424
{
411425
alert: 'NodeBondingDegraded',
412426
expr: |||

0 commit comments

Comments
 (0)