You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
description: "This is an alert meant to ensure that the entire alerting pipeline is functional.\nThis alert is always firing, therefore it should always be firing in Alertmanager\nand always fire against a receiver. There are integrations with various notification\nmechanisms that send a notification when this alert is not firing. For example the\n\"DeadMansSnitch\" integration in PagerDuty."
148
-
summary: 'Ensure entire alerting pipeline is functional'
149
-
- alert: InstanceDown
150
-
expr: 'up == 0'
151
-
for: 5m
152
-
labels:
153
-
severity: critical
154
-
annotations:
155
-
description: '{% raw %}{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 5 minutes.{% endraw %}'
156
-
summary: '{% raw %}Instance {{ $labels.instance }} down{% endraw %}'
157
-
- alert: RebootRequired
158
-
expr: 'node_reboot_required > 0'
159
-
labels:
160
-
severity: warning
161
-
annotations:
162
-
description: '{% raw %}{{ $labels.instance }} requires a reboot.{% endraw %}'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left and is filling up.{% endraw %}'
167
-
summary: 'Filesystem is predicted to run out of space within the next 24 hours.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left and is filling up fast.{% endraw %}'
175
-
summary: 'Filesystem is predicted to run out of space within the next 4 hours.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left.{% endraw %}'
183
-
summary: 'Filesystem has less than 5% space left.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left.{% endraw %}'
191
-
summary: 'Filesystem has less than 3% space left.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left and is filling up.{% endraw %}'
199
-
summary: 'Filesystem is predicted to run out of inodes within the next 24 hours.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left and is filling up fast.{% endraw %}'
207
-
summary: 'Filesystem is predicted to run out of inodes within the next 4 hours.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left.{% endraw %}'
215
-
summary: 'Filesystem has less than 5% inodes left.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left.{% endraw %}'
223
-
summary: 'Filesystem has less than 3% inodes left.'
description: '{% raw %}{{ $labels.instance }} interface {{ $labels.device }} has encountered {{ printf "%.0f" $value }} receive errors in the last two minutes.{% endraw %}'
231
-
summary: 'Network interface is reporting many receive errors.'
description: '{% raw %}{{ $labels.instance }} interface {{ $labels.device }} has encountered {{ printf "%.0f" $value }} transmit errors in the last two minutes.{% endraw %}'
239
-
summary: 'Network interface is reporting many transmit errors.'
description: "This is an alert meant to ensure that the entire alerting pipeline is functional.\nThis alert is always firing, therefore it should always be firing in Alertmanager\nand always fire against a receiver. There are integrations with various notification\nmechanisms that send a notification when this alert is not firing. For example the\n\"DeadMansSnitch\" integration in PagerDuty."
153
+
summary: 'Ensure entire alerting pipeline is functional'
154
+
- alert: InstanceDown
155
+
expr: 'up == 0'
156
+
for: 5m
157
+
labels:
158
+
severity: critical
159
+
annotations:
160
+
description: '{% raw %}{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 5 minutes.{% endraw %}'
161
+
summary: '{% raw %}Instance {{ $labels.instance }} down{% endraw %}'
162
+
- alert: RebootRequired
163
+
expr: 'node_reboot_required > 0'
164
+
labels:
165
+
severity: warning
166
+
annotations:
167
+
description: '{% raw %}{{ $labels.instance }} requires a reboot.{% endraw %}'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left and is filling up.{% endraw %}'
172
+
summary: 'Filesystem is predicted to run out of space within the next 24 hours.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left and is filling up fast.{% endraw %}'
180
+
summary: 'Filesystem is predicted to run out of space within the next 4 hours.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left.{% endraw %}'
188
+
summary: 'Filesystem has less than 5% space left.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left.{% endraw %}'
196
+
summary: 'Filesystem has less than 3% space left.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left and is filling up.{% endraw %}'
204
+
summary: 'Filesystem is predicted to run out of inodes within the next 24 hours.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left and is filling up fast.{% endraw %}'
212
+
summary: 'Filesystem is predicted to run out of inodes within the next 4 hours.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left.{% endraw %}'
220
+
summary: 'Filesystem has less than 5% inodes left.'
description: '{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left.{% endraw %}'
228
+
summary: 'Filesystem has less than 3% inodes left.'
description: '{% raw %}{{ $labels.instance }} interface {{ $labels.device }} has encountered {{ printf "%.0f" $value }} receive errors in the last two minutes.{% endraw %}'
236
+
summary: 'Network interface is reporting many receive errors.'
description: '{% raw %}{{ $labels.instance }} interface {{ $labels.device }} has encountered {{ printf "%.0f" $value }} transmit errors in the last two minutes.{% endraw %}'
244
+
summary: 'Network interface is reporting many transmit errors.'
0 commit comments