Skip to content

Commit cd8ed96

Browse files
Widened the Fluentd alert query windows from 1m to 5m, and renamed some alerts
1 parent f0e0be6 commit cd8ed96

File tree

2 files changed

+29
-29
lines changed

2 files changed

+29
-29
lines changed

resources/fluentd/ALERTS.md

Lines changed: 13 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -1,28 +1,28 @@
11
# Alerts
2-
## No Input From Container
2+
## [Fluentd] No Input From Container
33
No Input From Container.
44

5-
## Increased Error Ratio
6-
Increased Error Ratio.
5+
## [Fluentd] High Error Ratio
6+
High Error Ratio.
77

8-
## Increased Retry Ratio
9-
Increased Retry Ratio.
8+
## [Fluentd] High Retry Ratio
9+
High Retry Ratio.
1010

11-
## Increased Retry Wait
12-
Increased Retry Wait.
11+
## [Fluentd] High Retry Wait
12+
High Retry Wait.
1313

14-
## Low Buffer Available Space
14+
## [Fluentd] Low Buffer Available Space
1515
Low Buffer Available Space.
1616

17-
## Buffer Queue Length Increasing
17+
## [Fluentd] Buffer Queue Length Increasing
1818
Buffer Queue Length Increasing.
1919

20-
## Buffer Total Bytes Increasing
20+
## [Fluentd] Buffer Total Bytes Increasing
2121
Buffer Total Bytes Increasing.
2222

23-
## Increased Slow Flush Ratio
24-
Increased Slow Flush Ratio.
23+
## [Fluentd] High Slow Flush Ratio
24+
High Slow Flush Ratio.
2525

26-
## No Output Records From Plugin
26+
## [Fluentd] No Output Records From Plugin
2727
No Output Records From Plugin.
2828

resources/fluentd/alerts.yaml

Lines changed: 16 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -13,36 +13,36 @@ configurations:
1313
rules:
1414
- alert: '[Fluentd] No Input From Container'
1515
expr: |
16-
sum by (input_namespace, input_container)(rate(fluentd_input_status_num_records_total[1m])) == 0
16+
sum by (input_namespace, input_container)(rate(fluentd_input_status_num_records_total[5m])) == 0
1717
for: 5m
1818
labels:
1919
severity: warning
2020
annotations:
2121
description: No Input From Container.
22-
- alert: '[Fluentd] Increased Error Ratio'
22+
- alert: '[Fluentd] High Error Ratio'
2323
expr: |
24-
sum by (type, plugin_id)(rate(fluentd_output_status_num_errors[1m])) /sum by (type, plugin_id)(rate(fluentd_output_status_emit_count[1m]))> 0.05
24+
sum by (type, plugin_id)(rate(fluentd_output_status_num_errors[5m])) /sum by (type, plugin_id)(rate(fluentd_output_status_emit_count[5m]))> 0.05
2525
for: 5m
2626
labels:
2727
severity: critical
2828
annotations:
29-
description: Increased Error Ratio.
30-
- alert: '[Fluentd] Increased Retry Ratio'
29+
description: High Error Ratio.
30+
- alert: '[Fluentd] High Retry Ratio'
3131
expr: |
32-
sum by (type, plugin_id)(rate(fluentd_output_status_retry_count[1m])) /sum by (type, plugin_id)(rate(fluentd_output_status_emit_count[1m]))> 0.05
32+
sum by (type, plugin_id)(rate(fluentd_output_status_retry_count[5m])) /sum by (type, plugin_id)(rate(fluentd_output_status_emit_count[5m]))> 0.05
3333
for: 5m
3434
labels:
3535
severity: critical
3636
annotations:
37-
description: Increased Retry Ratio.
38-
- alert: '[Fluentd] Increased Retry Wait'
37+
description: High Retry Ratio.
38+
- alert: '[Fluentd] High Retry Wait'
3939
expr: |
40-
sum by (type, plugin_id)(max_over_time(fluentd_output_status_retry_wait[1m])) > 60
40+
sum by (type, plugin_id)(max_over_time(fluentd_output_status_retry_wait[5m])) > 60
4141
for: 5m
4242
labels:
4343
severity: critical
4444
annotations:
45-
description: Increased Retry Wait.
45+
description: High Retry Wait.
4646
- alert: '[Fluentd] Low Buffer Available Space'
4747
expr: |
4848
fluentd_output_status_buffer_available_space_ratio < 10
@@ -56,7 +56,7 @@ configurations:
5656
avg_over_time(fluentd_output_status_buffer_queue_length[5m]) - avg_over_time(fluentd_output_status_buffer_queue_length[5m] offset 5m)> 0
5757
for: 5m
5858
labels:
59-
severity: critical
59+
severity: warning
6060
annotations:
6161
description: Buffer Queue Length Increasing.
6262
- alert: '[Fluentd] Buffer Total Bytes Increasing'
@@ -67,19 +67,19 @@ configurations:
6767
severity: warning
6868
annotations:
6969
description: Buffer Total Bytes Increasing.
70-
- alert: '[Fluentd] Increased Slow Flush Ratio'
70+
- alert: '[Fluentd] High Slow Flush Ratio'
7171
expr: |
72-
sum by (type, plugin_id)(rate(fluentd_output_status_slow_flush_count[1m])) /sum by (type, plugin_id)(rate(fluentd_output_status_emit_count[1m]))> 0.05
72+
sum by (type, plugin_id)(rate(fluentd_output_status_slow_flush_count[5m])) /sum by (type, plugin_id)(rate(fluentd_output_status_emit_count[5m]))> 0.05
7373
for: 5m
7474
labels:
7575
severity: warning
7676
annotations:
77-
description: Increased Slow Flush Ratio.
77+
description: High Slow Flush Ratio.
7878
- alert: '[Fluentd] No Output Records From Plugin'
7979
expr: |
80-
rate(fluentd_output_status_emit_records[1m]) == 0
80+
rate(fluentd_output_status_emit_records[5m]) == 0
8181
for: 5m
8282
labels:
8383
severity: warning
8484
annotations:
85-
description: No Output Records From Plugin.
85+
description: No Output Records From Plugin.

0 commit comments

Comments
 (0)