Skip to content

Commit 39ee75a

Browse files
authored
Merge pull request #225 from sysdiglabs/phpfpm
fix php-fpm alerts
2 parents 1fb78ce + fab815e commit 39ee75a

File tree

1 file changed

+27
-64
lines changed

1 file changed

+27
-64
lines changed

resources/php-fpm/alerts.yaml

Lines changed: 27 additions & 64 deletions
Original file line numberDiff line numberDiff line change
@@ -9,83 +9,46 @@ configurations:
99
- kind: Prometheus
1010
data: |-
1111
groups:
12-
- name: "Php-Fpm"
13-
groupId: "php-fpm"
14-
description: "Php-Fpm alerts"
15-
integrationType: "php-fpm"
16-
scopeVariables:
17-
- variable: cluster
18-
label: kubernetes.cluster.name
19-
operator: in
20-
- variable: namespace
21-
label: kubernetes.namespace.name
22-
operator: in
23-
- variable: workload
24-
label: kubernetes.workload.name
25-
operator: in
12+
- name: Php-Fpm
2613
rules:
27-
- alert: "[Php-Fpm] Percentage of instances low"
28-
alertId: "PercentageOfInstancesLow"
29-
description: "Most of the instances are down"
14+
- alert: '[Php-Fpm] Percentage of instances low'
3015
expr: |
31-
sum by (kube_workload_name,kube_namespace_name,kube_cluster_name)(phpfpm_up{kube_cluster_name=~$cluster,kube_namespace_name=~$namespace,kube_workload_name=~$workload})/sum by (kube_workload_name,kube_namespace_name,kube_cluster_name)(kube_workload_status_desired{kube_cluster_name=~$cluster,kube_namespace_name=~$namespace,kube_workload_name=~$workload}) < 0.75
16+
sum (phpfpm_up==1) / sum (phpfpm_up) < 0.75
3217
for: 5m
3318
labels:
34-
severity: high
19+
severity: critical
3520
annotations:
36-
summary: |
37-
[{{$labels.kube_cluster_name}} > {{$labels.kube_namespace_name}} > {{$labels.kube_workload_name}}] {{__alert_name__}} is {{__alert_status__}}
38-
description: |
39-
Most of the instances are down
40-
- alert: "[Php-Fpm] Recently reboot"
41-
alertId: "RecentlyReeboot"
42-
description: "Instances have been recently reboot"
21+
description: Less than 75% of instances are up
22+
- alert: '[Php-Fpm] Recently reboot'
4323
expr: |
44-
(count by (kube_cluster_name, kube_namespace_name,kube_pod_name)(phpfpm_start_since{kube_cluster_name=~$cluster,kube_namespace_name=~$namespace,kube_workload_name=~$workload} < 1800) or vector (0))/sum by (kube_cluster_name, kube_namespace_name,kube_pod_name)(phpfpm_up{kube_cluster_name=~$cluster,kube_namespace_name=~$namespace,kube_workload_name=~$workload}) > 0.4
24+
(count (phpfpm_start_since < 1800) or vector (0))/sum (phpfpm_up) > 0.4
4525
for: 5m
4626
labels:
47-
severity: high
27+
severity: info
4828
annotations:
49-
summary: |
50-
[{{$labels.kube_cluster_name}} > {{$labels.kube_namespace_name}} > {{$labels.kube_workload_name}}] {{__alert_name__}} is {{__alert_status__}}
51-
description: |
52-
Instances have been recently reboot
53-
- alert: "[Php-Fpm] Limit of child proccess exceeded"
54-
alertId: "LimitOfChildsExceeded"
55-
description: "Number of childs process have been exceeded"
29+
description: Instances have been recently rebooted
30+
- alert: '[Php-Fpm] Limit of child proccess exceeded'
5631
expr: |
57-
sum by (kube_cluster_name, kube_namespace_name,kube_pod_name) (rate (phpfpm_max_children_reached{kube_cluster_name=~$cluster,kube_namespace_name=~$namespace,kube_workload_name=~$workload}[5m])) > 0
32+
sum (rate (phpfpm_max_children_reached[5m])) > 0
5833
for: 5m
5934
labels:
60-
severity: high
35+
severity: critical
6136
annotations:
62-
summary: |
63-
[{{$labels.kube_cluster_name}} > {{$labels.kube_namespace_name}} > {{$labels.kube_workload_name}}] {{__alert_name__}} is {{__alert_status__}}
64-
description: |
65-
Number of childs process have been exceeded
66-
- alert: "[Php-Fpm] Reaching limit of queue process"
67-
alertId: "ReachedQueueLimit"
68-
description: "Buffer of queue requests reaching its limit"
37+
description: The maximum number of child processes has been reached
38+
- alert: '[Php-Fpm] Reaching limit of queue process'
6939
expr: |
70-
(phpfpm_listen_queue{kube_cluster_name=~$cluster,kube_namespace_name=~$namespace,kube_workload_name=~$workload} / phpfpm_listen_queue_length{kube_cluster_name=~$cluster,kube_namespace_name=~$namespace,kube_workload_name=~$workload}) > 0.8
40+
(phpfpm_listen_queue / phpfpm_listen_queue_length) > 0.8
7141
for: 5m
7242
labels:
73-
severity: medium
74-
annotations:
75-
summary: |
76-
[{{$labels.kube_cluster_name}} > {{$labels.kube_namespace_name}} > {{$labels.kube_workload_name}}] {{__alert_name__}} is {{__alert_status__}}
77-
description: |
78-
Buffer of queue requests reaching its limit
79-
- alert: "[Php-Fpm] Requests processed reached timeout limit"
80-
alertId: "TimeoutLimitRequestReached"
81-
description: "Timeout limit reached by some of the requests"
82-
expr: |
83-
rate (phpfpm_slow_requests{kube_cluster_name=~$cluster,kube_namespace_name=~$namespace,kube_workload_name=~$workload}[5m]) / rate (phpfpm_process_requests{kube_cluster_name=~$cluster,kube_namespace_name=~$namespace,kube_workload_name=~$workload}[5m]) > 0.75
84-
for: 5m
85-
labels:
86-
severity: medium
87-
annotations:
88-
summary: |
89-
[{{$labels.kube_cluster_name}} > {{$labels.kube_namespace_name}} > {{$labels.kube_workload_name}}] {{__alert_name__}} is {{__alert_status__}}
90-
description: |
91-
Timeout limit reached by some of the requests
43+
severity: warning
44+
annotations:
45+
description: Buffer of queue requests reaching its limit
46+
- alert: '[Php-Fpm] Too slow requests processing'
47+
expr: |
48+
rate (phpfpm_slow_requests[5m]) / rate (phpfpm_process_requests[5m]) > 0.1
49+
for: 5m
50+
labels:
51+
severity: warning
52+
annotations:
53+
description: Requests are taking too much time to be processed
54+

0 commit comments

Comments
 (0)