Skip to content

Commit db3981c

Browse files
committed
add CsvAbnormalReplacing alerts
Signed-off-by: Ben Ye <[email protected]>
1 parent 6405f0e commit db3981c

File tree

2 files changed

+28
-6
lines changed

2 files changed

+28
-6
lines changed

deploy/chart/templates/0000_90_olm_01-prometheus-rule.yaml

Lines changed: 14 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -9,12 +9,23 @@ metadata:
99
role: alert-rules
1010
spec:
1111
groups:
12-
- name: olm.failing_operators.rules
12+
- name: olm.csv_abnormal.rules
1313
rules:
14-
- alert: FailingOperator
14+
- alert: CsvAbnormalFailedOver2Min
15+
expr: csv_abnormal{phase=~"^Failed$",exported_namespace=~"(^openshift.*|^kube.*|^redhat.*|^default$)"}
16+
for: 2m
17+
labels:
18+
severity: warning
19+
namespace: "{{ "{{ $labels.namespace }}" }}"
1520
annotations:
1621
message: Failed to install Operator {{ printf "{{ $labels.name }}" }} version {{ printf "{{ $labels.version }}" }}. Reason-{{ printf "{{ $labels.reason }}" }}
17-
expr: csv_abnormal{phase="Failed"}
22+
23+
- alert: CsvAbnormalOver30Min
24+
expr: csv_abnormal{phase=~"(^Replacing$|^Pending$|^Deleting$|^Unknown$)",exported_namespace=~"(^openshift.*|^kube.*|^redhat.*|^default$)"}
25+
for: 30m
1826
labels:
1927
severity: warning
28+
namespace: "{{ "{{ $labels.namespace }}" }}"
29+
annotations:
30+
message: Failed to install Operator {{ printf "{{ $labels.name }}" }} version {{ printf "{{ $labels.version }}" }}. Phase-{{ printf "{{ $labels.phase }}" }} Reason-{{ printf "{{ $labels.reason }}" }}
2031
{{ end }}

manifests/0000_90_olm_01-prometheus-rule.yaml

Lines changed: 14 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -8,11 +8,22 @@ metadata:
88
role: alert-rules
99
spec:
1010
groups:
11-
- name: olm.failing_operators.rules
11+
- name: olm.csv_abnormal.rules
1212
rules:
13-
- alert: FailingOperator
13+
- alert: CsvAbnormalFailedOver2Min
14+
expr: csv_abnormal{phase=~"^Failed$",exported_namespace=~"(^openshift.*|^kube.*|^redhat.*|^default$)"}
15+
for: 2m
16+
labels:
17+
severity: warning
18+
namespace: "{{ $labels.namespace }}"
1419
annotations:
1520
message: Failed to install Operator {{ $labels.name }} version {{ $labels.version }}. Reason-{{ $labels.reason }}
16-
expr: csv_abnormal{phase="Failed"}
21+
22+
- alert: CsvAbnormalOver30Min
23+
expr: csv_abnormal{phase=~"(^Replacing$|^Pending$|^Deleting$|^Unknown$)",exported_namespace=~"(^openshift.*|^kube.*|^redhat.*|^default$)"}
24+
for: 30m
1725
labels:
1826
severity: warning
27+
namespace: "{{ $labels.namespace }}"
28+
annotations:
29+
message: Failed to install Operator {{ $labels.name }} version {{ $labels.version }}. Phase-{{ $labels.phase }} Reason-{{ $labels.reason }}

0 commit comments

Comments
 (0)