File tree Expand file tree Collapse file tree 1 file changed +47
-0
lines changed
Expand file tree Collapse file tree 1 file changed +47
-0
lines changed Original file line number Diff line number Diff line change 1515groups :
1616- name : alert.rules
1717 rules :
# TiProxyServerIsDown: fires once the `up` series for job "tiproxy" has
# evaluated to 0 continuously for 1 minute.
# NOTE(review): ENV_LABELS_ENV looks like a placeholder substituted at deploy
# time — confirm against the deployment tooling.
- alert: TiProxyServerIsDown
  for: 1m
  expr: 'up{job="tiproxy"} == 0'
  labels:
    severity: emergency
    env: ENV_LABELS_ENV
    # The rule expression is mirrored as a label; keep it identical to `expr` above.
    expr: 'up{job="tiproxy"} == 0'
  annotations:
    summary: TiProxy server is down
    description: ' cluster: ENV_LABELS_ENV, instance: {{ $labels.instance }} is down for 1 minute'
    value: ' {{ $value }}'
29+
# TiProxyDiscoveredTimeJumpBack: fires when the
# tiproxy_monitor_time_jump_back_total counter has increased within the last
# 10 minutes and that condition has held for 1 minute.
# NOTE(review): ENV_LABELS_ENV looks like a placeholder substituted at deploy
# time — confirm against the deployment tooling.
- alert: TiProxyDiscoveredTimeJumpBack
  for: 1m
  expr: 'increase(tiproxy_monitor_time_jump_back_total[10m]) > 0'
  labels:
    severity: warning
    env: ENV_LABELS_ENV
    # The rule expression is mirrored as a label; keep it identical to `expr` above.
    expr: 'increase(tiproxy_monitor_time_jump_back_total[10m]) > 0'
  annotations:
    summary: TiProxy monitor found time jump back error
    description: ' cluster: ENV_LABELS_ENV, instance: {{ $labels.instance }}, values:{{ $value }}'
    value: ' {{ $value }}'
41+
# TiProxyReportErr: fires when the tiproxy_server_err series has increased
# within the last 10 minutes and that condition has held for 1 minute.
# NOTE(review): ENV_LABELS_ENV looks like a placeholder substituted at deploy
# time — confirm against the deployment tooling.
- alert: TiProxyReportErr
  for: 1m
  expr: 'increase(tiproxy_server_err[10m]) > 0'
  labels:
    severity: major
    env: ENV_LABELS_ENV
    # The rule expression is mirrored as a label; keep it identical to `expr` above.
    expr: 'increase(tiproxy_server_err[10m]) > 0'
  annotations:
    summary: TiProxy reports critical error
    description: ' cluster: ENV_LABELS_ENV, instance: {{ $labels.instance }}, value: {{ $value }}'
    value: ' {{ $value }}'
53+
# TiProxyGetBackendFail: fires when, for any single instance, the summed
# 1-minute rate of tiproxy_backend_get_backend samples labelled res="fail"
# stays above 10 for 1 minute.
# NOTE(review): ENV_LABELS_ENV looks like a placeholder substituted at deploy
# time — confirm against the deployment tooling.
- alert: TiProxyGetBackendFail
  for: 1m
  expr: 'sum(rate(tiproxy_backend_get_backend{res="fail"}[1m])) by (instance) > 10'
  labels:
    severity: major
    env: ENV_LABELS_ENV
    # The rule expression is mirrored as a label; keep it identical to `expr` above.
    expr: 'sum(rate(tiproxy_backend_get_backend{res="fail"}[1m])) by (instance) > 10'
  annotations:
    summary: TiProxy fails to get backends
    description: ' cluster: ENV_LABELS_ENV, instance: {{ $labels.instance }}, value: {{ $value }}'
    value: ' {{ $value }}'
You can’t perform that action at this time.
0 commit comments