diff --git a/etc/kayobe/kolla/config/prometheus/openstack.rules b/etc/kayobe/kolla/config/prometheus/openstack.rules
index 78a7f8282..ba78e76a3 100644
--- a/etc/kayobe/kolla/config/prometheus/openstack.rules
+++ b/etc/kayobe/kolla/config/prometheus/openstack.rules
@@ -11,5 +11,22 @@ groups:
     annotations:
       summary: "{{ $labels.service }} at {{ $labels.hostname }} is down"
       description: "OpenStack service {{ $labels.service }} at {{ $labels.hostname }} is down"
-
+- name: Routers
+  rules:
+  # Fires for every router reporting an HA state that is not active on exactly
+  # one agent. The "unless" form is required: count() over an empty selection
+  # yields no series, so `count(...{ha_state="active"}) != 1` alone can never
+  # match a router with zero active agents.
+  # NOTE(review): assumes non-HA routers are exported with ha_state="" - confirm.
+  - alert: OpenStackRouterDown
+    expr: >-
+      count by (router_id) (openstack_neutron_l3_agent_of_router{ha_state!=""})
+      unless
+      (count by (router_id) (openstack_neutron_l3_agent_of_router{ha_state="active"}) == 1)
+    for: 1m
+    labels:
+      severity: alert
+    annotations:
+      summary: "The router {{ $labels.router_id }} is not active on exactly one agent"
+      description: "The router {{ $labels.router_id }} should be active on exactly one agent. It can either be active on multiple agents or not active at all."
 {% endraw %}
diff --git a/releasenotes/notes/adds-alert-for-active-routers-91281912213692c9.yaml b/releasenotes/notes/adds-alert-for-active-routers-91281912213692c9.yaml
new file mode 100644
index 000000000..1578a4706
--- /dev/null
+++ b/releasenotes/notes/adds-alert-for-active-routers-91281912213692c9.yaml
@@ -0,0 +1,5 @@
+---
+features:
+  - |
+    Adds an alert to check that each router is active on exactly one L3 agent
+    on ML2/OVS based deployments.