Skip to content

Commit 811a2d1

Browse files
authored
Merge pull request #1121 from rackerlabs/PUC-717-20250801
fix(rabbitmq): Sets rabbitmq cluster replicas to 3 to match OpenStack helm values
2 parents b2891f8 + a8f1202 commit 811a2d1

13 files changed

+48
-56
lines changed
Lines changed: 13 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,20 @@
1+
---
12
apiVersion: rabbitmq.com/v1beta1
23
kind: RabbitmqCluster
34
metadata:
45
name: rabbitmq
56
annotations:
67
# do not allow ArgoCD to delete our cluster
78
argocd.argoproj.io/sync-options: Delete=false
9+
spec:
10+
replicas: 3
11+
---
12+
apiVersion: policy/v1
13+
kind: PodDisruptionBudget
14+
metadata:
15+
name: pdb-rabbitmq
16+
spec:
17+
maxUnavailable: 1
18+
selector:
19+
matchLabels:
20+
app.kubernetes.io/name: rabbitmq

operators/rabbitmq-system/cluster-operator/kustomization.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@ apiVersion: kustomize.config.k8s.io/v1beta1
22
kind: Kustomization
33

44
resources:
5-
- https://github.com/rabbitmq/cluster-operator/releases/download/v2.14.0/cluster-operator.yml
5+
- https://github.com/rabbitmq/cluster-operator/releases/download/v2.15.0/cluster-operator.yml
66

77
# this needs to be here to remove the namespace from the above
88
# because the cluster-operator defines the same namespace and it would conflict

operators/rabbitmq-system/monitoring/kustomization.yaml

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -17,5 +17,4 @@ resources:
1717
- ./rules/rabbitmq/cluster-alarms.yml
1818
- ./rules/rabbitmq/insufficient-established-erlang-distribution-links.yml
1919
- ./rules/rabbitmq/persistent-volume-missing.yml
20-
- ./rules/rabbitmq/tcp-sockets-near-limit.yml
2120
- ./rules/rabbitmq-cluster-operator/unavailable-replicas.yml

operators/rabbitmq-system/monitoring/rules/rabbitmq-per-object/queue-has-no-consumers.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@ spec:
1414
expr: |
1515
(
1616
((rabbitmq_detailed_queue_consumers{vhost="/", queue=~".*"} == 0) + rabbitmq_detailed_queue_messages) > 0
17-
) * on (instance, job) group_left(rabbitmq_cluster) rabbitmq_identity_info
17+
) * on (instance) group_left(rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)
1818
for: 10m
1919
annotations:
2020
description: |

operators/rabbitmq-system/monitoring/rules/rabbitmq-per-object/queue-is-growing.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@ spec:
1515
expr: |
1616
(
1717
avg_over_time(rabbitmq_detailed_queue_messages[10m]) - avg_over_time(rabbitmq_detailed_queue_messages[10m] offset 1m) > 1
18-
) * on (instance, job) group_left(rabbitmq_cluster) rabbitmq_identity_info
18+
) * on (instance) group_left(rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)
1919
for: 10m
2020
annotations:
2121
description: |

operators/rabbitmq-system/monitoring/rules/rabbitmq/cluster-alarms.yml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@ spec:
1414
expr: |
1515
max by(rabbitmq_cluster) (
1616
max_over_time(rabbitmq_alarms_memory_used_watermark[5m])
17-
* on(instance) group_left(rabbitmq_cluster, rabbitmq_node, pod) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster)
17+
* on(instance) group_left(rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)
1818
) > 0
1919
keep_firing_for: 5m
2020
annotations:
@@ -30,7 +30,7 @@ spec:
3030
expr: |
3131
max by(rabbitmq_cluster) (
3232
max_over_time(rabbitmq_alarms_free_disk_space_watermark[5m])
33-
* on(instance) group_left(rabbitmq_cluster, rabbitmq_node, pod) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster)
33+
* on(instance) group_left(rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)
3434
) > 0
3535
keep_firing_for: 5m
3636
annotations:
@@ -46,7 +46,7 @@ spec:
4646
expr: |
4747
max by(rabbitmq_cluster) (
4848
max_over_time(rabbitmq_alarms_file_descriptor_limit[5m])
49-
* on(instance) group_left(rabbitmq_cluster, rabbitmq_node, pod) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster)
49+
* on(instance) group_left(rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)
5050
) > 0
5151
keep_firing_for: 5m
5252
annotations:

operators/rabbitmq-system/monitoring/rules/rabbitmq/container-restarts.yml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -12,9 +12,9 @@ spec:
1212
rules:
1313
- alert: ContainerRestarts
1414
expr: |
15-
increase(kube_pod_container_status_restarts_total[10m]) * on(namespace, pod, container) group_left(rabbitmq_cluster) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster)
16-
>=
17-
1
15+
increase(kube_pod_container_status_restarts_total[10m])
16+
* on(namespace, pod, container) group_left(rabbitmq_cluster) max by (namespace, pod, container, rabbitmq_cluster) (rabbitmq_identity_info)
17+
>= 1
1818
for: 5m
1919
annotations:
2020
description: |

operators/rabbitmq-system/monitoring/rules/rabbitmq/file-descriptors-near-limit.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -12,9 +12,9 @@ spec:
1212
rules:
1313
- alert: FileDescriptorsNearLimit
1414
expr: |
15-
sum by(namespace, rabbitmq_cluster, pod, rabbitmq_node) (max_over_time(rabbitmq_process_open_fds[5m]) * on(instance) group_left(rabbitmq_cluster, rabbitmq_node, pod) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster))
15+
sum by(namespace, rabbitmq_cluster, pod, rabbitmq_node) (max_over_time(rabbitmq_process_open_fds[5m]) * on(instance) group_left(rabbitmq_cluster, rabbitmq_node) max by (instance, rabbitmq_node, rabbitmq_cluster) (rabbitmq_identity_info))
1616
/
17-
sum by(namespace, rabbitmq_cluster, pod, rabbitmq_node) (rabbitmq_process_max_fds * on(instance) group_left(rabbitmq_cluster, rabbitmq_node, pod) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster))
17+
sum by(namespace, rabbitmq_cluster, pod, rabbitmq_node) (rabbitmq_process_max_fds * on(instance) group_left(rabbitmq_cluster, rabbitmq_node) max by (instance, rabbitmq_node, rabbitmq_cluster) (rabbitmq_identity_info))
1818
> 0.8
1919
for: 10m
2020
annotations:

operators/rabbitmq-system/monitoring/rules/rabbitmq/high-connection-churn.yml

Lines changed: 16 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -13,15 +13,27 @@ spec:
1313
- alert: HighConnectionChurn
1414
expr: |
1515
(
16-
sum(rate(rabbitmq_connections_closed_total[5m]) * on(instance) group_left(rabbitmq_cluster, rabbitmq_node) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster)) by(namespace, rabbitmq_cluster)
16+
sum by (namespace, rabbitmq_cluster) (
17+
rate(rabbitmq_connections_closed_total[5m])
18+
* on (instance) group_left (rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)
19+
)
1720
+
18-
sum(rate(rabbitmq_connections_opened_total[5m]) * on(instance) group_left(rabbitmq_cluster, rabbitmq_node) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster)) by(namespace, rabbitmq_cluster)
21+
sum by (namespace, rabbitmq_cluster) (
22+
rate(rabbitmq_connections_opened_total[5m])
23+
* on (instance) group_left (rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)
24+
)
1925
)
2026
/
21-
sum (rabbitmq_connections * on(instance) group_left(rabbitmq_cluster) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster)) by (namespace, rabbitmq_cluster)
27+
sum by (namespace, rabbitmq_cluster) (
28+
rabbitmq_connections
29+
* on (instance) group_left (rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)
30+
)
2231
> 0.1
2332
unless
24-
sum (rabbitmq_connections * on(instance) group_left(rabbitmq_cluster) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster)) by (namespace, rabbitmq_cluster)
33+
sum by (namespace, rabbitmq_cluster) (
34+
rabbitmq_connections
35+
* on (instance) group_left (rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)
36+
)
2537
< 100
2638
for: 10m
2739
annotations:

operators/rabbitmq-system/monitoring/rules/rabbitmq/insufficient-established-erlang-distribution-links.yml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -13,11 +13,11 @@ spec:
1313
- alert: InsufficientEstablishedErlangDistributionLinks
1414
# erlang_vm_dist_node_state: 1=pending, 2=up_pending, 3=up
1515
expr: |
16-
count by (namespace, rabbitmq_cluster) (erlang_vm_dist_node_state * on(instance) group_left(rabbitmq_cluster) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster) == 3)
16+
count by (namespace, rabbitmq_cluster) (erlang_vm_dist_node_state * on(instance) group_left(rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info) == 3)
1717
<
18-
count by (namespace, rabbitmq_cluster) (rabbitmq_build_info * on(instance) group_left(rabbitmq_cluster) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster))
18+
count by (namespace, rabbitmq_cluster) (rabbitmq_build_info * on(instance) group_left(rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info))
1919
*
20-
(count by (namespace, rabbitmq_cluster) (rabbitmq_build_info * on(instance) group_left(rabbitmq_cluster) max(rabbitmq_identity_info) by (namespace, pod, container, rabbitmq_cluster)) -1 )
20+
(count by (namespace, rabbitmq_cluster) (rabbitmq_build_info * on(instance) group_left(rabbitmq_cluster) max by (instance, rabbitmq_cluster) (rabbitmq_identity_info)) -1 )
2121
for: 10m
2222
annotations:
2323
description: |

0 commit comments

Comments
 (0)