Skip to content

Commit 9284c7f

Browse files
committed
[observability] Introduce "ReplicasUnavailable" alert (as warning for now)
1 parent 084175e commit 9284c7f

File tree

4 files changed

+48
-0
lines changed

4 files changed

+48
-0
lines changed

operations/observability/mixins/workspace/rules/central/image-builder.yaml

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -51,3 +51,15 @@ spec:
5151
expr: |
5252
kube_deployment_spec_replicas{deployment="image-builder-mk3", cluster!~"ephemeral.*"} != kube_deployment_status_replicas_available{deployment="image-builder-mk3", cluster!~"ephemeral.*"}
5353
for: 3m
54+
- alert: GitpodImageBuilderMk3ReplicasUnavailable  # raised when the image-builder-mk3 deployment reports unavailable replicas (see expr)
55+
labels:
56+
# TODO(gpl): severity stays at warning for now, while this alert is being set up and fine-tuned
57+
severity: warning
58+
dedicated: included
59+
annotations:
60+
runbook_url: https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodWorkspaceDeploymentReplicaMismatch.md
61+
summary: image-builder-mk3 replicas are unavailable in cluster {{ $labels.cluster }}
62+
description: 'image-builder-mk3 pods are unavailable in cluster {{ $labels.cluster }}: {{ printf "%.2f" $value }}'
63+
expr: |
64+
kube_deployment_status_replicas_unavailable{deployment="image-builder-mk3", cluster!~"ephemeral.*"} > 0
65+
for: 10m  # the expression must hold for 10 minutes before the alert fires

operations/observability/mixins/workspace/rules/central/node-labeler.yaml

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -35,3 +35,15 @@ spec:
3535
expr: |
3636
kube_deployment_spec_replicas{deployment="node-labeler", cluster!~"ephemeral.*"} != kube_deployment_status_replicas_available{deployment="node-labeler", cluster!~"ephemeral.*"}
3737
for: 3m
38+
- alert: GitpodNodeLabelerReplicasUnavailable  # raised when the node-labeler deployment reports unavailable replicas (see expr)
39+
labels:
40+
# TODO(gpl): severity stays at warning for now, while this alert is being set up and fine-tuned
41+
severity: warning
42+
dedicated: included
43+
annotations:
44+
runbook_url: https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodWorkspaceDeploymentReplicaMismatch.md
45+
summary: node-labeler replicas are unavailable in cluster {{ $labels.cluster }}
46+
description: 'node-labeler pods are unavailable in cluster {{ $labels.cluster }}: {{ printf "%.2f" $value }}'
47+
expr: |
48+
kube_deployment_status_replicas_unavailable{deployment="node-labeler", cluster!~"ephemeral.*"} > 0
49+
for: 10m  # the expression must hold for 10 minutes before the alert fires

operations/observability/mixins/workspace/rules/central/ws-manager.yaml

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -35,3 +35,15 @@ spec:
3535
expr: |
3636
kube_deployment_spec_replicas{deployment="ws-manager-mk2", cluster!~"ephemeral.*"} != kube_deployment_status_replicas_available{deployment="ws-manager-mk2", cluster!~"ephemeral.*"}
3737
for: 3m
38+
- alert: GitpodWsManagerMk2ReplicasUnavailable  # raised when the ws-manager-mk2 deployment reports unavailable replicas (see expr)
39+
labels:
40+
# TODO(gpl): severity stays at warning for now, while this alert is being set up and fine-tuned
41+
severity: warning
42+
dedicated: included
43+
annotations:
44+
runbook_url: https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodWorkspaceDeploymentReplicaMismatch.md
45+
summary: ws-manager-mk2 replicas are unavailable in cluster {{ $labels.cluster }}
46+
description: 'ws-manager-mk2 pods are unavailable in cluster {{ $labels.cluster }}: {{ printf "%.2f" $value }}'
47+
expr: |
48+
kube_deployment_status_replicas_unavailable{deployment="ws-manager-mk2", cluster!~"ephemeral.*"} > 0
49+
for: 10m  # the expression must hold for 10 minutes before the alert fires

operations/observability/mixins/workspace/rules/central/ws-proxy.yaml

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -35,3 +35,15 @@ spec:
3535
expr: |
3636
kube_deployment_spec_replicas{deployment="ws-proxy", cluster!~"ephemeral.*"} != kube_deployment_status_replicas_available{deployment="ws-proxy", cluster!~"ephemeral.*"}
3737
for: 3m
38+
- alert: GitpodWsProxyReplicasUnavailable  # raised when the ws-proxy deployment reports unavailable replicas (see expr)
39+
labels:
40+
# TODO(gpl): severity stays at warning for now, while this alert is being set up and fine-tuned
41+
severity: warning
42+
dedicated: included
43+
annotations:
44+
runbook_url: https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodWorkspaceDeploymentReplicaMismatch.md
45+
summary: ws-proxy replicas are unavailable in cluster {{ $labels.cluster }}
46+
description: 'ws-proxy pods are unavailable in cluster {{ $labels.cluster }}: {{ printf "%.2f" $value }}'
47+
expr: |
48+
kube_deployment_status_replicas_unavailable{deployment="ws-proxy", cluster!~"ephemeral.*"} > 0
49+
for: 10m  # the expression must hold for 10 minutes before the alert fires

0 commit comments

Comments
 (0)