Skip to content

Commit 3d259ae

Browse files
committed
KFLUXINFRA-2067: Push Kueue metrics to RHOBS
Those metrics will be used for creating SLO alerts.

Signed-off-by: Gal Ben Haim <[email protected]>
1 parent df2767a commit 3d259ae

File tree

4 files changed: 22 additions and 2 deletions.

4 files changed

+22
-2
lines changed

components/monitoring/prometheus/production/base/monitoringstack/endpoints-params.yaml

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -52,6 +52,15 @@
5252
- '{__name__="kube_deployment_status_replicas_ready", namespace="gitops-service-argocd"}'
5353
- '{__name__="kube_deployment_spec_replicas", namespace=~"gitops-service-argocd"}'
5454

55+
# Kueue
56+
- '{__name__="tekton_kueue_cel_evaluations_total"}'
57+
- '{__name__="kube_pod_container_status_restarts_total", namespace=~"tekton-kueue|kueue-external-admission|openshift-kueue-operator"}'
58+
- '{__name__="kube_pod_container_status_ready", namespace=~"tekton-kueue|kueue-external-admission|openshift-kueue-operator"}'
59+
- '{__name__="kueue_cluster_queue_status"}'
60+
- '{__name__="kueue_admission_wait_time_seconds_bucket"}'
61+
- '{__name__="apiserver_admission_webhook_request_total", name="pipelinerun-kueue-defaulter.tekton-kueue.io"}'
62+
- '{__name__="up", job=~".*kueue.*"}'
63+
5564
# Namespace (expression): "build-service"
5665
- '{__name__="kube_deployment_status_replicas_ready", namespace="build-service"}'
5766
- '{__name__="kube_deployment_status_replicas_available", namespace="build-service"}'

components/monitoring/prometheus/production/base/monitoringstack/writeRelabelConfigs.yaml

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15,4 +15,5 @@
1515
verb|request_kind|tested_cluster|resource_type|exported_job|http_method|\
1616
http_route|http_status_code|gin_errors|rule_result|rule_execution_cause|\
1717
policy_name|policy_background_mode|rule_type|policy_type|policy_validation_mode|\
18-
resource_request_operation|resource_kind|policy_change_type|event_type"
18+
resource_request_operation|resource_kind|policy_change_type|event_type|\
19+
name|cluster_queue"

components/monitoring/prometheus/staging/base/monitoringstack/endpoints-params.yaml

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -52,6 +52,15 @@
5252
- '{__name__="kube_deployment_status_replicas_ready", namespace="gitops-service-argocd"}'
5353
- '{__name__="kube_deployment_spec_replicas", namespace=~"gitops-service-argocd"}'
5454

55+
# Kueue
56+
- '{__name__="tekton_kueue_cel_evaluations_total"}'
57+
- '{__name__="kube_pod_container_status_restarts_total", namespace=~"tekton-kueue|kueue-external-admission|openshift-kueue-operator"}'
58+
- '{__name__="kube_pod_container_status_ready", namespace=~"tekton-kueue|kueue-external-admission|openshift-kueue-operator"}'
59+
- '{__name__="kueue_cluster_queue_status"}'
60+
- '{__name__="kueue_admission_wait_time_seconds_bucket"}'
61+
- '{__name__="apiserver_admission_webhook_request_total", name="pipelinerun-kueue-defaulter.tekton-kueue.io"}'
62+
- '{__name__="up", job=~".*kueue.*"}'
63+
5564
# Namespace (expression): "build-service"
5665
- '{__name__="kube_deployment_status_replicas_ready", namespace="build-service"}'
5766
- '{__name__="kube_deployment_status_replicas_available", namespace="build-service"}'

components/monitoring/prometheus/staging/base/monitoringstack/writeRelabelConfigs.yaml

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15,4 +15,5 @@
1515
verb|request_kind|tested_cluster|resource_type|exported_job|http_method|\
1616
http_route|http_status_code|gin_errors|rule_result|rule_execution_cause|\
1717
policy_name|policy_background_mode|rule_type|policy_type|policy_validation_mode|\
18-
resource_request_operation|resource_kind|policy_change_type|event_type"
18+
resource_request_operation|resource_kind|policy_change_type|event_type|\
19+
name|cluster_queue"

0 commit comments

Comments
 (0)