Skip to content

Commit c9e9d5d

Browse files
committed
SRVKP-4532: factor k8s throttling into task panel
Also: fix tekton-config.yaml yamllint error; widen controller restart query; make osp pruner cfg consistent with konflux prod. rh-pre-commit.version: 2.3.0; rh-pre-commit.check-secrets: ENABLED
1 parent c12b163 commit c9e9d5d

File tree

2 files changed

+12
-13
lines changed

2 files changed

+12
-13
lines changed

operator/gitops/argocd/grafana/dashboards/pipeline-service-dashboard.json

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -227,7 +227,7 @@
227227
"type": "stat"
228228
},
229229
{
230-
"description": "The number of times the pipelines controller has restarted",
230+
"description": "The number of times any of the pipelines controllers have restarted",
231231
"fieldConfig": {
232232
"defaults": {
233233
"color": {
@@ -281,7 +281,7 @@
281281
"targets": [
282282
{
283283
"editorMode": "code",
284-
"expr": "sum(increase(kube_pod_container_status_restarts_total{namespace=\"openshift-pipelines\", pod=~\"tekton-pipelines-controller-.*\"}[2m]))",
284+
"expr": "sum(increase(kube_pod_container_status_restarts_total{namespace=\"openshift-pipelines\", pod=~\"tekton-.*\"}[2m]))",
285285
"legendFormat": "__auto",
286286
"range": true,
287287
"refId": "A"
@@ -409,7 +409,7 @@
409409
"targets": [
410410
{
411411
"editorMode": "code",
412-
"expr": "sum(increase(taskrun_pod_create_not_attempted_or_pending_count[2m]))",
412+
"expr": "sum(increase(taskrun_pod_create_not_attempted_or_pending_count[2m])) - sum(increase(tekton_pipelines_controller_running_taskruns_throttled_by_quota[2m])) - sum(increase(tekton_pipelines_controller_running_taskruns_throttled_by_node[2m]))",
413413
"legendFormat": "__auto",
414414
"range": true,
415415
"refId": "A"

operator/gitops/argocd/pipeline-service/openshift-pipelines/tekton-config.yaml

Lines changed: 9 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -190,13 +190,12 @@ spec:
190190
kube-api-qps: 50
191191
kube-api-burst: 50
192192
pruner:
193-
# The load on prod-rh01 is to the point now where tekton-results
194-
# can fall too far behind. Until the watcher's log storage is rewritten
195-
# etc with SRVKP-4347 or if we risk adding more processing power (threads,qps,burst)
196-
# to the mem leak version of the watcher, we need the OSP pruner as a backup.
197-
# a bit of an adjustment, we will prune once an hour now per https://crontab.guru/every-1-hour
198-
# to line up with typical timeout settings.
199-
keep: 10
200-
resources:
201-
- pipelinerun
202-
schedule: 0 * * * *
193+
# The load on prod-rh01 is to the point now where tekton-results
194+
# can fall too far behind. Until the watcher's log storage is rewritten
195+
# etc with SRVKP-4347 or if we risk adding more processing power (threads,qps,burst)
196+
# to the mem leak version of the watcher, we need the OSP pruner as a backup.
197+
disable: false
198+
keep-since: 60
199+
resources:
200+
- pipelinerun
201+
schedule: "*/10 * * * *"

0 commit comments

Comments
 (0)