Skip to content

Commit 7cbc55f

Browse files
authored
Merge pull request opendatahub-io#33 from DharmitD/probes
Adding Probes to ML Pipelines' pods
2 parents 4394d9d + c37036c commit 7cbc55f

File tree

11 files changed

+126
-18
lines changed

11 files changed

+126
-18
lines changed

manifests/opendatahub/base/deployments/ml-pipeline-persistenceagent.yaml

Lines changed: 16 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -31,6 +31,22 @@ spec:
3131
image: persistenceagent
3232
imagePullPolicy: IfNotPresent
3333
name: ml-pipeline-persistenceagent
34+
livenessProbe:
35+
exec:
36+
command:
37+
- pidof
38+
- persistence_agent
39+
initialDelaySeconds: 30
40+
periodSeconds: 5
41+
timeoutSeconds: 2
42+
readinessProbe:
43+
exec:
44+
command:
45+
- pidof
46+
- persistence_agent
47+
initialDelaySeconds: 3
48+
periodSeconds: 5
49+
timeoutSeconds: 2
3450
resources:
3551
requests:
3652
cpu: 120m

manifests/opendatahub/base/deployments/ml-pipeline-scheduledworkflow.yaml

Lines changed: 16 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -32,4 +32,20 @@ spec:
3232
image: scheduledworkflow
3333
imagePullPolicy: IfNotPresent
3434
name: ml-pipeline-scheduledworkflow
35+
livenessProbe:
36+
exec:
37+
command:
38+
- pidof
39+
- controller
40+
initialDelaySeconds: 30
41+
periodSeconds: 5
42+
timeoutSeconds: 2
43+
readinessProbe:
44+
exec:
45+
command:
46+
- pidof
47+
- controller
48+
initialDelaySeconds: 3
49+
periodSeconds: 5
50+
timeoutSeconds: 2
3551
serviceAccountName: ml-pipeline-scheduledworkflow

manifests/opendatahub/base/deployments/ml-pipeline-viewer-crd.yaml

Lines changed: 16 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -33,4 +33,20 @@ spec:
3333
image: viewer-crd-controller
3434
imagePullPolicy: Always
3535
name: ml-pipeline-viewer-crd
36+
livenessProbe:
37+
exec:
38+
command:
39+
- pidof
40+
- controller
41+
initialDelaySeconds: 30
42+
periodSeconds: 5
43+
timeoutSeconds: 2
44+
readinessProbe:
45+
exec:
46+
command:
47+
- pidof
48+
- controller
49+
initialDelaySeconds: 3
50+
periodSeconds: 5
51+
timeoutSeconds: 2
3652
serviceAccountName: ml-pipeline-viewer-crd-service-account

manifests/opendatahub/base/deployments/ml-pipeline-visualizationserver.yaml

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -21,6 +21,10 @@ spec:
2121
containers:
2222
- image: visualization-server
2323
imagePullPolicy: IfNotPresent
24+
name: ml-pipeline-visualizationserver
25+
ports:
26+
- containerPort: 8888
27+
name: http
2428
livenessProbe:
2529
exec:
2630
command:
@@ -30,13 +34,9 @@ spec:
3034
- -O
3135
- '-'
3236
- http://localhost:8888/
33-
initialDelaySeconds: 3
37+
initialDelaySeconds: 30
3438
periodSeconds: 5
3539
timeoutSeconds: 2
36-
name: ml-pipeline-visualizationserver
37-
ports:
38-
- containerPort: 8888
39-
name: http
4040
readinessProbe:
4141
exec:
4242
command:

manifests/opendatahub/base/deployments/ml-pipeline.yaml

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -121,6 +121,12 @@ spec:
121121
name: $(pipeline_install_configuration)
122122
image: api-server
123123
imagePullPolicy: Always
124+
name: ml-pipeline-api-server
125+
ports:
126+
- containerPort: 8888
127+
name: http
128+
- containerPort: 8887
129+
name: grpc
124130
livenessProbe:
125131
exec:
126132
command:
@@ -133,12 +139,6 @@ spec:
133139
initialDelaySeconds: 3
134140
periodSeconds: 5
135141
timeoutSeconds: 2
136-
name: ml-pipeline-api-server
137-
ports:
138-
- containerPort: 8888
139-
name: http
140-
- containerPort: 8887
141-
name: grpc
142142
readinessProbe:
143143
exec:
144144
command:

manifests/opendatahub/overlays/component-mlmd/deployments/metadata-envoy-deployment.yaml

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -27,3 +27,15 @@ spec:
2727
name: md-envoy
2828
- containerPort: 9901
2929
name: envoy-admin
30+
livenessProbe:
31+
initialDelaySeconds: 30
32+
periodSeconds: 5
33+
tcpSocket:
34+
port: md-envoy
35+
timeoutSeconds: 2
36+
readinessProbe:
37+
initialDelaySeconds: 3
38+
periodSeconds: 5
39+
tcpSocket:
40+
port: md-envoy
41+
timeoutSeconds: 2

manifests/opendatahub/overlays/component-mlmd/deployments/metadata-grpc-deployment.yaml

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -55,16 +55,16 @@ spec:
5555
key: dbPort
5656
name: $(pipeline_install_configuration)
5757
image: metadata-grpc
58+
name: container
59+
ports:
60+
- containerPort: 8080
61+
name: grpc-api
5862
livenessProbe:
59-
initialDelaySeconds: 3
63+
initialDelaySeconds: 30
6064
periodSeconds: 5
6165
tcpSocket:
6266
port: grpc-api
6367
timeoutSeconds: 2
64-
name: container
65-
ports:
66-
- containerPort: 8080
67-
name: grpc-api
6868
readinessProbe:
6969
initialDelaySeconds: 3
7070
periodSeconds: 5

manifests/opendatahub/overlays/component-mlmd/deployments/metadata-writer.yaml

Lines changed: 16 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -32,4 +32,20 @@ spec:
3232
name: $(ml_pipelines_configuration)
3333
image: metadata-writer
3434
name: main
35+
livenessProbe:
36+
exec:
37+
command:
38+
- pidof
39+
- python3
40+
initialDelaySeconds: 30
41+
periodSeconds: 5
42+
timeoutSeconds: 2
43+
readinessProbe:
44+
exec:
45+
command:
46+
- pidof
47+
- python3
48+
initialDelaySeconds: 3
49+
periodSeconds: 5
50+
timeoutSeconds: 2
3551
serviceAccountName: kubeflow-pipelines-metadata-writer

manifests/opendatahub/overlays/metadata-store-mysql/deployments/mysql.yaml

Lines changed: 16 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -31,6 +31,22 @@ spec:
3131
ports:
3232
- containerPort: 3306
3333
name: mysql
34+
livenessProbe:
35+
failureThreshold: 3
36+
initialDelaySeconds: 30
37+
periodSeconds: 10
38+
successThreshold: 1
39+
tcpSocket:
40+
port: 3306
41+
timeoutSeconds: 1
42+
readinessProbe:
43+
failureThreshold: 3
44+
initialDelaySeconds: 5
45+
periodSeconds: 10
46+
successThreshold: 1
47+
tcpSocket:
48+
port: 3306
49+
timeoutSeconds: 1
3450
resources:
3551
requests:
3652
cpu: 100m

manifests/opendatahub/overlays/metadata-store-postgresql/deployments/postgresql.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -35,15 +35,15 @@ spec:
3535
- name: POSTGRESQL_DATABASE
3636
value: kfp-tekton
3737
imagePullPolicy: Always
38+
ports:
39+
- containerPort: 5432
3840
livenessProbe:
3941
exec:
4042
command:
4143
- /usr/libexec/check-container
4244
- --live
4345
initialDelaySeconds: 120
4446
timeoutSeconds: 10
45-
ports:
46-
- containerPort: 5432
4747
readinessProbe:
4848
exec:
4949
command:

0 commit comments

Comments
 (0)