Skip to content

Commit 093c121

Browse files
authored
Merge pull request #156 from run-ai/fix/compute-domain-dra-plugin-liveness-probe
fix: adding compute domain liveness probe
2 parents 9476038 + 5688181 commit 093c121

File tree

2 files changed

+16
-0
lines changed

2 files changed

+16
-0
lines changed

deploy/fake-gpu-operator/templates/compute-domain-dra-plugin/_helpers.tpl

Lines changed: 15 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,22 @@ containers:
3737
value: "/var/lib/kubelet/plugins_registry"
3838
- name: KUBELET_PLUGINS_DIRECTORY_PATH
3939
value: "/var/lib/kubelet/plugins"
40+
{{- if .Values.computeDomainDraPlugin.healthcheckPort }}
41+
- name: HEALTHCHECK_PORT
42+
value: {{ .Values.computeDomainDraPlugin.healthcheckPort | quote }}
43+
{{- end }}
4044
name: compute-domain-dra-plugin-ctr
45+
{{- if (gt (int .Values.computeDomainDraPlugin.healthcheckPort) 0) }}
46+
livenessProbe:
47+
grpc:
48+
port: {{ .Values.computeDomainDraPlugin.healthcheckPort }}
49+
service: liveness
50+
initialDelaySeconds: 30
51+
periodSeconds: 10
52+
timeoutSeconds: 5
53+
failureThreshold: 3
54+
successThreshold: 1
55+
{{- end }}
4156
securityContext:
4257
privileged: true
4358
terminationMessagePath: /dev/termination-log

deploy/fake-gpu-operator/values.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -194,6 +194,7 @@ computeDomainController:
194194

195195
computeDomainDraPlugin:
196196
enabled: false
197+
healthcheckPort: 8082
197198
image:
198199
pullPolicy: Always
199200
repository: ghcr.io/run-ai/fake-gpu-operator/compute-domain-dra-plugin

0 commit comments

Comments
 (0)