Skip to content

Commit ae7e206

Browse files
authored
Merge pull request #87 from stackhpc/extra-llm-pod-config
Add scheduling config options for UI and API pods
2 parents cbac2a7 + 6cb23f0 commit ae7e206

File tree

3 files changed

+37
-1
lines changed

3 files changed

+37
-1
lines changed

charts/azimuth-llm/templates/api/deployment.yml

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -70,4 +70,16 @@ spec:
7070
emptyDir:
7171
medium: Memory
7272
sizeLimit: 1Gi
73+
{{- with $.Values.api.nodeSelector }}
74+
nodeSelector:
75+
{{- toYaml . | nindent 8 }}
76+
{{- end }}
77+
{{- with $.Values.api.affinity }}
78+
affinity:
79+
{{- toYaml . | nindent 8 }}
80+
{{- end }}
81+
{{- with $.Values.api.tolerations }}
82+
tolerations:
83+
{{- toYaml . | nindent 8 }}
84+
{{- end }}
7385
{{- end -}}

charts/azimuth-llm/templates/ui/deployment.yml

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -47,4 +47,16 @@ spec:
4747
- name: app
4848
configMap:
4949
name: {{ .Release.Name }}-web-app
50+
{{- with $.Values.ui.nodeSelector }}
51+
nodeSelector:
52+
{{- toYaml . | nindent 8 }}
53+
{{- end }}
54+
{{- with $.Values.ui.affinity }}
55+
affinity:
56+
{{- toYaml . | nindent 8 }}
57+
{{- end }}
58+
{{- with $.Values.ui.tolerations }}
59+
tolerations:
60+
{{- toYaml . | nindent 8 }}
61+
{{- end }}
5062
{{- end -}}

charts/azimuth-llm/values.yaml

Lines changed: 13 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -67,7 +67,6 @@ api:
6767
# - secretName: chart-example-tls
6868
# hosts:
6969
# - chart-example.local
70-
7170
# Config for huggingface model cache volume
7271
# This is mounted at /root/.cache/huggingface in the api deployment
7372
cacheVolume:
@@ -97,6 +96,13 @@ api:
9796
# Extra args to supply to the vLLM backend, see
9897
# https://docs.vllm.ai/en/stable/serving/openai_compatible_server.html#command-line-arguments-for-the-server
9998
extraArgs: []
99+
# Pod node selector labels
100+
nodeSelector: {}
101+
# Pod tolerations
102+
tolerations: []
103+
# Pod affinities
104+
affinity: {}
105+
100106
# Configuration for the frontend web interface
101107
ui:
102108
# Toggles installation of the gradio web UI
@@ -155,3 +161,9 @@ ui:
155161
rollingUpdate:
156162
maxSurge: 25%
157163
maxUnavailable: 25%
164+
# Pod node selector labels
165+
nodeSelector: {}
166+
# Pod tolerations
167+
tolerations: []
168+
# Pod affinities
169+
affinity: {}

0 commit comments

Comments
 (0)