We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ad40723 commit f3e25c0 (Copy full SHA for f3e25c0)
charts/azimuth-llm/values.yaml
@@ -66,8 +66,12 @@ api:
66
gpus: 1
67
# The update strategy to use for the deployment
68
# See https://kubernetes.io/docs/concepts/workloads/controllers/deployment/#updating-a-deployment
69
- # NOTE: Changing this has implications for the number of additional GPU worker nodes required
70
- # to preform a rolling zero-downtime update
+ # NOTE: The following RollingUpdate strategy offers a zero-downtime update but requires additional GPU worker nodes.
+ # updateStrategy:
71
+ # type: RollingUpdate
72
+ # rollingUpdate:
73
+ # maxSurge: 1
74
+ # maxUnavailable: 0
75
updateStrategy:
76
type: Recreate
77
# The value of the vLLM backend's max_model_len argument (if the model's default is not suitable)
0 commit comments