|
1 | 1 | # RayCluster
|
2 | 2 |
|
3 |
| -RayCluster is a custom resource definition (CRD). **KubeRay operator** will listen to the resource |
4 |
| -events about RayCluster and create related Kubernetes resources (e.g. Pod & Service). Hence, |
5 |
| -**KubeRay operator** installation and **CRD** registration are required for this guide. |
| 3 | + |
| 4 | + |
| 5 | +A Helm chart for deploying a RayCluster with the KubeRay operator. |
| 6 | + |
| 7 | +**Homepage:** <https://github.com/ray-project/kuberay> |
| 8 | + |
| 9 | +## Introduction |
| 10 | + |
| 11 | +RayCluster is a custom resource definition (CRD). |
| 12 | +The KubeRay operator listens for RayCluster resource events and creates the related Kubernetes resources |
| 13 | +(e.g., Pods and Services). |
| 14 | +Hence, installing the KubeRay operator and registering the CRD are required for this guide. |
6 | 15 |
|
7 | 16 | ## Prerequisites
|
8 | 17 |
|
@@ -58,3 +67,96 @@ helm uninstall raycluster
|
58 | 67 | ```
|
59 | 68 |
|
60 | 69 | [kuberay-operator/README.md]: https://github.com/ray-project/kuberay/blob/master/helm-chart/kuberay-operator/README.md
|
| 70 | + |
| 71 | +## Values |
| 72 | + |
| 73 | +| Key | Type | Default | Description | |
| 74 | +|-----|------|---------|-------------| |
| 75 | +| image.repository | string | `"rayproject/ray"` | Image repository. | |
| 76 | +| image.tag | string | `"2.46.0"` | Image tag. | |
| 77 | +| image.pullPolicy | string | `"IfNotPresent"` | Image pull policy. | |
| 78 | +| nameOverride | string | `"kuberay"` | String to partially override release name. | |
| 79 | +| fullnameOverride | string | `""` | String to fully override release name. | |
| 80 | +| imagePullSecrets | list | `[]` | Secrets with credentials to pull images from a private registry | |
| 81 | +| common.containerEnv | list | `[]` | containerEnv specifies environment variables for the Ray head and worker containers. Follows standard K8s container env schema. | |
| 82 | +| head.initContainers | list | `[]` | Init containers to add to the head pod | |
| 83 | +| head.labels | object | `{}` | Labels for the head pod | |
| 84 | +| head.serviceAccountName | string | `""` | | |
| 85 | +| head.restartPolicy | string | `""` | | |
| 86 | +| head.containerEnv | list | `[]` | | |
| 87 | +| head.envFrom | list | `[]` | envFrom to pass to head pod | |
| 88 | +| head.resources.limits.cpu | string | `"1"` | | |
| 89 | +| head.resources.limits.memory | string | `"2G"` | | |
| 90 | +| head.resources.requests.cpu | string | `"1"` | | |
| 91 | +| head.resources.requests.memory | string | `"2G"` | | |
| 92 | +| head.annotations | object | `{}` | Extra annotations for head pod | |
| 93 | +| head.nodeSelector | object | `{}` | Node labels for head pod assignment | |
| 94 | +| head.tolerations | list | `[]` | Node tolerations for head pod scheduling to nodes with taints | |
| 95 | +| head.affinity | object | `{}` | Head pod affinity | |
| 96 | +| head.podSecurityContext | object | `{}` | Head pod security context. | |
| 97 | +| head.securityContext | object | `{}` | Ray container security context. | |
| 98 | +| head.volumes[0].name | string | `"log-volume"` | | |
| 99 | +| head.volumes[0].emptyDir | object | `{}` | | |
| 100 | +| head.volumeMounts[0].mountPath | string | `"/tmp/ray"` | | |
| 101 | +| head.volumeMounts[0].name | string | `"log-volume"` | | |
| 102 | +| head.sidecarContainers | list | `[]` | | |
| 103 | +| head.command | list | `[]` | | |
| 104 | +| head.args | list | `[]` | | |
| 105 | +| head.headService | object | `{}` | | |
| 106 | +| head.topologySpreadConstraints | list | `[]` | | |
| 107 | +| worker.groupName | string | `"workergroup"` | The name of the workergroup | |
| 108 | +| worker.replicas | int | `1` | The number of replicas for the worker pod | |
| 109 | +| worker.minReplicas | int | `1` | The minimum number of replicas for the worker pod | |
| 110 | +| worker.maxReplicas | int | `3` | The maximum number of replicas for the worker pod | |
| 111 | +| worker.labels | object | `{}` | Labels for the worker pod | |
| 112 | +| worker.serviceAccountName | string | `""` | | |
| 113 | +| worker.restartPolicy | string | `""` | | |
| 114 | +| worker.initContainers | list | `[]` | Init containers to add to the worker pod | |
| 115 | +| worker.containerEnv | list | `[]` | | |
| 116 | +| worker.envFrom | list | `[]` | envFrom to pass to worker pod | |
| 117 | +| worker.resources.limits.cpu | string | `"1"` | | |
| 118 | +| worker.resources.limits.memory | string | `"1G"` | | |
| 119 | +| worker.resources.requests.cpu | string | `"1"` | | |
| 120 | +| worker.resources.requests.memory | string | `"1G"` | | |
| 121 | +| worker.annotations | object | `{}` | Extra annotations for worker pod | |
| 122 | +| worker.nodeSelector | object | `{}` | Node labels for worker pod assignment | |
| 123 | +| worker.tolerations | list | `[]` | Node tolerations for worker pod scheduling to nodes with taints | |
| 124 | +| worker.affinity | object | `{}` | Worker pod affinity | |
| 125 | +| worker.podSecurityContext | object | `{}` | Worker pod security context. | |
| 126 | +| worker.securityContext | object | `{}` | Ray container security context. | |
| 127 | +| worker.volumes[0].name | string | `"log-volume"` | | |
| 128 | +| worker.volumes[0].emptyDir | object | `{}` | | |
| 129 | +| worker.volumeMounts[0].mountPath | string | `"/tmp/ray"` | | |
| 130 | +| worker.volumeMounts[0].name | string | `"log-volume"` | | |
| 131 | +| worker.sidecarContainers | list | `[]` | | |
| 132 | +| worker.command | list | `[]` | | |
| 133 | +| worker.args | list | `[]` | | |
| 134 | +| worker.topologySpreadConstraints | list | `[]` | | |
| 135 | +| additionalWorkerGroups.smallGroup.disabled | bool | `true` | | |
| 136 | +| additionalWorkerGroups.smallGroup.replicas | int | `0` | The number of replicas for the additional worker pod | |
| 137 | +| additionalWorkerGroups.smallGroup.minReplicas | int | `0` | The minimum number of replicas for the additional worker pod | |
| 138 | +| additionalWorkerGroups.smallGroup.maxReplicas | int | `3` | The maximum number of replicas for the additional worker pod | |
| 139 | +| additionalWorkerGroups.smallGroup.labels | object | `{}` | Labels for the additional worker pod | |
| 140 | +| additionalWorkerGroups.smallGroup.serviceAccountName | string | `""` | | |
| 141 | +| additionalWorkerGroups.smallGroup.restartPolicy | string | `""` | | |
| 142 | +| additionalWorkerGroups.smallGroup.containerEnv | list | `[]` | | |
| 143 | +| additionalWorkerGroups.smallGroup.envFrom | list | `[]` | envFrom to pass to additional worker pod | |
| 144 | +| additionalWorkerGroups.smallGroup.resources.limits.cpu | int | `1` | | |
| 145 | +| additionalWorkerGroups.smallGroup.resources.limits.memory | string | `"1G"` | | |
| 146 | +| additionalWorkerGroups.smallGroup.resources.requests.cpu | int | `1` | | |
| 147 | +| additionalWorkerGroups.smallGroup.resources.requests.memory | string | `"1G"` | | |
| 148 | +| additionalWorkerGroups.smallGroup.annotations | object | `{}` | Extra annotations for additional worker pod | |
| 149 | +| additionalWorkerGroups.smallGroup.nodeSelector | object | `{}` | Node labels for additional worker pod assignment | |
| 150 | +| additionalWorkerGroups.smallGroup.tolerations | list | `[]` | Node tolerations for additional worker pod scheduling to nodes with taints | |
| 151 | +| additionalWorkerGroups.smallGroup.affinity | object | `{}` | Additional worker pod affinity | |
| 152 | +| additionalWorkerGroups.smallGroup.podSecurityContext | object | `{}` | Additional worker pod security context. | |
| 153 | +| additionalWorkerGroups.smallGroup.securityContext | object | `{}` | Ray container security context. | |
| 154 | +| additionalWorkerGroups.smallGroup.volumes[0].name | string | `"log-volume"` | | |
| 155 | +| additionalWorkerGroups.smallGroup.volumes[0].emptyDir | object | `{}` | | |
| 156 | +| additionalWorkerGroups.smallGroup.volumeMounts[0].mountPath | string | `"/tmp/ray"` | | |
| 157 | +| additionalWorkerGroups.smallGroup.volumeMounts[0].name | string | `"log-volume"` | | |
| 158 | +| additionalWorkerGroups.smallGroup.sidecarContainers | list | `[]` | | |
| 159 | +| additionalWorkerGroups.smallGroup.command | list | `[]` | | |
| 160 | +| additionalWorkerGroups.smallGroup.args | list | `[]` | | |
| 161 | +| additionalWorkerGroups.smallGroup.topologySpreadConstraints | list | `[]` | | |
| 162 | +| service.type | string | `"ClusterIP"` | | |
0 commit comments