Skip to content

Commit 206feed

Browse files
authored
Merge pull request #1166 from nebius/dev
Soperator release 1.21.3
2 parents 64a13e9 + 177bea3 commit 206feed

File tree

62 files changed

+704
-105
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

62 files changed

+704
-105
lines changed

Makefile

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -284,7 +284,8 @@ build: manifests generate fmt vet ## Build manager binary with native toolchain.
284284

285285
.PHONY: run
286286
run: manifests generate fmt vet ## Run a controller from your host with native toolchain.
287-
go run ./cmd/main.go
287+
IS_PROMETHEUS_CRD_INSTALLED=true IS_MARIADB_CRD_INSTALLED=true ENABLE_WEBHOOKS=false IS_APPARMOR_CRD_INSTALLED=true go run cmd/main.go \
288+
-log-level=debug -leader-elect=false -operator-namespace=soperator-system --enable-topology-controller=true
288289

289290
.PHONY: docker-build-go-base
290291
docker-build-go-base: ## Build shared Go base image

VERSION

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
1.21.2
1+
1.21.3

api/v1/slurmcluster_types.go

Lines changed: 16 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -188,10 +188,10 @@ type SlurmConfig struct {
188188
// It is set automatically to `topology/tree` if SlurmTopologyConfigMapRefName is specified.
189189
//
190190
// +kubebuilder:validation:Optional
191+
// +kubebuilder:default="topology/tree"
191192
TopologyPlugin string `json:"topologyPlugin,omitempty"`
192193
// TopologyParam is a list of comma-separated options identifying network topology options.
193194
//
194-
// +kubebuilder:default=topology/tree
195195
TopologyParam string `json:"topologyParam,omitempty"`
196196
}
197197

@@ -649,6 +649,21 @@ type SlurmRest struct {
649649
// +kubebuilder:default=false
650650
Enabled bool `json:"enabled,omitempty"`
651651

652+
// ThreadCount defines the number of threads for slurmrestd
653+
//
654+
// +kubebuilder:validation:Optional
655+
// +kubebuilder:validation:Minimum=2
656+
// +kubebuilder:validation:Maximum=1024
657+
// +kubebuilder:default=3
658+
ThreadCount *int32 `json:"threadCount,omitempty"`
659+
660+
// MaxConnections defines the maximum number of connections for slurmrestd
661+
//
662+
// +kubebuilder:validation:Optional
663+
// +kubebuilder:validation:Minimum=2
664+
// +kubebuilder:default=10
665+
MaxConnections *int32 `json:"maxConnections,omitempty"`
666+
652667
// SlurmRestNode represents the Slurm REST API daemon configuration
653668
//
654669
// +kubebuilder:validation:Optional

api/v1/zz_generated.deepcopy.go

Lines changed: 10 additions & 0 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

api/v1alpha1/activecheck_types.go

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@ type ActiveCheckSpec struct {
2626
// Suspend indicates whether the action is suspended.
2727
// +kubebuilder:validation:Optional
2828
// +kubebuilder:default=true
29-
Suspend bool `json:"suspend,omitempty"`
29+
Suspend *bool `json:"suspend,omitempty"`
3030

3131
// ActiveDeadlineSeconds defines the CronJob timeout in seconds
3232
//
@@ -48,7 +48,7 @@ type ActiveCheckSpec struct {
4848

4949
// RunAfterCreation specifies whether the job should run immediately after the CronJob is created.
5050
// +kubebuilder:default=true
51-
RunAfterCreation bool `json:"runAfterCreation,omitempty"`
51+
RunAfterCreation *bool `json:"runAfterCreation,omitempty"`
5252

5353
// NodeSelector defines the desired selector for the K8s nodes to place Slurm workers on
5454
//

api/v1alpha1/zz_generated.deepcopy.go

Lines changed: 10 additions & 0 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

config/crd/bases/slurm.nebius.ai_slurmclusters.yaml

Lines changed: 16 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3244,11 +3244,11 @@ spec:
32443244
description: Additional parameters for the task plugin
32453245
type: string
32463246
topologyParam:
3247-
default: topology/tree
32483247
description: TopologyParam is list of comma-separated options
32493248
identifying network topology options.
32503249
type: string
32513250
topologyPlugin:
3251+
default: topology/tree
32523252
description: |-
32533253
TopologyPlugin identifies the plugin to determine network topology for optimizations.
32543254
It is set automatically to `topology/tree` if SlurmTopologyConfigMapRefName is specified.
@@ -13515,6 +13515,13 @@ spec:
1351513515
K8sNodeFilterName defines the Kubernetes node filter name associated with the Slurm node.
1351613516
Must correspond to the name of one of [K8sNodeFilter]
1351713517
type: string
13518+
maxConnections:
13519+
default: 10
13520+
description: MaxConnections defines the maximum number of
13521+
connections for slurmrestd
13522+
format: int32
13523+
minimum: 2
13524+
type: integer
1351813525
rest:
1351913526
description: SlurmRestNode represents the Slurm REST API daemon
1352013527
configuration
@@ -13576,6 +13583,14 @@ spec:
1357613583
description: Size defines the number of node instances
1357713584
format: int32
1357813585
type: integer
13586+
threadCount:
13587+
default: 3
13588+
description: ThreadCount defines the number of threads for
13589+
slurmrestd
13590+
format: int32
13591+
maximum: 1024
13592+
minimum: 2
13593+
type: integer
1357913594
required:
1358013595
- k8sNodeFilterName
1358113596
type: object

config/manager/kustomization.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,4 +3,4 @@ resources:
33
images:
44
- name: controller
55
newName: cr.eu-north1.nebius.cloud/soperator/slurm-operator
6-
newTag: 1.21.2
6+
newTag: 1.21.3

config/manager/manager.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -87,7 +87,7 @@ spec:
8787
value: "false"
8888
- name: SLURM_OPERATOR_WATCH_NAMESPACES
8989
value: "*"
90-
image: controller:1.21.2
90+
image: controller:1.21.3
9191
imagePullPolicy: Always
9292
name: manager
9393
securityContext:

config/rbac/clustercontroller/role.yaml

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -84,6 +84,17 @@ rules:
8484
verbs:
8585
- get
8686
- update
87+
- apiGroups:
88+
- coordination.k8s.io
89+
resources:
90+
- leases
91+
verbs:
92+
- create
93+
- get
94+
- list
95+
- patch
96+
- update
97+
- watch
8798
- apiGroups:
8899
- k8s.mariadb.com
89100
resources:

0 commit comments

Comments
 (0)