|
| 1 | +# Copyright 2026 Google LLC |
| 2 | +# |
| 3 | +# Licensed under the Apache License, Version 2.0 (the "License"); |
| 4 | +# you may not use this file except in compliance with the License. |
| 5 | +# You may obtain a copy of the License at |
| 6 | +# |
| 7 | +# http://www.apache.org/licenses/LICENSE-2.0 |
| 8 | +# |
| 9 | +# Unless required by applicable law or agreed to in writing, software |
| 10 | +# distributed under the License is distributed on an "AS IS" BASIS, |
| 11 | +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 12 | +# See the License for the specific language governing permissions and |
| 13 | +# limitations under the License. |
| 14 | + |
| 15 | +--- |
| 16 | + |
| 17 | +blueprint_name: hpc-slurm-kms |
| 18 | + |
| 19 | +vars: # deployment-wide values; referenced below as $(vars.<name>) |
| 20 | + project_id: ## Set GCP Project ID Here ## |
| 21 | +deployment_name: hpc-slurm-kms |
| 22 | +region: us-central1 |
| 23 | +zone: us-central1-a |
| 24 | +kms_key: "projects/my-project/locations/us-central1/keyRings/my-keyring/cryptoKeys/my-key" # NOTE(review): looks like a placeholder - replace before deploying; its location segment (us-central1) matches region above |
| 25 | +kms_service_account: "my-sa@my-project.iam.gserviceaccount.com" # NOTE(review): looks like a placeholder - replace before deploying; passed below as disk_encryption_key_service_account |
| 26 | + |
| 27 | +# Documentation for each of the modules used below can be found at |
| 28 | +# https://github.com/GoogleCloudPlatform/cluster-toolkit/blob/main/modules/README.md |
| 29 | + |
| 30 | +deployment_groups: |
| 31 | +- group: primary |
| 32 | + modules: |
| 33 | +# A source of the form "modules/*" with no ./, ../ or / prefix refers to an |
| 34 | +# embedded module. To refer to a local module instead, prefix the path with ./, ../ or / |
| 35 | +- id: network |
| 36 | +source: modules/network/vpc |
| 37 | + |
| 38 | +# Private Service Access (PSA) requires the compute.networkAdmin role, which is |
| 39 | +# included in the Owner role but not in Editor. |
| 40 | +# PSA is a best practice for Filestore instances; it can optionally be |
| 41 | +# removed by deleting the private_service_access module and every reference to |
| 42 | +# that module in the Filestore modules. |
| 43 | +# https://cloud.google.com/vpc/docs/configure-private-services-access#permissions |
| 44 | +- id: private_service_access |
| 45 | +source: modules/network/private-service-access |
| 46 | +use: [network] |
| 47 | + |
| 48 | +- id: homefs # Filestore file system; listed in slurm_controller's use list below |
| 49 | +source: modules/file-system/filestore |
| 50 | +use: [network, private_service_access] |
| 51 | +settings: # NOTE(review): no KMS setting is applied here, unlike the Slurm modules below - confirm this is intended |
| 52 | +local_mount: /home |
| 53 | + |
| 54 | +- id: debug_nodeset # nodeset consumed by debug_partition below |
| 55 | +source: community/modules/compute/schedmd-slurm-gcp-v6-nodeset |
| 56 | +use: [network] |
| 57 | +settings: |
| 58 | +node_count_dynamic_max: 4 |
| 59 | +machine_type: n2-standard-2 |
| 60 | +allow_automatic_updates: false |
| 61 | +disk_encryption_key_service_account: $(vars.kms_service_account) # service account value from vars |
| 62 | +disk_encryption_key: $(vars.kms_key) # KMS key value from vars |
| 63 | + |
| 64 | +- id: debug_partition # partition named "debug", built from debug_nodeset |
| 65 | +source: community/modules/compute/schedmd-slurm-gcp-v6-partition |
| 66 | +use: |
| 67 | +- debug_nodeset |
| 68 | +settings: |
| 69 | +partition_name: debug |
| 70 | +exclusive: false # non-exclusive: allows nodes to stay up after jobs are done |
| 71 | +is_default: true # the only partition in this blueprint that sets is_default |
| 72 | + |
| 73 | +- id: compute_nodeset # nodeset consumed by compute_partition below |
| 74 | +source: community/modules/compute/schedmd-slurm-gcp-v6-nodeset |
| 75 | +use: [network] |
| 76 | +settings: # NOTE(review): no machine_type is set here, unlike debug_nodeset and h3_nodeset - presumably the module default applies; confirm |
| 77 | +node_count_dynamic_max: 20 |
| 78 | +bandwidth_tier: gvnic_enabled |
| 79 | +allow_automatic_updates: false |
| 80 | +disk_encryption_key: $(vars.kms_key) # KMS key value from vars |
| 81 | +disk_encryption_key_service_account: $(vars.kms_service_account) # service account value from vars |
| 82 | + |
| 83 | +- id: compute_partition # partition named "compute", built from compute_nodeset |
| 84 | +source: community/modules/compute/schedmd-slurm-gcp-v6-partition |
| 85 | +use: |
| 86 | +- compute_nodeset |
| 87 | +settings: |
| 88 | +partition_name: compute |
| 89 | + |
| 90 | +- id: h3_nodeset # nodeset consumed by h3_partition below |
| 91 | +source: community/modules/compute/schedmd-slurm-gcp-v6-nodeset |
| 92 | +use: [network] |
| 93 | +settings: |
| 94 | +node_count_dynamic_max: 20 |
| 95 | +# H3 is available only in specific zones: https://cloud.google.com/compute/docs/regions-zones |
| 96 | +machine_type: h3-standard-88 |
| 97 | +# H3 supports neither pd-ssd nor pd-standard, hence pd-balanced below |
| 98 | +# https://cloud.google.com/compute/docs/compute-optimized-machines#h3_disks |
| 99 | +disk_type: pd-balanced |
| 100 | +bandwidth_tier: gvnic_enabled |
| 101 | +allow_automatic_updates: false |
| 102 | +disk_encryption_key: $(vars.kms_key) # KMS key value from vars |
| 103 | +disk_encryption_key_service_account: $(vars.kms_service_account) # service account value from vars |
| 104 | + |
| 105 | +- id: h3_partition # partition named "h3", built from h3_nodeset |
| 106 | +source: community/modules/compute/schedmd-slurm-gcp-v6-partition |
| 107 | +use: |
| 108 | +- h3_nodeset |
| 109 | +settings: |
| 110 | +partition_name: h3 |
| 111 | + |
| 112 | +- id: slurm_login # login module; listed in slurm_controller's use list below |
| 113 | +source: community/modules/scheduler/schedmd-slurm-gcp-v6-login |
| 114 | +use: [network] |
| 115 | +settings: |
| 116 | +machine_type: n2-standard-4 |
| 117 | +enable_login_public_ips: true |
| 118 | +disk_encryption_key: $(vars.kms_key) # KMS key value from vars |
| 119 | +disk_encryption_key_service_account: $(vars.kms_service_account) # service account value from vars |
| 120 | + |
| 121 | +- id: slurm_controller |
| 122 | +source: community/modules/scheduler/schedmd-slurm-gcp-v6-controller |
| 123 | +use: # the network, all three partitions, the homefs file system and the login module |
| 124 | +- network |
| 125 | +- debug_partition |
| 126 | +- compute_partition |
| 127 | +- h3_partition |
| 128 | +- homefs |
| 129 | +- slurm_login |
| 130 | +settings: |
| 131 | +enable_controller_public_ips: true |
| 132 | +disk_encryption_key: $(vars.kms_key) # KMS key value from vars |
| 133 | +disk_encryption_key_service_account: $(vars.kms_service_account) # service account value from vars |
| 134 | +slurm_bucket_kms_key: $(vars.kms_key) # same vars.kms_key value as disk_encryption_key above |
0 commit comments