File tree Expand file tree Collapse file tree 15 files changed +3
-362
lines changed
environments/common/inventory Expand file tree Collapse file tree 15 files changed +3
-362
lines changed Original file line number Diff line number Diff line change @@ -32,11 +32,11 @@ jobs:
32
32
- image_name : openhpc-extra-RL8
33
33
source_image_name_key : RL8 # key into environments/.stackhpc/tofu/cluster_image.auto.tfvars.json
34
34
inventory_groups : doca,cuda,lustre
35
- volume_size : 35 # needed for cuda
35
+ volume_size : 30 # needed for cuda
36
36
- image_name : openhpc-extra-RL9
37
37
source_image_name_key : RL9
38
38
inventory_groups : doca,cuda,lustre
39
- volume_size : 35 # needed for cuda
39
+ volume_size : 30 # needed for cuda
40
40
env :
41
41
ANSIBLE_FORCE_COLOR : True
42
42
OS_CLOUD : openstack
Original file line number Diff line number Diff line change @@ -90,7 +90,5 @@ roles/*
90
90
! roles /gateway /**
91
91
! roles /alertmanager /
92
92
! roles /alertmanager /**
93
- ! roles /slurm_recompile /**
94
- ! roles /slurm_recompile /**
95
93
! roles /nhc /
96
94
! roles /nhc /**
Original file line number Diff line number Diff line change 48
48
name : cuda
49
49
tasks_from : " {{ 'runtime.yml' if appliances_mode == 'configure' else 'install.yml' }}"
50
50
51
- - name : Setup vGPU
52
- hosts : vgpu
53
- become : yes
54
- gather_facts : yes
55
- tags : vgpu
56
- tasks :
57
- - include_role :
58
- name : stackhpc.linux.vgpu
59
- tasks_from : " {{ 'configure.yml' if appliances_mode == 'configure' else 'install.yml' }}"
60
- handlers :
61
- - name : reboot
62
- fail :
63
- msg : Reboot handler for stackhpc.linux.vgpu role fired unexpectedly. This was supposed to be unreachable.
64
-
65
51
- name : Persist hostkeys across rebuilds
66
52
# Must be after filesystems.yml (for storage)
67
53
# and before portal.yml (where OOD login node hostkeys are scanned)
Original file line number Diff line number Diff line change 250
250
name : cloudalchemy.grafana
251
251
tasks_from : install.yml
252
252
253
- - name : Add support for NVIDIA GPU auto detection to Slurm
254
- hosts : cuda
255
- become : yes
256
- tasks :
257
- - name : Recompile slurm
258
- import_role :
259
- name : slurm_recompile
260
- vars :
261
- slurm_recompile_with_nvml : " {{ groups.cuda | length > 0 }}"
262
-
263
253
- name : Run post.yml hook
264
254
vars :
265
255
appliances_environment_root : " {{ lookup('env', 'APPLIANCES_ENVIRONMENT_ROOT') }}"
Original file line number Diff line number Diff line change @@ -75,7 +75,6 @@ it also requires an image build with the role name added to the
75
75
| extras.yml | basic_users | All functionality [ 6] | No |
76
76
| extras.yml | eessi | All functionality [ 7] | No |
77
77
| extras.yml | cuda | None required - use image build | Yes [ 8] |
78
- | extras.yml | vgpu | All functionality | Yes |
79
78
| extras.yml | persist_hostkeys | Not relevant for compute nodes | n/a |
80
79
| extras.yml | compute_init (export) | Not relevant for compute nodes | n/a |
81
80
| extras.yml | k9s (install) | Not relevant during boot | n/a |
Original file line number Diff line number Diff line change 19
19
enable_basic_users : " {{ os_metadata.meta.basic_users | default(false) | bool }}"
20
20
enable_eessi : " {{ os_metadata.meta.eessi | default(false) | bool }}"
21
21
enable_chrony : " {{ os_metadata.meta.chrony | default(false) | bool }}"
22
- enable_vgpu : " {{ os_metadata.meta.vpgu | default(false) | bool }}"
23
22
enable_nhc : " {{ os_metadata.meta.nhc | default(false) | bool }}"
24
23
25
24
# TODO: "= role defaults" - could be moved to a vars_file: on play with similar precedence effects
297
296
cmd : " cvmfs_config setup"
298
297
when : enable_eessi
299
298
300
- - name : Configure VGPUs
301
- include_role :
302
- name : stackhpc.linux.vgpu
303
- tasks_from : ' configure.yml'
304
- when : enable_vgpu
305
-
306
299
# NB: don't need conditional block on enable_compute as have already exited
307
300
# if not the case
308
301
- name : Write Munge key
Load Diff This file was deleted.
Load Diff This file was deleted.
Load Diff This file was deleted.
Load Diff This file was deleted.
You can’t perform that action at this time.
0 commit comments