5 files changed: +10 -9 lines changed
Original file line number Diff line number Diff line change @@ -178,7 +178,7 @@ jobs:
178178 ansible-playbook -v ansible/site.yml
179179 ansible-playbook -v ansible/ci/check_slurm.yml
180180
181- - name : Test compute node reimage, compute-init, and reboot
181+ - name : Test compute node reboot and compute-init
182182 run : |
183183 . venv/bin/activate
184184 . environments/.stackhpc/activate
Original file line number Diff line number Diff line change 1- # Reboot compute nodes via slurm. The nodes will be rebuilt if image in hostvars is different to the active one in OpenStack .
1+ # Reboot compute nodes via slurm. Nodes will be rebuilt if `image_id` in inventory is different to the currently-provisioned image .
22# Example:
33# ansible-playbook -v ansible/adhoc/reboot_via_slurm.yml
44
55- hosts : login
6+ run_once : true
67 become : yes
78 gather_facts : no
89 tasks :
1415 register : slurm_result
1516 failed_when : slurm_result.rc != 0
1617
17- - name : Fetch Slurm logs if reboot fails
18+ - name : Fetch Slurm controller logs if reboot fails
1819 ansible.builtin.shell : |
1920 journalctl -u slurmctld --since "10 minutes ago" | tail -n 50
2021 become_user : root
Original file line number Diff line number Diff line change @@ -35,7 +35,7 @@ openhpc_config_default:
3535 SlurmctldParameters :
3636 - enable_configless
3737 TaskPlugin : task/cgroup,task/affinity
38- ReturnToService : 2
38+ ReturnToService : 2 # is stackhpc.openhpc default, but templating bug means it is needed here too
3939openhpc_config_rebuild :
4040 RebootProgram : /opt/slurm-tools/bin/slurm-openstack-rebuild
4141 SlurmctldParameters :
Original file line number Diff line number Diff line change 6262# All hosts requiring control of SELinux status.
6363cluster
6464
65+ [rebuild]
66+ # Enable rebuild of nodes on an OpenStack cloud; add 'control' group.
67+
6568[update]
6669# All hosts to (optionally) run yum update on.
6770
@@ -162,6 +165,3 @@ extra_packages
162165
163166[pulp]
164167# Add builder to this group to enable automatically syncing of pulp during image build
165-
166- [rebuild]
167- # Enable rebuild of nodes on an OpenStack cloud; add 'control' group.
Original file line number Diff line number Diff line change @@ -25,6 +25,8 @@ control
2525[filebeat:children]
2626slurm_stats
2727
28+ # NB: [rebuild] not defined here as likely to need features not currently supported
29+
2830[update:children]
2931
3032[fail2ban:children]
@@ -109,5 +111,3 @@ control
109111[extra_packages:children]
110112# Hosts to install specified additional packages on
111113builder
112-
113- # NB: [rebuild] not defined here as likely to need features not currently supported
You can’t perform that action at this time.
0 commit comments