Skip to content

Commit 354ce1e

Browse files
committed
add CI tests for compute node rebuilds
1 parent b820632 commit 354ce1e

File tree

1 file changed

+8
-19
lines changed

1 file changed

+8
-19
lines changed

.github/workflows/stackhpc.yml

Lines changed: 8 additions & 19 deletions
Original file line number | Diff line number | Diff line change
@@ -170,33 +170,22 @@ jobs:
170 170
env:
171 171
TESTUSER_PASSWORD: ${{ secrets.TEST_USER_PASSWORD }}
172 172

173-
# - name: Build environment-specific compute image
174-
# id: packer_build
175-
# run: |
176-
# . venv/bin/activate
177-
# . environments/.stackhpc/activate
178-
# cd packer/
179-
# packer init
180-
# PACKER_LOG=1 packer build -except openstack.fatimage -on-error=ask -var-file=$PKR_VAR_environment_root/builder.pkrvars.hcl openstack.pkr.hcl
181-
# ../dev/output_manifest.py packer-manifest.json # Sets NEW_COMPUTE_IMAGE_ID outputs
182-
183-
# - name: Test reimage of compute nodes to new environment-specific image (via slurm)
184-
# run: |
185-
# . venv/bin/activate
186-
# . environments/.stackhpc/activate
187-
# ansible login -v -a "sudo scontrol reboot ASAP nextstate=RESUME reason='rebuild image:${{ steps.packer_build.outputs.NEW_COMPUTE_IMAGE_ID }}' ${TF_VAR_cluster_name}-compute-[0-3]"
188-
# ansible compute -m wait_for_connection -a 'delay=60 timeout=600' # delay allows node to go down
189-
# ansible-playbook -v ansible/ci/check_slurm.yml
190-
191 173
- name: Test reimage of login and control nodes (via rebuild adhoc)
192 174
run: |
193 175
. venv/bin/activate
194 176
. environments/.stackhpc/activate
195 177
ansible-playbook -v --limit control,login ansible/adhoc/rebuild.yml
196-
ansible all -m wait_for_connection -a 'delay=60 timeout=600' # delay allows node to go down
197 178
ansible-playbook -v ansible/site.yml
198 179
ansible-playbook -v ansible/ci/check_slurm.yml
199 180
181+
- name: Test reimage of compute nodes and compute-init (via rebuild adhoc)
182+
run: |
183+
. venv/bin/activate
184+
. environments/.stackhpc/activate
185+
ansible-playbook -v --limit compute ansible/adhoc/rebuild.yml
186+
ansible all -m wait_for_connection -a 'delay=60 timeout=600' # delay allows node to go down
187+
ansible-playbook -v ansible/ci/check_slurm.yml
188+
200 189
- name: Check sacct state survived reimage
201 190
run: |
202 191
. venv/bin/activate

0 commit comments

Comments
 (0)