diff --git a/.github/workflows/extra.yml b/.github/workflows/extra.yml index dece242ce..bf438c336 100644 --- a/.github/workflows/extra.yml +++ b/.github/workflows/extra.yml @@ -8,12 +8,14 @@ on: - 'environments/.stackhpc/terraform/cluster_image.auto.tfvars.json' - 'ansible/roles/doca/**' - 'ansible/roles/cuda/**' + - 'ansible/roles/lustre/**' - '.github/workflows/extra.yml' pull_request: paths: - 'environments/.stackhpc/terraform/cluster_image.auto.tfvars.json' - 'ansible/roles/doca/**' - 'ansible/roles/cuda/**' + - 'ansible/roles/lustre/**' - '.github/workflows/extra.yml' jobs: @@ -29,11 +31,11 @@ jobs: build: - image_name: openhpc-extra-RL8 source_image_name_key: RL8 # key into environments/.stackhpc/terraform/cluster_image.auto.tfvars.json - inventory_groups: doca,cuda + inventory_groups: doca,cuda,lustre volume_size: 30 # needed for cuda - image_name: openhpc-extra-RL9 source_image_name_key: RL9 - inventory_groups: doca,cuda + inventory_groups: doca,cuda,lustre volume_size: 30 # needed for cuda env: ANSIBLE_FORCE_COLOR: True diff --git a/ansible/fatimage.yml b/ansible/fatimage.yml index 9f1e9107c..9a8828a35 100644 --- a/ansible/fatimage.yml +++ b/ansible/fatimage.yml @@ -230,14 +230,6 @@ name: cloudalchemy.grafana tasks_from: install.yml -- hosts: doca - become: yes - gather_facts: yes - tasks: - - name: Install NVIDIA DOCA - import_role: - name: doca - - name: Run post.yml hook vars: appliances_environment_root: "{{ lookup('env', 'APPLIANCES_ENVIRONMENT_ROOT') }}" diff --git a/ansible/roles/lustre/README.md b/ansible/roles/lustre/README.md index c0a25e037..3ba0dad56 100644 --- a/ansible/roles/lustre/README.md +++ b/ansible/roles/lustre/README.md @@ -8,7 +8,7 @@ Install and configure a Lustre client. This builds RPM packages from source. ## Role Variables -- `lustre_version`: Optional str. Version of lustre to build, default `2.15.5` which is the first version with EL9 support +- `lustre_version`: Optional str. 
Version of Lustre to build. Default `2.15.6`, which is the first version with EL9.5 support. - `lustre_lnet_label`: Optional str. The "lnet label" part of the host's NID, e.g. `tcp0`. Only the `tcp` protocol type is currently supported. Default `tcp`. - `lustre_mgs_nid`: Required str. The NID(s) for the MGS, e.g. `192.168.227.11@tcp1` (separate mutiple MGS NIDs using `:`). - `lustre_mounts`: Required list. Define Lustre filesystems and mountpoints as a list of dicts with keys: diff --git a/ansible/roles/lustre/defaults/main.yml b/ansible/roles/lustre/defaults/main.yml index be008ad55..40389970c 100644 --- a/ansible/roles/lustre/defaults/main.yml +++ b/ansible/roles/lustre/defaults/main.yml @@ -1,4 +1,4 @@ -lustre_version: '2.15.5' # https://www.lustre.org/lustre-2-15-5-released/ +lustre_version: '2.15.6' # https://www.lustre.org/lustre-2-15-6-released/ lustre_lnet_label: tcp #lustre_mgs_nid: lustre_mounts: [] diff --git a/ansible/roles/lustre/tasks/install.yml b/ansible/roles/lustre/tasks/install.yml index e0af857cf..852b4652f 100644 --- a/ansible/roles/lustre/tasks/install.yml +++ b/ansible/roles/lustre/tasks/install.yml @@ -41,30 +41,9 @@ ansible.builtin.dnf: name: "{{ _lustre_find_rpms.files | map(attribute='path')}}" disable_gpg_check: yes - -- block: - - name: Remove lustre build prerequisites - # NB Only remove ones this role installed which weren't upgrades - ansible.builtin.dnf: - name: "{{ _new_pkgs }}" - state: absent - vars: - _installed_pkgs: | - {{ - _lustre_dnf_build_packages.results | - select('match', 'Installed:') | - map('regex_replace', '^Installed: (.+?)-[0-9].*$', '\1') - }} - _removed_pkgs: | - {{ - _lustre_dnf_build_packages.results | - select('match', 'Removed:') | - map('regex_replace', '^Removed: (.+?)-[0-9].*$', '\1') - }} - _new_pkgs: "{{ _installed_pkgs | difference(_removed_pkgs) }}" - - - name: Delete lustre build dir - file: - path: "{{ lustre_build_dir }}" - state: absent + +- name: Delete lustre build dir + file: + path: "{{ 
lustre_build_dir }}" + state: absent when: lustre_build_cleanup | bool