Skip to content

Commit 35724c1

Browse files
committed
Merge branch 'main' into update/openhpc-b64-mungekey
2 parents 0dc629c + 642d500 commit 35724c1

File tree

18 files changed

+106
-42
lines changed

18 files changed

+106
-42
lines changed

.github/workflows/fatimage.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,7 @@ jobs:
3131
source_image_name: Rocky-8-GenericCloud-Base-8.10-20240528.0.x86_64.raw
3232
inventory_groups: control,compute,login,update
3333
- image_name: openhpc-RL9
34-
source_image_name: Rocky-9-GenericCloud-Base-9.5-20241118.0.x86_64.raw
34+
source_image_name: Rocky-9-GenericCloud-Base-9.6-20250531.0.x86_64.qcow2
3535
inventory_groups: control,compute,login,update
3636
env:
3737
ANSIBLE_FORCE_COLOR: True

.github/workflows/stackhpc.yml

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -9,8 +9,7 @@ on:
99
- '**'
1010
- '!dev/**'
1111
- 'dev/setup-env.sh'
12-
- '!docs/**'
13-
- '!README.md'
12+
- '!**.md'
1413
- '!.gitignore'
1514
- '!.github/workflows/'
1615
- '.github/workflows/stackhpc'
@@ -19,8 +18,7 @@ on:
1918
- '**'
2019
- '!dev/**'
2120
- 'dev/setup-env.sh'
22-
- '!docs/**'
23-
- '!README.md'
21+
- '!**.md'
2422
- '!.gitignore'
2523
- '!.github/workflows/'
2624
- '.github/workflows/stackhpc'

ansible/fatimage.yml

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -190,6 +190,11 @@
190190
tasks_from: install.yml
191191
when: "'alertmanager' in group_names"
192192

193+
- name: Download HPL source
194+
include_role:
195+
name: hpctests
196+
tasks_from: source-hpl.yml
197+
193198
- hosts: prometheus
194199
become: yes
195200
gather_facts: yes
@@ -262,7 +267,7 @@
262267
name: grafana-dashboards
263268

264269
- name: Add support for NVIDIA GPU auto detection to Slurm
265-
hosts: cuda
270+
hosts: slurm_recompile
266271
become: yes
267272
tasks:
268273
- name: Recompile slurm

ansible/roles/dnf_repos/defaults/main.yml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -47,7 +47,8 @@ dnf_repos_openhpc_repolist:
4747
file: OpenHPC
4848
base_url: "{{ dnf_repos_pulp_content_url }}/{{ appliances_pulp_repos.openhpc_updates[ansible_distribution_major_version] | appliances_repo_to_subpath }}"
4949

50-
dnf_repos_repolist: "{{ dnf_repos_default_repolist + (dnf_repos_openhpc_repolist if (openhpc_install_type | default('ohpc')) == 'ohpc' else []) }}"
50+
dnf_repos_extra_repolist: []
51+
dnf_repos_repolist: "{{ dnf_repos_default_repolist + (dnf_repos_openhpc_repolist if (openhpc_install_type | default('ohpc')) == 'ohpc' else []) + dnf_repos_extra_repolist }}"
5152

5253
dnf_repos_epel_baseurl: "{{ dnf_repos_pulp_content_url }}/{{ appliances_pulp_repos.epel[ansible_distribution_major_version] | appliances_repo_to_subpath }}"
5354
dnf_repos_epel_description: "epel"

ansible/roles/hpctests/tasks/build-hpl.yml

Lines changed: 11 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -5,18 +5,21 @@
55
path: "{{ hpctests_rootdir }}/hpl"
66
state: directory
77

8-
- name: Download HPL sources
8+
- name: Unarchive HPL sources from /opt/hpl
99
unarchive:
10-
src: "http://www.netlib.org/benchmark/hpl/hpl-{{ hpctests_hpl_version }}.tar.gz"
11-
remote_src: yes
10+
src: "/opt/hpl/hpl-{{ hpctests_hpl_version }}.tar.gz"
1211
dest: "{{ hpctests_rootdir }}/hpl"
12+
remote_src: yes
13+
owner: "{{ hpctests_user }}"
14+
group: "{{ hpctests_group }}"
15+
mode: '0755'
1316
keep_newer: yes
1417

15-
- name: Copy BLAS make file
16-
command:
17-
cmd: "cp setup/Make.Linux_PII_CBLAS Make.{{ hpctests_hpl_arch }}"
18-
chdir: "{{ hpctests_hpl_srcdir }}"
19-
creates: "{{ hpctests_hpl_srcdir }}/Make.{{ hpctests_hpl_arch }}"
18+
- name: Copy BLAS makefile
19+
copy:
20+
src: "{{ hpctests_hpl_srcdir }}/setup/Make.Linux_PII_CBLAS"
21+
dest: "{{ hpctests_hpl_srcdir }}/Make.{{ hpctests_hpl_arch }}"
22+
remote_src: yes
2023

2124
- name: Modify make file
2225
replace:
Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,17 @@
1+
---
2+
3+
- name: Make directory
4+
file:
5+
path: "/opt/hpl"
6+
state: directory
7+
owner: root
8+
group: root
9+
mode: '0755'
10+
11+
- name: Download HPL tarball
12+
get_url:
13+
url: "http://www.netlib.org/benchmark/hpl/hpl-{{ hpctests_hpl_version }}.tar.gz"
14+
dest: "/opt/hpl/hpl-{{ hpctests_hpl_version }}.tar.gz"
15+
owner: root
16+
group: root
17+
mode: '0644'

ansible/roles/lustre/README.md

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -19,10 +19,8 @@ The following variables control configuration of Lustre clients.
1919
- `lustre_mount_options`. Optional default mount options. Default values are systemd defaults from [Lustre client docs](http://wiki.lustre.org/Mounting_a_Lustre_File_System_on_Client_Nodes).
2020

2121
The following variables control the package build and install:
22-
- `lustre_version`: Optional str. Version of lustre to build, default `2.15.6/lu-18085`
23-
which is the first version with EL9.5 support, plus a fix for https://jira.whamcloud.com/browse/LU-18085.
24-
- `lustre_repo`: Optional str. URL for Lustre repo. Default is a StackHPC repo
25-
incorporating the above fix.
22+
- `lustre_version`: Optional str. Version of lustre to build, default `2.15.7`
23+
- `lustre_repo`: Optional str. URL for Lustre repo. Default is `git://git.whamcloud.com/fs/lustre-release.git`.
2624
- `lustre_build_packages`: Optional list. Prerequisite packages required to build Lustre. See `defaults/main.yml`.
2725
- `lustre_build_dir`: Optional str. Path to build lustre at, default `/tmp/lustre-release`.
2826
- `lustre_configure_opts`: Optional list. Options to `./configure` command. Default builds client rpms supporting Mellanox OFED, without support for GSS keys.

ansible/roles/lustre/defaults/main.yml

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,13 +1,12 @@
1-
lustre_repo: https://github.com/stackhpc/lustre-release.git
2-
lustre_version: '2.15.6/lu-18085' # Fixes https://jira.whamcloud.com/browse/LU-18085
1+
lustre_version: '2.15.7'
32
lustre_lnet_label: tcp
43
#lustre_mgs_nid:
54
lustre_mounts: []
65
lustre_mount_state: mounted
76
lustre_mount_options: 'defaults,_netdev,noauto,x-systemd.automount,x-systemd.requires=lnet.service,nosuid,nodev'
87

98
# below variables are for build and should not generally require changes
10-
lustre_git_repo: "git://git.whamcloud.com/fs/lustre-release.git"
9+
lustre_repo: "git://git.whamcloud.com/fs/lustre-release.git"
1110
lustre_build_packages:
1211
- "kernel-devel-{{ ansible_kernel }}"
1312
- git

ansible/roles/ofed/README.md

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,10 @@
11
# ofed
22

3+
> [!IMPORTANT]
4+
> This role is deprecated - it is not regularly maintained and StackHPC CI
5+
> does not test that it works. Consider using [ansible/roles/doca](../doca/README.md)
6+
> instead.
7+
38
This role installs Mellanox OFED:
49
- It checks that the running kernel is the latest installed one, and errors if not.
510
- Installation uses the `mlnxofedinstall` command, with support for the running kernel

ansible/roles/proxy/defaults/main.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# proxy_http_proxy:
22
proxy_https_proxy: "{{ proxy_http_proxy }}"
3-
proxy_no_proxy_defaults: "{{ ['localhost', '127.0.0.1'] + groups['all'] + hostvars.values() | map(attribute='ansible_host') }}"
3+
proxy_no_proxy_defaults: "{{ ['localhost', '127.0.0.1', '169.254.169.254'] + groups['all'] + hostvars.values() | map(attribute='ansible_host') }}"
44
proxy_no_proxy_extras: []
55
proxy_no_proxy: "{{ (proxy_no_proxy_defaults + proxy_no_proxy_extras) | unique | sort | join(',') }}"
66
proxy_dnf: true

0 commit comments

Comments
 (0)