Skip to content

Commit 2c0c787

Browse files
committed
Merge branch 'feat/alertmanager' of github.com:stackhpc/ansible-slurm-appliance into feat/alertmanager
2 parents 41c7331 + 1a6eff8 commit 2c0c787

File tree

5 files changed

+12
-17
lines changed

5 files changed

+12
-17
lines changed

ansible/roles/cuda/README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,6 @@ Requires OFED to be installed to provide required kernel-* packages.
1010

1111
- `cuda_repo_url`: Optional. URL of `.repo` file. Default is upstream for appropriate OS/architecture.
1212
- `cuda_nvidia_driver_stream`: Optional. Version of `nvidia-driver` stream to enable. This controls both the driver major version and whether the open or proprietary drivers are installed. Changing this once the drivers are installed does not change the version.
13-
- `cuda_packages`: Optional. Default: `['cuda', 'nvidia-gds']`.
13+
- `cuda_packages`: Optional. Default: `['cuda', 'nvidia-gds', 'cmake', 'cuda-toolkit-12-8']`.
1414
- `cuda_package_version`: Optional. Default `'12.8.1-1'`. Use `'latest'` to install the latest packages if not installed, without upgrading already-installed packages. Use `'none'` to skip installing CUDA.
1515
- `cuda_persistenced_state`: Optional. State of systemd `nvidia-persistenced` service. Values as [ansible.builtin.systemd:state](https://docs.ansible.com/ansible/latest/collections/ansible/builtin/systemd_module.html#parameter-state). Default `started`.

ansible/roles/cuda/defaults/main.yml

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,13 +1,14 @@
11
cuda_repo_url: "https://developer.download.nvidia.com/compute/cuda/repos/rhel{{ ansible_distribution_major_version }}/{{ ansible_architecture }}/cuda-rhel{{ ansible_distribution_major_version }}.repo"
22
cuda_nvidia_driver_stream: '570-open'
33
cuda_package_version: '12.8.1-1'
4+
cuda_version_short: '12.8'
45
cuda_packages:
56
- "cuda{{ ('-' + cuda_package_version) if cuda_package_version != 'latest' else '' }}"
67
- nvidia-gds
7-
# _cuda_version_tuple: # discovered from installed package e.g. ('12', '1', '0')
8-
cuda_version_short: "{{ _cuda_version_tuple[0] }}.{{ _cuda_version_tuple[1] }}"
8+
- cmake
9+
- cuda-toolkit-12-8
910
cuda_samples_release_url: "https://github.com/NVIDIA/cuda-samples/archive/refs/tags/v{{ cuda_version_short }}.tar.gz"
10-
cuda_samples_path: "/home/{{ ansible_user }}/cuda_samples"
11+
cuda_samples_path: "/var/lib/{{ ansible_user }}/cuda_samples"
1112
cuda_samples_programs:
1213
- deviceQuery
1314
- bandwidthTest

ansible/roles/cuda/tasks/samples.yml

Lines changed: 0 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,3 @@
1-
- name: Read CUDA version file
2-
slurp:
3-
src: /usr/local/cuda/version.json
4-
register: _cuda_samples_version
5-
6-
- name: Set fact for discovered CUDA version
7-
set_fact:
8-
_cuda_version_tuple: "{{ (_cuda_samples_version.content | b64decode | from_json).cuda.version | split('.') }}" # e.g. '12.1.0'
9-
101
- name: Ensure cuda_samples_path exists
112
file:
123
state: directory

ansible/roles/eessi/defaults/main.yaml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -9,3 +9,5 @@ cvmfs_config_default:
99
cvmfs_config_overrides: {}
1010

1111
cvmfs_config: "{{ cvmfs_config_default | combine(cvmfs_config_overrides) }}"
12+
13+
cvmfs_gpg_checksum: "sha256:4ac81adff957565277cfa6a4a330cdc2ce5a8fdd73b8760d1a5a32bef71c4bd6"

ansible/roles/eessi/tasks/main.yaml

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,9 @@
11
---
22
- name: Download Cern GPG key
33
ansible.builtin.get_url:
4-
url: http://cvmrepo.web.cern.ch/cvmrepo/yum/RPM-GPG-KEY-CernVM
4+
url: http://cvmrepo.web.cern.ch/cvmrepo/yum/RPM-GPG-KEY-CernVM
55
dest: ./cvmfs-key.gpg
6+
checksum: "{{ cvmfs_gpg_checksum }}"
67

78
- name: Import downloaded GPG key
89
command: rpm --import cvmfs-key.gpg
@@ -24,7 +25,7 @@
2425

2526
# Alternative version using official repo - still no GPG key :(
2627
# - name: Add EESSI repo
27-
# dnf:
28+
# dnf:
2829
# name: http://repo.eessi-infra.org/eessi/rhel/8/noarch/eessi-release-0-1.noarch.rpm
2930

3031
# - name: Install EESSI CVMFS config
@@ -39,9 +40,9 @@
3940
value: "{{ item.value }}"
4041
no_extra_spaces: true
4142
loop: "{{ cvmfs_config | dict2items }}"
42-
43+
4344

4445
# NOTE: Not clear how to make this idempotent
4546
- name: Ensure CVMFS config is setup
4647
command:
47-
cmd: "cvmfs_config setup"
48+
cmd: "cvmfs_config setup"

0 commit comments

Comments
 (0)