Skip to content

Commit 033695b

Browse files
authored
Network configuration for OpenMPI/CXI (#52)
Add `network.yaml` files to the cluster configurations to support building OpenMPI and low-level network libraries. The stackinator work that uses `network.yaml` was merged in eth-cscs/stackinator#256. Note that the definitions of libfabric, etc., are currently pinned to commits on `main`/`master` of the source repositories, which isn't ideal, but with this feature we can start using concrete versions when it is possible.
1 parent 030f280 commit 033695b

30 files changed

+3110
-0
lines changed

balfrin/network.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
../site/network/a100/network.yaml

beverin/network.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
../site/network/amdgpu/network.yaml

bristen/network.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
../site/network/a100/network.yaml

clariden/network.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
../site/network/gh200/network.yaml

daint/network.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
../site/network/gh200/network.yaml

eiger/network.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
../site/network/zen/network.yaml

pilatus/network.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
../site/network/zen/network.yaml

santis/network.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
../site/network/gh200/network.yaml

site/network/a100/network.yaml

Lines changed: 38 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,38 @@
1+
mpi:
2+
cray-mpich:
3+
specs: ["libfabric@1.22"]
4+
openmpi:
5+
specs: ["libfabric@2.2.0"]
6+
packages:
7+
# adding a variant to the variants field of a package
8+
# e.g. packages:openmpi:variants
9+
# is not strong enough: if that variant does not exist, it is simply ignored with no error message
10+
openmpi:
11+
buildable: true
12+
require:
13+
- 'schedulers=slurm'
14+
- 'fabrics=cma,ofi,xpmem'
15+
- '+internal-pmix'
16+
- '+cray-xpmem'
17+
prefer:
18+
- '+cuda'
19+
variants: []
20+
cray-mpich:
21+
buildable: true
22+
prefer:
23+
- '+cuda'
24+
- '@8.1.32'
25+
libfabric:
26+
buildable: true
27+
externals:
28+
- spec: libfabric@1.22.0 fabrics=cxi,rxm,tcp
29+
prefix: /opt/cray/libfabric/1.22.0/
30+
version: ["git.v2.2.0=main"]
31+
require: fabrics=cxi,rxm,tcp
32+
libcxi:
33+
version: ["git.be1f7149482581ad589a124e5f6764b9d20d2d45=main"]
34+
cxi-driver:
35+
version: ["git.08deb056fac4ca8b0d3d39b5f7cc0dad019ee266=main"]
36+
cassini-headers:
37+
version: ["git.59b6de6a91d9637809677c50cc48b607a91a9acb=main"]
38+

site/network/amdgpu/network.yaml

Lines changed: 38 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,38 @@
1+
mpi:
2+
cray-mpich:
3+
specs: ["libfabric@1.22"]
4+
openmpi:
5+
specs: ["libfabric@2.2.0"]
6+
packages:
7+
# adding a variant to the variants field of a package
8+
# e.g. packages:openmpi:variants
9+
# is not strong enough: if that variant does not exist, it is simply ignored with no error message
10+
openmpi:
11+
buildable: true
12+
require:
13+
- 'schedulers=slurm'
14+
- 'fabrics=cma,ofi,xpmem'
15+
- '+internal-pmix'
16+
- '+cray-xpmem'
17+
prefer:
18+
- '+rocm'
19+
variants: []
20+
cray-mpich:
21+
buildable: true
22+
prefer:
23+
- '+rocm'
24+
- '@8.1.32'
25+
libfabric:
26+
buildable: true
27+
externals:
28+
- spec: libfabric@1.22.0 fabrics=cxi,rxm,tcp
29+
prefix: /opt/cray/libfabric/1.22.0/
30+
version: ["git.v2.2.0=main"]
31+
require: fabrics=cxi,rxm,tcp
32+
libcxi:
33+
version: ["git.be1f7149482581ad589a124e5f6764b9d20d2d45=main"]
34+
cxi-driver:
35+
version: ["git.08deb056fac4ca8b0d3d39b5f7cc0dad019ee266=main"]
36+
cassini-headers:
37+
version: ["git.59b6de6a91d9637809677c50cc48b607a91a9acb=main"]
38+

0 commit comments

Comments
 (0)