Skip to content
This repository was archived by the owner on Mar 20, 2023. It is now read-only.

Commit 07e86a3

Browse files
committed
Fix Network Direct RDMA VM provisioning
- Resolves #299
1 parent 4ab3827 commit 07e86a3

File tree

2 files changed

+28
-17
lines changed

2 files changed

+28
-17
lines changed

CHANGELOG.md

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,10 @@
22

33
## [Unreleased]
44

5+
### Fixed
6+
- Provisioning Network Direct RDMA VM sizes (A8/A9/NC24rX/H16r/H16mr) resulted
7+
in start task failures
8+
59
## [3.8.0] - 2019-08-13
610
### Added
711
- Revamped Singularity support, including support for Singularity 3,

scripts/shipyard_nodeprep.sh

Lines changed: 24 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -1427,6 +1427,10 @@ EOF
14271427
}
14281428

14291429
check_for_mellanox_card() {
1430+
if [ "$vm_rdma_type" -eq 0 ]; then
1431+
log DEBUG "Not an RDMA capable VM size, skipping IB detection/setup"
1432+
return
1433+
fi
14301434
# check for mellanox card
14311435
set +e
14321436
local out
@@ -1436,28 +1440,31 @@ check_for_mellanox_card() {
14361440
set -e
14371441
echo "$out"
14381442
if [ $rc -ne 0 ]; then
1439-
if [ "$vm_rdma_type" -eq 0 ]; then
1440-
log INFO "No Mellanox card(s) detected"
1441-
else
1443+
if [ "$vm_rdma_type" -eq 1 ]; then
14421444
log ERROR "Expected Mellanox IB card not detected"
14431445
exit 1
1444-
fi
1445-
else
1446-
if [ "$vm_rdma_type" -eq 1 ]; then
1447-
# extract IB PKEY
1448-
export_ib_pkey
1449-
# get ofed info
1450-
ofed_info
1451-
# run ib tools
1452-
ibstatus
1453-
ibv_devinfo
14541446
elif [ "$vm_rdma_type" -eq 2 ]; then
1455-
# network direct rdma
1456-
install_intel_mpi
1457-
else
1458-
log DEBUG "Mellanox card is not IB/RDMA capable"
1447+
# check for ib device
1448+
if [ -e /dev/infiniband/uverbs0 ]; then
1449+
log INFO "IB device detected"
1450+
else
1451+
log ERROR "Expected IB device not detected"
1452+
exit 1
1453+
fi
14591454
fi
14601455
fi
1456+
if [ "$vm_rdma_type" -eq 1 ]; then
1457+
# extract IB PKEY
1458+
export_ib_pkey
1459+
# get ofed info
1460+
ofed_info
1461+
# run ib tools
1462+
ibstatus
1463+
ibv_devinfo
1464+
elif [ "$vm_rdma_type" -eq 2 ]; then
1465+
# network direct rdma
1466+
install_intel_mpi
1467+
fi
14611468
}
14621469

14631470
process_ib_rdma() {

0 commit comments

Comments
 (0)