This repository was archived by the owner on Mar 20, 2023. It is now read-only.
File tree Expand file tree Collapse file tree 2 files changed +28
-17
lines changed
Expand file tree Collapse file tree 2 files changed +28
-17
lines changed Original file line number Diff line number Diff line change 22
33## [ Unreleased]
44
5+ ### Fixed
6+ - Provisioning Network Direct RDMA VM sizes (A8/A9/NC24rX/H16r/H16mr) resulted
7+ in start task failures
8+
59## [ 3.8.0] - 2019-08-13
610### Added
711- Revamped Singularity support, including support for Singularity 3,
Original file line number Diff line number Diff line change @@ -1427,6 +1427,10 @@ EOF
14271427}
14281428
14291429check_for_mellanox_card () {
1430+ if [ " $vm_rdma_type " -eq 0 ]; then
1431+ log DEBUG " Not an RDMA capable VM size, skipping IB detection/setup"
1432+ return
1433+ fi
14301434 # check for mellanox card
14311435 set +e
14321436 local out
@@ -1436,28 +1440,31 @@ check_for_mellanox_card() {
14361440 set -e
14371441 echo " $out "
14381442 if [ $rc -ne 0 ]; then
1439- if [ " $vm_rdma_type " -eq 0 ]; then
1440- log INFO " No Mellanox card(s) detected"
1441- else
1443+ if [ " $vm_rdma_type " -eq 1 ]; then
14421444 log ERROR " Expected Mellanox IB card not detected"
14431445 exit 1
1444- fi
1445- else
1446- if [ " $vm_rdma_type " -eq 1 ]; then
1447- # extract IB PKEY
1448- export_ib_pkey
1449- # get ofed info
1450- ofed_info
1451- # run ib tools
1452- ibstatus
1453- ibv_devinfo
14541446 elif [ " $vm_rdma_type " -eq 2 ]; then
1455- # network direct rmda
1456- install_intel_mpi
1457- else
1458- log DEBUG " Mellanox card is not IB/RDMA capable"
1447+ # check for ib device
1448+ if [ -e /dev/infiniband/uverbs0 ]; then
1449+ log INFO " IB device detected"
1450+ else
1451+ log ERROR " Expected IB device not detected"
1452+ exit 1
1453+ fi
14591454 fi
14601455 fi
1456+ if [ " $vm_rdma_type " -eq 1 ]; then
1457+ # extract IB PKEY
1458+ export_ib_pkey
1459+ # get ofed info
1460+ ofed_info
1461+ # run ib tools
1462+ ibstatus
1463+ ibv_devinfo
1464+ elif [ " $vm_rdma_type " -eq 2 ]; then
1465+ # network direct RDMA
1466+ install_intel_mpi
1467+ fi
14611468}
14621469
14631470process_ib_rdma () {
You can’t perform that action at this time.
0 commit comments