We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e01daae, commit 4fd2897 (Copy full SHA for 4fd2897)
samples/gpu/nccl_run_allreduce_H100.sh
@@ -57,7 +57,7 @@ do
57
--bind-to numa \
58
-npernode 8 \
59
--mca coll ^hcoll \
60
- -x NCCL_CROSS_NIC=1 \
+ -x NCCL_CROSS_NIC=2 \
61
-x NCCL_DEBUG=WARN \
62
-x NCCL_CUMEM_ENABLE=0 \
63
-x NCCL_IB_SPLIT_DATA_ON_QPS=0 \
@@ -78,6 +78,7 @@ do
78
-x NCCL_IGNORE_CPU_AFFINITY=1 \
79
-x NCCL_IB_HCA="${var_NCCL_IB_HCA}" \
80
-x NCCL_TOPO_FILE=~/H100-topology.xml \
81
+ -x NCCL_MIN_NCHANNELS=32 \
82
--np $np --hostfile $hostfile /opt/oci-hpc/nccl-test/build/all_reduce_perf -b 1G -e 16G -f 2 -g 1 >> $logfile
83
84
tail -n 32 $logfile
0 commit comments