Skip to content

Commit 4fd2897

Browse files
Update NCCL tuning parameters
1 parent: e01daae · commit: 4fd2897

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

samples/gpu/nccl_run_allreduce_H100.sh

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -57,7 +57,7 @@ do
57 57
--bind-to numa \
58 58
-npernode 8 \
59 59
--mca coll ^hcoll \
60 -
-x NCCL_CROSS_NIC=1 \
60 +
-x NCCL_CROSS_NIC=2 \
61 61
-x NCCL_DEBUG=WARN \
62 62
-x NCCL_CUMEM_ENABLE=0 \
63 63
-x NCCL_IB_SPLIT_DATA_ON_QPS=0 \
@@ -78,6 +78,7 @@ do
78 78
-x NCCL_IGNORE_CPU_AFFINITY=1 \
79 79
-x NCCL_IB_HCA="${var_NCCL_IB_HCA}" \
80 80
-x NCCL_TOPO_FILE=~/H100-topology.xml \
81 +
-x NCCL_MIN_NCHANNELS=32 \
81 82
--np $np --hostfile $hostfile /opt/oci-hpc/nccl-test/build/all_reduce_perf -b 1G -e 16G -f 2 -g 1 >> $logfile
82 83

83 84
tail -n 32 $logfile

0 commit comments

Comments
 (0)