We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
HWLOC_KEEP_NVIDIA_GPU_NUMA_NODES=0
1 parent 4ac8b3d commit 4e5afdc Copy full SHA for 4e5afdc
docs/running/slurm.md
@@ -300,8 +300,10 @@ if [[ $SLURM_LOCALID -eq 0 ]]; then
300
CUDA_VISIBLE_DEVICES=0,1,2,3 nvidia-cuda-mps-control -d
301
fi
302
303
-# Set CUDA device
304
-numa_nodes=$(hwloc-calc --physical --intersect NUMAnode $(hwloc-bind --get --taskset))
+# Set CUDA device. Disable HWLOC_KEEP_NVIDIA_GPU_NUMA_NODES to avoid GPU NUMA
+# nodes appearing in the list of CUDA devices. They appear as of hwloc
305
+# version 2.11.
306
+numa_nodes=$(HWLOC_KEEP_NVIDIA_GPU_NUMA_NODES=0 hwloc-calc --physical --intersect NUMAnode $(hwloc-bind --get --taskset))
307
export CUDA_VISIBLE_DEVICES=$numa_nodes
308
309
# Wait for MPS to start
0 commit comments