Skip to content

Commit 4315db7

Browse files
committed
FIX Set NCCL_CUMEM_HOST_ENABLE=0 for ARM with CUDA 12.8
1 parent edcacd1 commit 4315db7

File tree

1 file changed

+8
-0
lines changed

1 file changed

+8
-0
lines changed

context/entrypoint.sh

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,14 @@ if [ "$EXTRA_PIP_PACKAGES" ]; then
2323
timeout ${PIP_TIMEOUT:-600} pip install $EXTRA_PIP_PACKAGES || exit $?
2424
fi
2525

26+
# Export NCCL_CUMEM_HOST_ENABLE=0 when running on ARM (aarch64) with CUDA 12.8.
#
# Globals:   CUDA_VERSION (read, optional), NCCL_CUMEM_HOST_ENABLE (exported)
# Arguments: none
# Outputs:   one informational line on stdout when the variable is set
# Returns:   always 0; this is a best-effort tweak and must never abort the
#            entrypoint.
configure_nccl_cumem_host() {
    # Only ARM hosts are affected.
    [ "$(uname -m)" = "aarch64" ] || return 0

    # Capture the nvcc banner first (instead of piping nvcc straight into
    # grep) so a missing nvcc prints no "command not found" noise and an
    # early grep exit cannot make the pipeline fail under `pipefail`.
    # No `local` here: the interpreter of this script is not visible, so the
    # helper variable is namespaced and unset afterwards instead.
    _nccl_nvcc_banner=""
    if command -v nvcc >/dev/null 2>&1; then
        _nccl_nvcc_banner=$(nvcc --version 2>/dev/null) || _nccl_nvcc_banner=""
    fi

    # `nvcc --version` reports the toolkit as
    #   "Cuda compilation tools, release 12.8, V12.8.x"
    #   "Build cuda_12.8.r12.8/compiler...."
    # It never prints the literal "CUDA 12.8", so match the release/build
    # strings case-insensitively. The trailing ([^0-9]|$) keeps a hypothetical
    # "12.80" from matching.
    if printf '%s\n' "$_nccl_nvcc_banner" |
        grep -Eqi '(release |cuda[ _])12\.8([^0-9]|$)'; then
        unset _nccl_nvcc_banner
    else
        unset _nccl_nvcc_banner
        # Fallback for images without nvcc (runtime-only).
        # NOTE(review): assumes the image exports CUDA_VERSION like the
        # nvidia/cuda base images do; harmless when it is unset.
        case "${CUDA_VERSION:-}" in
            12.8 | 12.8.*) ;;
            *) return 0 ;;
        esac
    fi

    export NCCL_CUMEM_HOST_ENABLE=0
    echo "Set NCCL_CUMEM_HOST_ENABLE=0 for ARM with CUDA 12.8"
}
configure_nccl_cumem_host
33+
2634
# Run whatever the user wants.
2735
if [ "${UNQUOTE}" = "true" ]; then
2836
exec $@

0 commit comments

Comments
 (0)