-
Notifications
You must be signed in to change notification settings - Fork 4
Expand file tree
/
Copy pathDockerfile-ofed
More file actions
30 lines (26 loc) · 1.21 KB
/
Dockerfile-ofed
File metadata and controls
30 lines (26 loc) · 1.21 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
ARG PYTHON_VERSION=310
ARG CUDA_VERSION=cu121
ARG BASE_IMAGE=quay.io/ado/ado:latest-py${PYTHON_VERSION}-${CUDA_VERSION}
FROM $BASE_IMAGE
# VV: Install MOFED from https://network.nvidia.com/products/infiniband-drivers/linux/mlnx_ofed/
USER 0
ENV MOFED_VER=24.10-1.1.4.0
ENV OS_VER=ubuntu22.04
ENV PLATFORM=x86_64
# AP: the ucx-cuda package depends on libnvidia-compute | libnvidia-ml1 (>= 560.35.03)
# Installing these libraries via:
# apt-get install -y libnvidia-compute-575 libnvidia-decode-575 libnvidia-gpucomp-575 ibverbs-providers
# would break the existing drivers with:
# Failed to initialize NVML: Driver/library version mismatch
# We can either install them and uninstall them, or add --without-ucx-cuda
RUN mkdir app && \
cd app && \
wget -q http://content.mellanox.com/ofed/MLNX_OFED-${MOFED_VER}/MLNX_OFED_LINUX-${MOFED_VER}-${OS_VER}-${PLATFORM}.tgz && \
tar -xvzf MLNX_OFED_LINUX-${MOFED_VER}-${OS_VER}-${PLATFORM}.tgz && \
cd MLNX_OFED_LINUX-${MOFED_VER}-${OS_VER}-${PLATFORM} && \
./mlnxofedinstall --user-space-only --without-fw-update --without-ucx-cuda --all --force --distro $OS_VER && \
cd .. && \
rm -rf MLNX* && \
apt-get -y clean && \
rm -rf /var/lib/apt/lists/*
USER 1000