|
| 1 | +ARG BASE_IMAGE=nvcr.io/nvidia/cuda:13.0.1-base-ubi10 |
| 2 | + |
| 3 | +FROM ${BASE_IMAGE} as build |
| 4 | + |
| 5 | +ARG TARGETARCH |
| 6 | +ARG GOLANG_VERSION |
| 7 | + |
| 8 | +# Arg to indicate if driver type is either of passthrough(baremetal) or vgpu |
| 9 | +ARG DRIVER_TYPE=passthrough |
| 10 | +ENV DRIVER_TYPE=$DRIVER_TYPE |
| 11 | + |
| 12 | +SHELL ["/bin/bash", "-c"] |
| 13 | + |
| 14 | +RUN dnf install -y git wget |
| 15 | + |
| 16 | +# download appropriate binary based on the target architecture for multi-arch builds |
| 17 | +RUN OS_ARCH=${TARGETARCH/x86_64/amd64} && OS_ARCH=${OS_ARCH/aarch64/arm64} && \ |
| 18 | + wget -nv -O - https://go.dev/dl/go${GOLANG_VERSION}.linux-${OS_ARCH}.tar.gz \ |
| 19 | + | tar -C /usr/local -xz |
| 20 | + |
| 21 | +ENV PATH /usr/local/go/bin:$PATH |
| 22 | + |
| 23 | +WORKDIR /work |
| 24 | + |
| 25 | +RUN if [ "$DRIVER_TYPE" = "vgpu" ]; then \ |
| 26 | + git clone https://github.com/NVIDIA/gpu-driver-container driver && \ |
| 27 | + cd driver/vgpu/src && \ |
| 28 | + go build -o vgpu-util && \ |
| 29 | + mv vgpu-util /work; fi |
| 30 | + |
| 31 | +FROM ${BASE_IMAGE} |
| 32 | + |
| 33 | +ARG TARGETARCH |
| 34 | +ENV TARGETARCH=$TARGETARCH |
| 35 | + |
| 36 | +SHELL ["/bin/bash", "-c"] |
| 37 | + |
| 38 | +#ARG BASE_URL=http://us.download.nvidia.com/XFree86/Linux-x86_64 |
| 39 | +ARG BASE_URL=https://us.download.nvidia.com/tesla |
| 40 | +ARG DRIVER_VERSION |
| 41 | +ENV DRIVER_VERSION=$DRIVER_VERSION |
| 42 | +ARG DRIVER_BRANCH |
| 43 | +ENV DRIVER_BRANCH=$DRIVER_BRANCH |
| 44 | + |
| 45 | +# Arg to indicate if driver type is either of passthrough/baremetal or vgpu |
| 46 | +ARG DRIVER_TYPE=passthrough |
| 47 | +ENV DRIVER_TYPE=$DRIVER_TYPE |
| 48 | +ARG VGPU_LICENSE_SERVER_TYPE=NLS |
| 49 | +ENV VGPU_LICENSE_SERVER_TYPE=$VGPU_LICENSE_SERVER_TYPE |
| 50 | +# Enable vGPU version compability check by default |
| 51 | +ARG DISABLE_VGPU_VERSION_CHECK=true |
| 52 | +ENV DISABLE_VGPU_VERSION_CHECK=$DISABLE_VGPU_VERSION_CHECK |
| 53 | +# Avoid dependency of container-toolkit for driver container |
| 54 | +ENV NVIDIA_VISIBLE_DEVICES=void |
| 55 | + |
| 56 | +ADD install.sh /tmp/ |
| 57 | + |
| 58 | +RUN NVIDIA_GPGKEY_SUM=afbea87d3b979b3788ef34223aeeb323ade481128e2c133723ae99b8a51368bb && \ |
| 59 | + OS_ARCH=${TARGETARCH/amd64/x86_64} && OS_ARCH=${OS_ARCH/arm64/sbsa} && \ |
| 60 | + curl -fsSL "https://developer.download.nvidia.com/compute/cuda/repos/rhel10/$OS_ARCH/CDF6BA43.pub" | sed '/^Version/d' > /etc/pki/rpm-gpg/RPM-GPG-KEY-NVIDIA && \ |
| 61 | + echo "$NVIDIA_GPGKEY_SUM /etc/pki/rpm-gpg/RPM-GPG-KEY-NVIDIA" | sha256sum -c --strict - |
| 62 | + |
| 63 | +RUN sh /tmp/install.sh depinstall && \ |
| 64 | + sh /tmp/install.sh setup_cuda_repo && \ |
| 65 | + curl -fsSL -o /usr/local/bin/donkey https://github.com/3XX0/donkey/releases/download/v1.1.0/donkey && \ |
| 66 | + curl -fsSL -o /usr/local/bin/extract-vmlinux https://raw.githubusercontent.com/torvalds/linux/master/scripts/extract-vmlinux && \ |
| 67 | + chmod +x /usr/local/bin/donkey /usr/local/bin/extract-vmlinux && \ |
| 68 | + ln -s /sbin/ldconfig /sbin/ldconfig.real |
| 69 | + |
| 70 | +ADD drivers drivers/ |
| 71 | + |
| 72 | +# Fetch the installer, fabricmanager and libnvidia-nscq automatically for passthrough/baremetal types |
| 73 | +RUN if [ "$DRIVER_TYPE" != "vgpu" ]; then \ |
| 74 | + cd drivers && \ |
| 75 | + DRIVER_ARCH=${TARGETARCH/amd64/x86_64} && DRIVER_ARCH=${DRIVER_ARCH/arm64/aarch64} && \ |
| 76 | + curl -fSsl -O $BASE_URL/$DRIVER_VERSION/NVIDIA-Linux-$DRIVER_ARCH-$DRIVER_VERSION.run && \ |
| 77 | + chmod +x NVIDIA-Linux-$DRIVER_ARCH-$DRIVER_VERSION.run; fi |
| 78 | + |
| 79 | +# Fetch the installer, fabricmanager, libnvidia-nscq, libnvsdm, imex packages |
| 80 | +RUN sh /tmp/install.sh extrapkgsinstall |
| 81 | + |
| 82 | +COPY nvidia-driver /usr/local/bin |
| 83 | +COPY ocp_dtk_entrypoint /usr/local/bin |
| 84 | +COPY common.sh /usr/local/bin |
| 85 | + |
| 86 | +COPY --from=build /work/vgpu-util* /usr/local/bin |
| 87 | + |
| 88 | +WORKDIR /drivers |
| 89 | + |
| 90 | +ARG PUBLIC_KEY=empty |
| 91 | +COPY ${PUBLIC_KEY} kernel/pubkey.x509 |
| 92 | + |
| 93 | +ARG PRIVATE_KEY |
| 94 | +ARG KERNEL_VERSION=latest |
| 95 | + |
| 96 | +LABEL io.k8s.display-name="NVIDIA Driver Container" |
| 97 | +LABEL name="NVIDIA Driver Container" |
| 98 | +LABEL vendor="NVIDIA" |
| 99 | +LABEL version="${DRIVER_VERSION}" |
| 100 | +LABEL release="N/A" |
| 101 | +LABEL summary="Provision the NVIDIA driver through containers" |
| 102 | +LABEL description="See summary" |
| 103 | + |
| 104 | +# Install / upgrade packages here that are required to resolve CVEs |
| 105 | +ARG CVE_UPDATES |
| 106 | +RUN if [ -n "${CVE_UPDATES}" ]; then \ |
| 107 | + yum update -y ${CVE_UPDATES} && \ |
| 108 | + rm -rf /var/cache/yum/*; \ |
| 109 | + fi |
| 110 | + |
| 111 | +# Remove cuda repository to avoid GPG errors |
| 112 | +RUN rm -f /etc/yum.repos.d/cuda.repo |
| 113 | + |
| 114 | +ENTRYPOINT ["nvidia-driver", "init"] |
0 commit comments