|
| 1 | +ARG CUDA_VERSION |
| 2 | +FROM nvidia/cuda:${CUDA_VERSION}-base-ubi9 as build |
| 3 | + |
| 4 | +ARG TARGETARCH |
| 5 | + |
| 6 | +SHELL ["/bin/bash", "-c"] |
| 7 | + |
| 8 | +RUN dnf install -y git wget |
| 9 | + |
| 10 | +ENV GOLANG_VERSION=1.22.0 |
| 11 | + |
| 12 | +# download appropriate binary based on the target architecture for multi-arch builds |
| 13 | +RUN OS_ARCH=${TARGETARCH/x86_64/amd64} && OS_ARCH=${OS_ARCH/aarch64/arm64} && \ |
| 14 | + curl https://storage.googleapis.com/golang/go${GOLANG_VERSION}.linux-${OS_ARCH}.tar.gz \ |
| 15 | + | tar -C /usr/local -xz |
| 16 | + |
| 17 | +ENV PATH /usr/local/go/bin:$PATH |
| 18 | + |
| 19 | +WORKDIR /work |
| 20 | + |
| 21 | +RUN git clone https://gitlab.com/nvidia/container-images/driver && \ |
| 22 | + cd driver/vgpu/src && \ |
| 23 | + go build -o vgpu-util && \ |
| 24 | + mv vgpu-util /work |
| 25 | + |
| 26 | +FROM nvidia/cuda:${CUDA_VERSION}-base-ubi9 |
| 27 | + |
| 28 | +ARG TARGETARCH |
| 29 | +ENV TARGETARCH=$TARGETARCH |
| 30 | + |
| 31 | +SHELL ["/bin/bash", "-c"] |
| 32 | + |
| 33 | +#ARG BASE_URL=http://us.download.nvidia.com/XFree86/Linux-x86_64 |
| 34 | +ARG BASE_URL=https://us.download.nvidia.com/tesla |
| 35 | +ARG DRIVER_VERSION |
| 36 | +ENV DRIVER_VERSION=$DRIVER_VERSION |
| 37 | + |
| 38 | +# Arg to indicate if driver type is either of passthrough/baremetal or vgpu |
| 39 | +ARG DRIVER_TYPE=passthrough |
| 40 | +ENV DRIVER_TYPE=$DRIVER_TYPE |
| 41 | +ARG VGPU_LICENSE_SERVER_TYPE=NLS |
| 42 | +ENV VGPU_LICENSE_SERVER_TYPE=$VGPU_LICENSE_SERVER_TYPE |
| 43 | +# Enable vGPU version compability check by default |
| 44 | +ARG DISABLE_VGPU_VERSION_CHECK=true |
| 45 | +ENV DISABLE_VGPU_VERSION_CHECK=$DISABLE_VGPU_VERSION_CHECK |
| 46 | +# Avoid dependency of container-toolkit for driver container |
| 47 | +ENV NVIDIA_VISIBLE_DEVICES=void |
| 48 | + |
| 49 | +ADD install.sh /tmp/ |
| 50 | + |
| 51 | +RUN NVIDIA_GPGKEY_SUM=d0664fbbdb8c32356d45de36c5984617217b2d0bef41b93ccecd326ba3b80c87 && \ |
| 52 | + OS_ARCH=${TARGETARCH/amd64/x86_64} && OS_ARCH=${OS_ARCH/arm64/sbsa} && \ |
| 53 | + curl -fsSL "https://developer.download.nvidia.com/compute/cuda/repos/rhel9/$OS_ARCH/D42D0685.pub" | sed '/^Version/d' > /etc/pki/rpm-gpg/RPM-GPG-KEY-NVIDIA && \ |
| 54 | + echo "$NVIDIA_GPGKEY_SUM /etc/pki/rpm-gpg/RPM-GPG-KEY-NVIDIA" | sha256sum -c --strict - |
| 55 | + |
| 56 | +RUN sh /tmp/install.sh depinstall && \ |
| 57 | + curl -fsSL -o /usr/local/bin/donkey https://github.com/3XX0/donkey/releases/download/v1.1.0/donkey && \ |
| 58 | + curl -fsSL -o /usr/local/bin/extract-vmlinux https://raw.githubusercontent.com/torvalds/linux/master/scripts/extract-vmlinux && \ |
| 59 | + chmod +x /usr/local/bin/donkey /usr/local/bin/extract-vmlinux && \ |
| 60 | + ln -s /sbin/ldconfig /sbin/ldconfig.real |
| 61 | + |
| 62 | +ADD drivers drivers/ |
| 63 | + |
| 64 | +# Fetch the installer automatically for passthrough/baremetal types |
| 65 | +RUN if [ "$DRIVER_TYPE" != "vgpu" ]; then \ |
| 66 | + cd drivers && \ |
| 67 | + DRIVER_ARCH=${TARGETARCH/amd64/x86_64} && DRIVER_ARCH=${DRIVER_ARCH/arm64/aarch64} && \ |
| 68 | + curl -fSsl -O $BASE_URL/$DRIVER_VERSION/NVIDIA-Linux-$DRIVER_ARCH-$DRIVER_VERSION.run && \ |
| 69 | + chmod +x NVIDIA-Linux-$DRIVER_ARCH-$DRIVER_VERSION.run; fi |
| 70 | + |
| 71 | +# Install fabric-manager packages |
| 72 | +RUN if [ "$DRIVER_TYPE" != "vgpu" ] && [ "$TARGETARCH" != "arm64" ]; then \ |
| 73 | + versionArray=(${DRIVER_VERSION//./ }); \ |
| 74 | + DRIVER_BRANCH=${versionArray[0]}; \ |
| 75 | + dnf module enable -y nvidia-driver:${DRIVER_BRANCH} && \ |
| 76 | + dnf install -y nvidia-fabric-manager-${DRIVER_VERSION}-1 libnvidia-nscq-${DRIVER_BRANCH}-${DRIVER_VERSION}-1; fi |
| 77 | + |
| 78 | +COPY nvidia-driver /usr/local/bin |
| 79 | +COPY ocp_dtk_entrypoint /usr/local/bin |
| 80 | +COPY common.sh /usr/local/bin |
| 81 | + |
| 82 | +COPY --from=build /work/vgpu-util /usr/local/bin |
| 83 | + |
| 84 | +WORKDIR /drivers |
| 85 | + |
| 86 | +ARG PUBLIC_KEY=empty |
| 87 | +COPY ${PUBLIC_KEY} kernel/pubkey.x509 |
| 88 | + |
| 89 | +ARG PRIVATE_KEY |
| 90 | +ARG KERNEL_VERSION=latest |
| 91 | + |
| 92 | +LABEL io.k8s.display-name="NVIDIA Driver Container" |
| 93 | +LABEL name="NVIDIA Driver Container" |
| 94 | +LABEL vendor="NVIDIA" |
| 95 | +LABEL version="${DRIVER_VERSION}" |
| 96 | +LABEL release="N/A" |
| 97 | +LABEL summary="Provision the NVIDIA driver through containers" |
| 98 | +LABEL description="See summary" |
| 99 | + |
| 100 | +# Add NGC DL license from the CUDA image |
| 101 | +RUN mkdir /licenses && mv /NGC-DL-CONTAINER-LICENSE /licenses/NGC-DL-CONTAINER-LICENSE |
| 102 | + |
| 103 | +# Install / upgrade packages here that are required to resolve CVEs |
| 104 | +ARG CVE_UPDATES |
| 105 | +RUN if [ -n "${CVE_UPDATES}" ]; then \ |
| 106 | + yum update -y ${CVE_UPDATES} && \ |
| 107 | + rm -rf /var/cache/yum/*; \ |
| 108 | + fi |
| 109 | + |
| 110 | +# Remove cuda repository to avoid GPG errors |
| 111 | +RUN rm -f /etc/yum.repos.d/cuda.repo |
| 112 | + |
| 113 | +ENTRYPOINT ["nvidia-driver", "init"] |
0 commit comments