|
| 1 | +ARG CUDA_VERSION=latest |
| 2 | + |
| 3 | +FROM nvcr.io/nvidia/cuda:${CUDA_VERSION}-base-amzn2023 AS build |
| 4 | +FROM amazonlinux:amzn2023 |
| 5 | + |
| 6 | +ARG TARGETARCH |
| 7 | +ARG CUDA_VERSION |
| 8 | + |
| 9 | +SHELL ["/bin/bash", "-c"] |
| 10 | + |
| 11 | +# Remove cuda repository to avoid GPG errors |
| 12 | +RUN rm -f /etc/yum.repos.d/cuda* |
| 13 | + |
| 14 | +RUN yum update -y && yum install -y yum-utils && \ |
| 15 | + yum install -y \ |
| 16 | + gcc \ |
| 17 | + gcc-c++ \ |
| 18 | + make \ |
| 19 | + ca-certificates \ |
| 20 | + kernel-headers \ |
| 21 | + git -y && \ |
| 22 | + yum clean all \ |
| 23 | + rm -rf /var/cache/yum/* |
| 24 | + |
| 25 | +ENV GOLANG_VERSION=1.23.1 |
| 26 | + |
| 27 | +# download appropriate binary based on the target architecture for multi-arch builds |
| 28 | +RUN OS_ARCH=${TARGETARCH/amd64/x86_64} && OS_ARCH=${OS_ARCH/arm64/aarch64} && \ |
| 29 | + curl https://storage.googleapis.com/golang/go${GOLANG_VERSION}.linux-${OS_ARCH}.tar.gz \ |
| 30 | + | tar -C /usr/local -xz |
| 31 | + |
| 32 | +ENV PATH /usr/local/bin:$PATH |
| 33 | +ENV PATH /usr/local/go/bin:$PATH |
| 34 | + |
| 35 | +WORKDIR /work |
| 36 | + |
| 37 | +RUN git clone https://github.com/NVIDIA/gpu-driver-container driver && \ |
| 38 | + cd driver/vgpu/src && \ |
| 39 | + go build -o vgpu-util && \ |
| 40 | + mv vgpu-util /work |
| 41 | +COPY --from=build /work/vgpu-util /usr/local/bin |
| 42 | + |
| 43 | +FROM nvcr.io/nvidia/cuda:${CUDA_VERSION}-base-amzn2023 |
| 44 | + |
| 45 | +SHELL ["/bin/bash", "-c"] |
| 46 | + |
| 47 | +ARG BASE_URL=https://us.download.nvidia.com/tesla |
| 48 | +ARG TARGETARCH |
| 49 | +ENV TARGETARCH=$TARGETARCH |
| 50 | +ARG DRIVER_VERSION |
| 51 | +ENV DRIVER_VERSION=$DRIVER_VERSION |
| 52 | + |
| 53 | +# Arg to indicate if driver type is either of passthrough(baremetal) or vgpu |
| 54 | +ARG DRIVER_TYPE=passthrough |
| 55 | +ENV DRIVER_TYPE=$DRIVER_TYPE |
| 56 | +ARG DRIVER_BRANCH=550 |
| 57 | +ENV DRIVER_BRANCH=$DRIVER_BRANCH |
| 58 | +ARG VGPU_LICENSE_SERVER_TYPE=NLS |
| 59 | +ENV VGPU_LICENSE_SERVER_TYPE=$VGPU_LICENSE_SERVER_TYPE |
| 60 | +# Enable vGPU version compability check by default |
| 61 | +ARG DISABLE_VGPU_VERSION_CHECK=true |
| 62 | +ENV DISABLE_VGPU_VERSION_CHECK=$DISABLE_VGPU_VERSION_CHECK |
| 63 | +ENV NVIDIA_VISIBLE_DEVICES=void |
| 64 | + |
| 65 | +RUN echo "TARGETARCH=$TARGETARCH" |
| 66 | + |
| 67 | +ADD install.sh /tmp |
| 68 | + |
| 69 | +RUN NVIDIA_GPGKEY_SUM=d0664fbbdb8c32356d45de36c5984617217b2d0bef41b93ccecd326ba3b80c87 && \ |
| 70 | + curl -fsSL https://developer.download.nvidia.com/compute/cuda/repos/amzn2023/x86_64/D42D0685.pub | sed '/^Version/d' > /etc/pki/rpm-gpg/RPM-GPG-KEY-NVIDIA && \ |
| 71 | + echo "$NVIDIA_GPGKEY_SUM /etc/pki/rpm-gpg/RPM-GPG-KEY-NVIDIA" | sha256sum -c --strict - && \ |
| 72 | + curl -fsSL -o /etc/yum.repos.d/cuda-amzn2023.repo https://developer.download.nvidia.com/compute/cuda/repos/amzn2023/x86_64/cuda-amzn2023.repo |
| 73 | + |
| 74 | +RUN /tmp/install.sh reposetup && /tmp/install.sh depinstall && \ |
| 75 | + curl -fsSL -o /usr/local/bin/donkey https://github.com/3XX0/donkey/releases/download/v1.1.0/donkey && \ |
| 76 | + chmod +x /usr/local/bin/donkey |
| 77 | + |
| 78 | +RUN curl -fsSL -o /usr/local/bin/extract-vmlinux https://raw.githubusercontent.com/torvalds/linux/master/scripts/extract-vmlinux && \ |
| 79 | + chmod +x /usr/local/bin/extract-vmlinux |
| 80 | + |
| 81 | +COPY nvidia-driver /usr/local/bin |
| 82 | + |
| 83 | +ADD drivers drivers/ |
| 84 | + |
| 85 | +# Fetch the installer automatically for passthrough/baremetal types |
| 86 | +RUN if [ "$DRIVER_TYPE" != "vgpu" ]; then \ |
| 87 | + cd drivers && \ |
| 88 | + /tmp/install.sh download_installer; fi |
| 89 | + |
| 90 | +RUN if [ "$DRIVER_TYPE" != "vgpu" ] && [ "$TARGETARCH" != "arm64" ]; then \ |
| 91 | + yum update -y && \ |
| 92 | + yum install -y \ |
| 93 | + coreutils-single \ |
| 94 | + nvidia-fabric-manager-${DRIVER_VERSION}-1 \ |
| 95 | + libnvidia-nscq-${DRIVER_BRANCH}-${DRIVER_VERSION}-1; fi |
| 96 | + |
| 97 | +WORKDIR /drivers |
| 98 | + |
| 99 | +ARG PUBLIC_KEY=empty |
| 100 | +COPY ${PUBLIC_KEY} kernel/pubkey.x509 |
| 101 | + |
| 102 | +# Install / upgrade packages here that are required to resolve CVEs |
| 103 | +ARG CVE_UPDATES |
| 104 | +RUN if [ -n "${CVE_UPDATES}" ]; then \ |
| 105 | + yum update -y && yum install -y yum-utils && \ |
| 106 | + yum install -y \ |
| 107 | + ${CVE_UPDATES} && \ |
| 108 | + yum clean all; fi |
| 109 | + |
| 110 | +# Remove cuda repository to avoid GPG errors |
| 111 | +RUN rm -f /etc/yum.repos.d/cuda* |
| 112 | + |
| 113 | +# Add NGC DL license from the CUDA image |
| 114 | +RUN mkdir /licenses && mv /NGC-DL-CONTAINER-LICENSE /licenses/NGC-DL-CONTAINER-LICENSE |
| 115 | + |
| 116 | +ENTRYPOINT ["nvidia-driver", "init"] |
0 commit comments