|
#!/usr/bin/env bash
#
# Installs the NVIDIA driver on the host from artifacts cached under /opt/gpu.
#
# Reads these variables after sourcing /opt/gpu/config.sh (presumably defined
# there -- confirm against that file):
#   DRIVER_VERSION   version suffix of NVIDIA-Linux-x86_64-<version>.run
#   GPU_DEST         prefix that receives the NVIDIA binaries and libraries
#   NVIDIA_PACKAGES  whitespace-separated name prefixes of cached .deb files
#
# Must run with enough privilege to install packages, mount filesystems and
# load kernel modules.
set -euxo pipefail

# shellcheck source=/dev/null
source /opt/gpu/config.sh

# `set -u` only catches unset variables. An empty GPU_DEST would turn the
# paths below into "/lib64" and "/bin", so reject empty values as well.
: "${DRIVER_VERSION:?DRIVER_VERSION must be set and non-empty}"
: "${GPU_DEST:?GPU_DEST must be set and non-empty}"

readonly GPU_DIR=/opt/gpu
readonly LIB_DIR=/usr/lib/x86_64-linux-gnu
readonly OVERLAY_DIR=/tmp/overlay
readonly DRIVER_DIR="${GPU_DIR}/NVIDIA-Linux-x86_64-${DRIVER_VERSION}"

# Assign before marking readonly so a failing command substitution is not
# masked by the exit status of `readonly`.
KERNEL_NAME=$(uname -r)
LOG_FILE_NAME="/var/log/nvidia-installer-$(date +%s).log"
readonly KERNEL_NAME LOG_FILE_NAME

#######################################
# Detach the temporary overlay from LIB_DIR and remove its tmpfs backing.
# Best effort: each step fails harmlessly when nothing is mounted or the
# directory is absent, so failures never abort the script.
# Globals: LIB_DIR (read), OVERLAY_DIR (read)
#######################################
teardown_overlay() {
  # Lazy unmounts: the overlay's upper/work dirs live on the tmpfs, so a
  # non-lazy unmount of the tmpfs can fail as busy right after the overlay
  # itself has been lazily detached.
  umount -l "${LIB_DIR}" || true
  umount -l "${OVERLAY_DIR}" || true
  rm -rf -- "${OVERLAY_DIR}" || true
}

# Host needs these tools to build and load the kernel module.
# TODO: ca-certificates was only needed for testing and can be removed.
# apt-get rather than apt: apt's CLI is not intended for use in scripts.
apt-get update
apt-get install -y --no-install-recommends \
  kmod gcc make dkms initramfs-tools \
  "linux-headers-${KERNEL_NAME}" \
  ca-certificates

# Install cached NVIDIA debian packages for container runtime compatibility.
# NVIDIA_PACKAGES is deliberately left unquoted so it splits into one name
# prefix per word; the trailing glob picks up the versioned .deb file name.
for apt_package in ${NVIDIA_PACKAGES}; do
  dpkg -i "${GPU_DIR}/${apt_package}"*
done
dpkg -i "${GPU_DIR}"/nvidia-container-runtime*

# Blacklist the nouveau driver (the NVIDIA driver depends on this) and rebuild
# the initramfs.
cp "${GPU_DIR}/blacklist-nouveau.conf" /etc/modprobe.d/blacklist-nouveau.conf
update-initramfs -u

# Clean up lingering mounts and files from a previous install. A previously
# extracted driver directory makes the extraction step below fail.
teardown_overlay
rm -rf -- "${DRIVER_DIR}"

# Set up an overlayfs to change the install location of the NVIDIA libs from
# LIB_DIR to ${GPU_DEST}/lib64. The extra tmpfs layer of indirection exists
# because it is not possible to have an overlayfs on an overlayfs (i.e.,
# inside a container).
# From here on a failure must not leave the overlay mounted over LIB_DIR.
trap teardown_overlay EXIT
mkdir -p "${OVERLAY_DIR}"
mount -t tmpfs tmpfs "${OVERLAY_DIR}"
mkdir "${OVERLAY_DIR}"/{workdir,lib64}
mkdir -p "${GPU_DEST}/lib64"
mount -t overlay overlay \
  -o "lowerdir=${LIB_DIR},upperdir=${OVERLAY_DIR}/lib64,workdir=${OVERLAY_DIR}/workdir" \
  "${LIB_DIR}"

# Extract the runfile (takes some time). Run it from GPU_DIR in a subshell so
# the extracted directory lands there without changing this shell's cwd.
(
  cd "${GPU_DIR}"
  sh "${DRIVER_DIR}.run" -x
)

# Install the NVIDIA driver.
"${DRIVER_DIR}/nvidia-installer" \
  -s \
  -k="${KERNEL_NAME}" \
  --log-file-name="${LOG_FILE_NAME}" \
  -a \
  --no-drm \
  --dkms \
  --utility-prefix="${GPU_DEST}" \
  --opengl-prefix="${GPU_DEST}"

# Copy the libs captured in the overlay's upper layer to their final location.
# -T is required: ${GPU_DEST}/lib64 already exists, so without it cp would
# create ${GPU_DEST}/lib64/lib64 and the path registered with the dynamic
# loader below would contain no libraries.
cp -aT "${OVERLAY_DIR}/lib64" "${GPU_DEST}/lib64"

# Also make the NVIDIA binaries available from /usr/bin.
cp -rvT "${GPU_DEST}/bin" /usr/bin

# Configure the system to know about the NVIDIA lib path.
printf '%s\n' "${GPU_DEST}/lib64" > /etc/ld.so.conf.d/nvidia.conf
ldconfig

# Unmount and clean up, then disarm the trap so nothing is unmounted twice.
teardown_overlay
trap - EXIT

# Validate that the NVIDIA driver is working.
dkms status
nvidia-modprobe -u -c0
nvidia-smi
0 commit comments