mirror of
https://github.com/k3s-io/kubernetes.git
synced 2025-07-22 19:31:44 +00:00
Fix COS GPU driver installation
* Rely on the built-in GPU driver installer in COS, as recommended in the public docs - https://cloud.google.com/container-optimized-os/docs/how-to/run-gpus
* Run `nvidia-smi` after installation to verify the installation
This commit is contained in:
parent
8e37a3b324
commit
e1a951afe5
@@ -2,15 +2,12 @@
|
|||||||
|
|
||||||
runcmd:
|
runcmd:
|
||||||
- modprobe configs
|
- modprobe configs
|
||||||
# Set up the installation target and make it executable
|
# Install GPU drivers - https://cloud.google.com/container-optimized-os/docs/how-to/run-gpus
|
||||||
- mkdir -p /home/kubernetes/bin/nvidia
|
- cos-extensions install gpu
|
||||||
- mount --bind /home/kubernetes/bin/nvidia /home/kubernetes/bin/nvidia
|
- mount --bind /var/lib/nvidia /var/lib/nvidia
|
||||||
- mount -o remount,exec /home/kubernetes/bin/nvidia
|
- mount -o remount,exec /var/lib/nvidia /var/lib/nvidia
|
||||||
# Compile and install the nvidia driver (precompiled driver installation currently fails)
|
# Run nvidia-smi to verify installation
|
||||||
- docker run --net=host --pid=host -v /dev:/dev -v /:/root -v /home/kubernetes/bin/nvidia:/usr/local/nvidia -e NVIDIA_INSTALL_DIR_HOST=/home/kubernetes/bin/nvidia -e NVIDIA_INSTALL_DIR_CONTAINER=/usr/local/nvidia -e NVIDIA_DRIVER_VERSION=460.91.03 --privileged gcr.io/cos-cloud/cos-gpu-installer:latest
|
- /var/lib/nvidia/bin/nvidia-smi
|
||||||
# Run the installer again, as on the first try it doesn't detect the libnvidia-ml.so
|
|
||||||
# on the second attempt we detect it and update the ld cache.
|
|
||||||
- docker run --net=host --pid=host -v /dev:/dev -v /:/root -v /home/kubernetes/bin/nvidia:/usr/local/nvidia -e NVIDIA_INSTALL_DIR_HOST=/home/kubernetes/bin/nvidia -e NVIDIA_INSTALL_DIR_CONTAINER=/usr/local/nvidia -e NVIDIA_DRIVER_VERSION=460.91.03 --privileged gcr.io/cos-cloud/cos-gpu-installer:latest
|
|
||||||
# Remove build containers. They're very large.
|
# Remove build containers. They're very large.
|
||||||
- docker rm -f $(docker ps -aq)
|
- docker rm -f $(docker ps -aq)
|
||||||
# Standard installation proceeds
|
# Standard installation proceeds
|
||||||
|
Loading…
Reference in New Issue
Block a user