From cd6fe5b61a7973d700d422c5b7bb60c487d4587a Mon Sep 17 00:00:00 2001
From: Michael Aspinwall
Date: Fri, 27 Jun 2025 18:57:42 +0000
Subject: [PATCH] Fix docs to correctly install nvidia driver

---
 examples/demo_nvidia_dranet/values.yaml | 34 +++++++++++++++++++++++++
 site/content/docs/user/nvidia-dranet.md |  4 ++-
 2 files changed, 37 insertions(+), 1 deletion(-)
 create mode 100644 examples/demo_nvidia_dranet/values.yaml

diff --git a/examples/demo_nvidia_dranet/values.yaml b/examples/demo_nvidia_dranet/values.yaml
new file mode 100644
index 00000000..7135148b
--- /dev/null
+++ b/examples/demo_nvidia_dranet/values.yaml
@@ -0,0 +1,34 @@
+# Copyright 2025 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# Default values for k8s-dra-driver-gpu.
+# This is a YAML-formatted file.
+# Declare variables to be passed into your templates.
+
+# Specify the driver root on the host.
+# If the NVIDIA GPU driver is managed using the NVIDIA GPU Driver Container,
+# this is typically /run/nvidia/driver.
+# For a driver installed directly on the host, a value of `/` is used.
+nvidiaDriverRoot: "/home/kubernetes/bin/nvidia"
+
+controller:
+  priorityClassName: ""
+  affinity: null
+
+kubeletPlugin:
+  priorityClassName: ""
+  tolerations:
+    - effect: NoSchedule
+      key: nvidia.com/gpu
+      operator: Exists
diff --git a/site/content/docs/user/nvidia-dranet.md b/site/content/docs/user/nvidia-dranet.md
index 5aac9912..6548fb67 100644
--- a/site/content/docs/user/nvidia-dranet.md
+++ b/site/content/docs/user/nvidia-dranet.md
@@ -98,9 +98,11 @@ kubectl apply -f https://raw.githubusercontent.com/google/dranet/refs/heads/main
 In order to install the NVIDIA DRA Drivers you will need to clone the [NVIDIA DRA](https://github.com/NVIDIA/k8s-dra-driver-gpu) repo. Ensure you have [helm](https://helm.sh/docs/intro/install/) installed.
 
 ```
-helm upgrade -i --create-namespace --namespace nvidia-dra-driver-gpu nvidia-dra-driver-gpu ./k8s-dra-driver-gpu/deployments/helm/nvidia-dra-driver-gpu --set gpuResourcesEnabledOverride=true --set nvidiaDriverRoot=/home/kubernetes/bin/nvidia --wait
+helm upgrade -i --create-namespace --namespace nvidia-dra-driver-gpu nvidia-dra-driver-gpu ./k8s-dra-driver-gpu/deployments/helm/nvidia-dra-driver-gpu --set gpuResourcesEnabledOverride=true --values https://raw.githubusercontent.com/google/dranet/refs/heads/main/examples/demo_nvidia_dranet/values.yaml --wait
 ```
 
+The `values.yaml` file sets the NVIDIA driver root, adds a toleration for the `nvidia.com/gpu` taint, and clears the chart's priority class names and controller affinity, all of which are needed for the driver to work on GKE.
+
 Once this is done, you can run
 
 ```sh