Skip to content

Commit

Permalink
Add envars dropped in helm chart refactor when introducing ComputeDomain
Browse files Browse the repository at this point in the history
Signed-off-by: Kevin Klues <[email protected]>
  • Loading branch information
klueska committed Feb 25, 2025
1 parent 5f4121d commit e64d5e2
Showing 1 changed file with 23 additions and 2 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -89,13 +89,34 @@ spec:
{{- toYaml .Values.kubeletPlugin.containers.gpus.securityContext | nindent 10 }}
image: {{ include "nvidia-dra-driver-gpu.fullimage" . }}
imagePullPolicy: {{ .Values.image.pullPolicy }}
command:
- gpu-kubelet-plugin
command: ["bash", "-c"]
args:
- |-
# Conditionally mask the params file to prevent this container from
# recreating any missing GPU device nodes. This is necessary, for
# example, when running under nvkind to limit the set of GPUs governed
# by the plugin even though it has cgroup access to all of them.
if [ "${MASK_NVIDIA_DRIVER_PARAMS}" = "true" ]; then
cp /proc/driver/nvidia/params root/gpu-params
sed -i 's/^ModifyDeviceFiles: 1$/ModifyDeviceFiles: 0/' root/gpu-params
mount --bind root/gpu-params /proc/driver/nvidia/params
fi
gpu-kubelet-plugin
resources:
{{- toYaml .Values.kubeletPlugin.containers.gpus.resources | nindent 10 }}
env:
- name: MASK_NVIDIA_DRIVER_PARAMS
value: "{{ .Values.maskNvidiaDriverParams }}"
- name: NVIDIA_CTK_PATH
value: "{{ .Values.nvidiaCtkPath }}"
- name: NVIDIA_DRIVER_ROOT
value: "{{ .Values.nvidiaDriverRoot }}"
- name: NVIDIA_VISIBLE_DEVICES
value: void
- name: CDI_ROOT
value: /var/run/cdi
- name: NVIDIA_MIG_CONFIG_DEVICES
value: all
- name: NODE_NAME
valueFrom:
fieldRef:
Expand Down

0 comments on commit e64d5e2

Please sign in to comment.