4 Commits

Author SHA1 Message Date
Michael Thomson 4f5701ddb0 nvidia device plugin privileged 2026-05-12 14:25:20 -04:00
Michael Thomson fc162e8a1b nvidia gpu operator to device plugin 2026-05-12 14:15:33 -04:00
Michael Thomson 2354c431e3 nvidia gpu operator fix hostpaths 2026-05-12 13:29:27 -04:00
Michael Thomson 3eb32b8d66 nvidia gpu operator 2026-05-12 13:26:08 -04:00
6 changed files with 48 additions and 51 deletions
@@ -1,47 +0,0 @@
---
# DaemonSet that runs the generic-cdi-plugin container on every node labelled
# nixos-nvidia-cdi=enabled. The container receives the host's kubelet
# directory and the NVIDIA CDI spec file through hostPath volumes.
apiVersion: apps/v1
kind: DaemonSet
metadata:
  name: generic-cdi-plugin-daemonset
  namespace: generic-cdi-plugin
spec:
  selector:
    matchLabels:
      name: generic-cdi-plugin
  template:
    metadata:
      labels:
        # "name" is the label the selector above matches on.
        name: generic-cdi-plugin
        app.kubernetes.io/component: generic-cdi-plugin
        app.kubernetes.io/name: generic-cdi-plugin
    spec:
      containers:
        - name: generic-cdi-plugin
          # NOTE(review): ":main" is a moving tag; together with
          # imagePullPolicy Always every pod restart may pull a different
          # build. Consider pinning a release tag or digest.
          image: ghcr.io/olfillasodikno/generic-cdi-plugin:main
          imagePullPolicy: Always
          # The single argument is the CDI spec path mounted below.
          command:
            - /generic-cdi-plugin
            - /var/run/cdi/nvidia-container-toolkit.json
          securityContext:
            privileged: true
          tty: true
          volumeMounts:
            - name: kubelet
              mountPath: /var/lib/kubelet
            - name: nvidia-container-toolkit
              mountPath: /var/run/cdi/nvidia-container-toolkit.json
      volumes:
        - name: kubelet
          hostPath:
            path: /var/lib/kubelet
            # Fail the mount if the kubelet directory is absent instead of
            # mounting whatever happens to be at the path.
            type: Directory
        - name: nvidia-container-toolkit
          hostPath:
            path: /var/run/cdi/nvidia-container-toolkit.json
            # Require an existing regular file: without a type no check is
            # made, so a node that has not generated its CDI spec yet would
            # not be detected at mount time.
            type: File
      affinity:
        nodeAffinity:
          # Hard scheduling requirement: only nodes carrying the label
          # nixos-nvidia-cdi=enabled are eligible.
          requiredDuringSchedulingIgnoredDuringExecution:
            nodeSelectorTerms:
              - matchExpressions:
                  - key: nixos-nvidia-cdi
                    operator: In
                    values:
                      - enabled
@@ -0,0 +1,27 @@
---
# Flux HelmRelease installing the nvidia-device-plugin chart from the "nvdp"
# HelmRepository, with a time-slicing configuration as the default config.
apiVersion: helm.toolkit.fluxcd.io/v2
kind: HelmRelease
metadata:
  name: nvidia-device-plugin
  namespace: nvidia-device-plugin
spec:
  releaseName: nvidia-device-plugin
  interval: 15m
  chart:
    spec:
      chart: nvidia-device-plugin
      # Semver range: any 0.17 patch release.
      version: 0.17.x
      sourceRef:
        kind: HelmRepository
        name: nvdp
  values:
    # Run the plugin pods under the RuntimeClass named "nvidia".
    runtimeClassName: nvidia
    config:
      # Name of the entry in "map" that is used as the default config.
      default: time-slicing
      map:
        # The value is an embedded config document passed as a string.
        time-slicing: |
          version: v1
          sharing:
            timeSlicing:
              resources:
                - name: nvidia.com/gpu
                  replicas: 5
@@ -0,0 +1,8 @@
---
# Flux HelmRepository "nvdp": the chart index at the URL below, re-fetched
# every 15 minutes.
apiVersion: source.toolkit.fluxcd.io/v1
kind: HelmRepository
metadata:
  name: nvdp
  namespace: nvidia-device-plugin
spec:
  url: https://nvidia.github.io/k8s-device-plugin
  interval: 15m
@@ -0,0 +1,5 @@
---
# Cluster-scoped RuntimeClass "nvidia", mapped to the container runtime
# handler of the same name.
apiVersion: node.k8s.io/v1
kind: RuntimeClass
metadata:
  name: nvidia
# "handler" is a top-level field of RuntimeClass, not part of metadata.
handler: nvidia
@@ -1,4 +0,0 @@
---
# Namespace named generic-cdi-plugin.
apiVersion: v1
kind: Namespace
metadata:
  name: generic-cdi-plugin
@@ -0,0 +1,8 @@
---
# Namespace named nvidia-device-plugin. All three Pod Security Admission
# modes (enforce, audit, warn) are set to the "privileged" level.
apiVersion: v1
kind: Namespace
metadata:
  name: nvidia-device-plugin
  labels:
    pod-security.kubernetes.io/enforce: privileged
    pod-security.kubernetes.io/audit: privileged
    pod-security.kubernetes.io/warn: privileged