# device-plugin.yaml
# NOTE: This file is not the source of truth for GKE device plugins. Modifying this file would have no effect on GKE clusters.
# DaemonSet that runs the nvidia-gpu-device-plugin container in kube-system
# on every node that carries a GKE accelerator label.
apiVersion: apps/v1
kind: DaemonSet
metadata:
  labels:
    k8s-app: nvidia-gpu-device-plugin
  name: nvidia-gpu-device-plugin
  namespace: kube-system
spec:
  # Must match the pod template labels below.
  selector:
    matchLabels:
      k8s-app: nvidia-gpu-device-plugin
  template:
    metadata:
      labels:
        k8s-app: nvidia-gpu-device-plugin
    spec:
      affinity:
        nodeAffinity:
          # Hard requirement: only schedule onto nodes that have the
          # cloud.google.com/gke-accelerator label (any value).
          requiredDuringSchedulingIgnoredDuringExecution:
            nodeSelectorTerms:
              - matchExpressions:
                  - key: cloud.google.com/gke-accelerator
                    operator: Exists
      containers:
        - command:
            - /usr/bin/nvidia-gpu-device-plugin
            - -logtostderr
            - --enable-container-gpu-metrics
            - --enable-health-monitoring
          env:
            # Taken from key HealthCriticalXid of ConfigMap xid-config.
            # optional: true lets the pod start when the ConfigMap or key
            # does not exist.
            - name: XID_CONFIG
              valueFrom:
                configMapKeyRef:
                  key: HealthCriticalXid
                  name: xid-config
                  optional: true
            # Points inside the /usr/local/nvidia mount declared below.
            - name: LD_LIBRARY_PATH
              value: /usr/local/nvidia/lib64
            # Quoted on purpose: env var values must be strings.
            - name: GOMAXPROCS
              value: "1"
          # Pinned by digest rather than by a mutable tag.
          image: gcr.io/gke-release/nvidia-gpu-device-plugin@sha256:6b25281cd0fa3ca55f3e837a18be4a14b44952105568f466530dd85bcebde62f
          name: nvidia-gpu-device-plugin
          ports:
            # NOTE(review): presumably the endpoint serving the metrics
            # enabled by --enable-container-gpu-metrics - confirm.
            - containerPort: 2112
              name: metrics
          # Memory request equals the memory limit; no CPU limit is set.
          resources:
            limits:
              memory: 100Mi
            requests:
              cpu: 50m
              memory: 100Mi
          securityContext:
            # NOTE(review): presumably required for access to the host
            # /dev and GPU devices - confirm before tightening.
            privileged: true
          volumeMounts:
            - mountPath: /device-plugin
              name: device-plugin
            - mountPath: /dev
              name: dev
            - mountPath: /usr/local/nvidia
              name: nvidia
            - mountPath: /var/lib/kubelet/pod-resources
              name: pod-resources
            - mountPath: /proc
              name: proc
            - mountPath: /etc/nvidia
              name: nvidia-config
      priorityClassName: system-node-critical
      restartPolicy: Always
      # Pod-level security context (applies to all containers in the pod).
      securityContext:
        seccompProfile:
          type: RuntimeDefault
      # No key is given, so with operator Exists every NoExecute and
      # NoSchedule taint is tolerated.
      tolerations:
        - effect: NoExecute
          operator: Exists
        - effect: NoSchedule
          operator: Exists
      # hostPath type Directory requires the path to already exist on the
      # node; DirectoryOrCreate creates it when missing.
      volumes:
        - hostPath:
            path: /var/lib/kubelet/device-plugins
            type: Directory
          name: device-plugin
        - hostPath:
            path: /dev
            type: Directory
          name: dev
        - hostPath:
            path: /var/lib/kubelet/pod-resources
            type: Directory
          name: pod-resources
        - hostPath:
            path: /proc
            type: Directory
          name: proc
        - hostPath:
            path: /etc/nvidia
            type: DirectoryOrCreate
          name: nvidia-config
        # Host directory mounted into the container at /usr/local/nvidia.
        - hostPath:
            path: /home/kubernetes/bin/nvidia
            type: Directory
          name: nvidia
  updateStrategy:
    type: RollingUpdate