-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathdcgm-exporter.yaml
56 lines (56 loc) · 1.61 KB
/
dcgm-exporter.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
# Runs one instance of dcgm-exporter on every matching node (DaemonSet) and
# exposes its HTTP endpoint on port 9400, annotated for Prometheus scraping.
apiVersion: apps/v1
kind: DaemonSet
metadata:
  name: dcgm-exporter
  labels:
    app.kubernetes.io/name: dcgm-exporter
    app.kubernetes.io/version: '3.0.4-3.0.0-ubuntu20.04'
spec:
  # NOTE(review): the version label is part of the selector. A DaemonSet's
  # spec.selector cannot be changed after creation, so bumping the version
  # here presumably requires deleting and recreating the DaemonSet - confirm
  # this is intended.
  selector:
    matchLabels:
      app.kubernetes.io/name: dcgm-exporter
      app.kubernetes.io/version: '3.0.4-3.0.0-ubuntu20.04'
  template:
    metadata:
      # prometheus.io/* annotations; presumably picked up by an
      # annotation-based Prometheus scrape config defined elsewhere.
      # Annotation values must be strings, hence the quotes.
      annotations:
        prometheus.io/port: '9400'
        prometheus.io/scrape: 'true'
      # Must match spec.selector.matchLabels above.
      labels:
        app.kubernetes.io/name: dcgm-exporter
        app.kubernetes.io/version: '3.0.4-3.0.0-ubuntu20.04'
    spec:
      # References a PriorityClass that is not defined in this file.
      priorityClassName: wes-high-priority
      # Only schedule onto amd64 nodes labelled resource.gpu=true.
      nodeSelector:
        kubernetes.io/arch: amd64
        resource.gpu: 'true'
      containers:
        - name: dcgm-exporter
          image: nvcr.io/nvidia/k8s/dcgm-exporter:3.0.4-3.0.0-ubuntu20.04
          imagePullPolicy: IfNotPresent
          # Grants the SYS_ADMIN capability to the container.
          # NOTE(review): presumably needed by DCGM for some metrics - confirm.
          securityContext:
            capabilities:
              add:
                - SYS_ADMIN
          env:
            # Passed as the string "true", not a YAML boolean.
            # Presumably enables per-pod attribution of GPU metrics - verify
            # against the dcgm-exporter documentation.
            - name: DCGM_EXPORTER_KUBERNETES
              value: 'true'
          ports:
            # hostPort also binds 9400 on the node itself.
            - name: http
              containerPort: 9400
              hostPort: 9400
          # Requests and limits are set to the same values.
          resources:
            requests:
              cpu: 50m
              memory: 50Mi
            limits:
              cpu: 50m
              memory: 50Mi
          volumeMounts:
            # Host directory mounted read-only at the same path it has on
            # the node.
            - name: pod-gpu-resources
              mountPath: /var/lib/kubelet/pod-resources
              readOnly: true
      volumes:
        - name: pod-gpu-resources
          hostPath:
            path: /var/lib/kubelet/pod-resources