Skip to content

Commit 17769b6

Browse files
Merge pull request #2558 from yevgeny-shnaidman/yevgeny/update-configmap-accelerators
MON-4189:Updating node-exporter accelerators configmap
2 parents 8804294 + 3781788 commit 17769b6

File tree

2 files changed

+182
-22
lines changed

2 files changed

+182
-22
lines changed

assets/node-exporter/accelerators-collector-configmap.yaml

Lines changed: 108 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -2,24 +2,118 @@ apiVersion: v1
22
data:
33
config.yaml: |-
44
- "models":
5-
- "modelName": "A100"
5+
- "modelName": "NVIDIA A800 PCIe 80GB"
6+
"pciID": "0x20f5"
7+
- "modelName": "NVIDIA A800 40GB PCIe active cooled"
8+
"pciID": "0x20f6"
9+
- "modelName": "NVIDIA AX800"
10+
"pciID": "0x20fd"
11+
- "modelName": "NVIDIA A100 PCIe 40GB"
12+
"pciID": "0x20f1"
13+
- "modelName": "NVIDIA A100 PCIe 80GB"
614
"pciID": "0x20b5"
7-
- "modelName": "RTX_A6000"
8-
"pciID": "0x2230"
9-
- "modelName": "RTX_4090"
10-
"pciID": "0x2717"
11-
- "modelName": "A40"
15+
- "modelName": "NVIDIA A40"
1216
"pciID": "0x2235"
13-
- "modelName": "V100"
14-
"pciID": "0x1df5"
15-
- "modelName": "A100 40G"
16-
"pciID": "0x20f1"
17-
- "modelName": "T400 4GB"
18-
"pciID": "0x1ff2"
19-
- "modelName": "Tesla T4"
20-
"pciID": "0x1eb8"
17+
- "modelName": "NVIDIA A30"
18+
"pciID": "0x20b7"
19+
- "modelName": "NVIDIA A10"
20+
"pciID": "0x2236"
21+
- "modelName": "NVIDIA A16"
22+
"pciID": "0x25b6"
23+
- "modelName": "NVIDIA H800 PCIe"
24+
"pciID": "0x2322"
25+
- "modelName": "NVIDIA H100 NVL"
26+
"pciID": "0x2321"
27+
- "modelName": "NVIDIA H100 PCIe 80GB"
28+
"pciID": "0x2331"
29+
- "modelName": "NVIDIA L40"
30+
"pciID": "0x26b5"
31+
- "modelName": "NVIDIA L40S"
32+
"pciID": "0x26b9"
33+
- "modelName": "NVIDIA L20 liquid cooled"
34+
"pciID": "0x26ba"
35+
- "modelName": "NVIDIA L4"
36+
"pciID": "0x27b8"
37+
- "modelName": "NVIDIA L2"
38+
"pciID": "0x27b6"
39+
- "modelName": "NVIDIA RTX 6000 Ada"
40+
"pciID": "0x26b1"
41+
- "modelName": "NVIDIA RTX 5880 Ada"
42+
"pciID": "0x26b3"
43+
- "modelName": "NVIDIA RTX A5000"
44+
"pciID": "0x2231"
45+
- "modelName": "NVIDIA RTX A6000"
46+
"pciID": "0x2230"
47+
- "modelName": "NVIDIA RTX A5500"
48+
"pciID": "0x2233"
49+
- "modelName": "NVIDIA RTX 8000 passive"
50+
"pciID": "0x1e30"
51+
- "modelName": "NVIDIA RTX A2000"
52+
"pciID": "0x2531"
53+
- "modelName": "NVIDIA A100 SXM4 40GB"
54+
"pciID": "0x20b0"
55+
- "modelName": "NVIDIA H800 NVL"
56+
"pciID": "0x233a"
57+
- "modelName": "NVIDIA H200 NVL"
58+
"pciID": "0x233b"
59+
- "modelName": "NVIDIA A100 SXM4 80GB"
60+
"pciID": "0x20b2"
61+
- "modelName": "NVIDIA A100 SXM 64GB"
62+
"pciID": "0x20b3"
63+
- "modelName": "NVIDIA A800 SXM4 40GB"
64+
"pciID": "0x20bd"
65+
- "modelName": "NVIDIA A800 SXM4 80GB"
66+
"pciID": "0x20f3"
67+
- "modelName": "NVIDIA RTX A1000"
68+
"pciID": "0x25b0"
2169
"vendorID": "0x10de"
2270
"vendorName": "NVIDIA"
71+
- "models":
72+
- "modelName": "AMD MI210"
73+
"pciID": "0x740f"
74+
- "modelName": "AMD MI250"
75+
"pciID": "0x740c"
76+
- "modelName": "AMD MI250X"
77+
"pciID": "0x7408"
78+
- "modelName": "AMD MI300"
79+
"pciID": "0x74a0"
80+
- "modelName": "AMD MI300X"
81+
"pciID": "0x74a1"
82+
- "modelName": "AMD MI325X"
83+
"pciID": "0x74a5"
84+
- "modelName": "AMD MI308X"
85+
"pciID": "0x74a2"
86+
- "modelName": "AMD MI300X VF"
87+
"pciID": "0x74b5"
88+
- "modelName": "AMD MI210 VF"
89+
"pciID": "0x7410"
90+
"vendorID": "0x1002"
91+
"vendorName": "AMD"
92+
- "models":
93+
- "modelName": "Gaudi 1"
94+
"pciID": "0x1000"
95+
- "modelName": "Gaudi 2"
96+
"pciID": "0x1020"
97+
"vendorID": "0x1da3"
98+
"vendorName": "GAUDI"
99+
- "models":
100+
- "modelName": "Intel Data Center GPU Max 1550"
101+
"pciID": "0x0bd5"
102+
- "modelName": "Intel Data Center GPU Max 1100"
103+
"pciID": "0x0bda"
104+
- "modelName": "Intel Data Center GPU Flex 170"
105+
"pciID": "0x56c0"
106+
- "modelName": "Intel Data Center GPU Flex 140"
107+
"pciID": "0x56c1"
108+
"vendorID": "0x8086"
109+
"vendorName": "Intel"
110+
- "models":
111+
- "modelName": "Qualcomm AI 100"
112+
"pciID": "0xa100"
113+
- "modelName": "Qualcomm AI 80"
114+
"pciID": "0xa080"
115+
"vendorID": "0x17cb"
116+
"vendorName": "Qualcomm"
23117
kind: ConfigMap
24118
metadata:
25119
labels:

jsonnet/components/node-exporter.libsonnet

Lines changed: 74 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -12,16 +12,82 @@ local acceleratorsConfigData = [
1212
vendorName: 'NVIDIA',
1313
vendorID: '0x10de',
1414
models: [
15-
{ pciID: '0x20b5', modelName: 'A100' },
16-
{ pciID: '0x2230', modelName: 'RTX_A6000' },
17-
{ pciID: '0x2717', modelName: 'RTX_4090' },
18-
{ pciID: '0x2235', modelName: 'A40' },
19-
{ pciID: '0x1df5', modelName: 'V100' },
20-
{ pciID: '0x20f1', modelName: 'A100 40G' },
21-
{ pciID: '0x1ff2', modelName: 'T400 4GB' },
22-
{ pciID: '0x1eb8', modelName: 'Tesla T4' },
15+
{ pciID: '0x20f5', modelName: 'NVIDIA A800 PCIe 80GB' },
16+
{ pciID: '0x20f6', modelName: 'NVIDIA A800 40GB PCIe active cooled' },
17+
{ pciID: '0x20fd', modelName: 'NVIDIA AX800' },
18+
{ pciID: '0x20f1', modelName: 'NVIDIA A100 PCIe 40GB' },
19+
{ pciID: '0x20b5', modelName: 'NVIDIA A100 PCIe 80GB' },
20+
{ pciID: '0x2235', modelName: 'NVIDIA A40' },
21+
{ pciID: '0x20b7', modelName: 'NVIDIA A30' },
22+
{ pciID: '0x2236', modelName: 'NVIDIA A10' },
23+
{ pciID: '0x25b6', modelName: 'NVIDIA A16' },
24+
{ pciID: '0x2322', modelName: 'NVIDIA H800 PCIe' },
25+
{ pciID: '0x2321', modelName: 'NVIDIA H100 NVL' },
26+
{ pciID: '0x2331', modelName: 'NVIDIA H100 PCIe 80GB' },
27+
{ pciID: '0x26b5', modelName: 'NVIDIA L40' },
28+
{ pciID: '0x26b9', modelName: 'NVIDIA L40S' },
29+
{ pciID: '0x26ba', modelName: 'NVIDIA L20 liquid cooled' },
30+
{ pciID: '0x27b8', modelName: 'NVIDIA L4' },
31+
{ pciID: '0x27b6', modelName: 'NVIDIA L2' },
32+
{ pciID: '0x26b1', modelName: 'NVIDIA RTX 6000 Ada' },
33+
{ pciID: '0x26b3', modelName: 'NVIDIA RTX 5880 Ada' },
34+
{ pciID: '0x2231', modelName: 'NVIDIA RTX A5000' },
35+
{ pciID: '0x2230', modelName: 'NVIDIA RTX A6000' },
36+
{ pciID: '0x2233', modelName: 'NVIDIA RTX A5500' },
37+
{ pciID: '0x1e30', modelName: 'NVIDIA RTX 8000 passive' },
38+
{ pciID: '0x2531', modelName: 'NVIDIA RTX A2000' },
39+
{ pciID: '0x20b0', modelName: 'NVIDIA A100 SXM4 40GB' },
40+
{ pciID: '0x233a', modelName: 'NVIDIA H800 NVL' },
41+
{ pciID: '0x233b', modelName: 'NVIDIA H200 NVL' },
42+
{ pciID: '0x20b2', modelName: 'NVIDIA A100 SXM4 80GB' },
43+
{ pciID: '0x20b3', modelName: 'NVIDIA A100 SXM 64GB' },
44+
{ pciID: '0x20bd', modelName: 'NVIDIA A800 SXM4 40GB' },
45+
{ pciID: '0x20f3', modelName: 'NVIDIA A800 SXM4 80GB' },
46+
{ pciID: '0x25b0', modelName: 'NVIDIA RTX A1000' },
2347
],
2448
},
49+
{
50+
vendorName: 'AMD',
51+
vendorID: '0x1002',
52+
models: [
53+
{ pciID: '0x740f', modelName: 'AMD MI210' },
54+
{ pciID: '0x740c', modelName: 'AMD MI250' },
55+
{ pciID: '0x7408', modelName: 'AMD MI250X' },
56+
{ pciID: '0x74a0', modelName: 'AMD MI300' },
57+
{ pciID: '0x74a1', modelName: 'AMD MI300X' },
58+
{ pciID: '0x74a5', modelName: 'AMD MI325X' },
59+
{ pciID: '0x74a2', modelName: 'AMD MI308X' },
60+
{ pciID: '0x74b5', modelName: 'AMD MI300X VF' },
61+
{ pciID: '0x7410', modelName: 'AMD MI210 VF' },
62+
],
63+
},
64+
{
65+
vendorName: 'GAUDI',
66+
vendorID: '0x1da3',
67+
models: [
68+
{ pciID: '0x1000', modelName: 'Gaudi 1' },
69+
{ pciID: '0x1020', modelName: 'Gaudi 2' },
70+
],
71+
},
72+
{
73+
vendorName: 'Intel',
74+
vendorID: '0x8086',
75+
models: [
76+
{ pciID: '0x0bd5', modelName: 'Intel Data Center GPU Max 1550' },
77+
{ pciID: '0x0bda', modelName: 'Intel Data Center GPU Max 1100' },
78+
{ pciID: '0x56c0', modelName: 'Intel Data Center GPU Flex 170' },
79+
{ pciID: '0x56c1', modelName: 'Intel Data Center GPU Flex 140' },
80+
],
81+
},
82+
{
83+
vendorName: 'Qualcomm',
84+
vendorID: '0x17cb',
85+
models: [
86+
{ pciID: '0xa100', modelName: 'Qualcomm AI 100' },
87+
{ pciID: '0xa080', modelName: 'Qualcomm AI 80' },
88+
],
89+
},
90+
2591
];
2692

2793
local nodeExporter = import 'github.com/prometheus-operator/kube-prometheus/jsonnet/kube-prometheus/components/node-exporter.libsonnet';

0 commit comments

Comments
 (0)