You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
Copy file name to clipboardExpand all lines: gpu/metadata.csv
+4-2Lines changed: 4 additions & 2 deletions
Original file line number
Diff line number
Diff line change
@@ -15,7 +15,6 @@ gpu.clock.throttle_reasons.sw_power_cap,gauge,,,,GPU clocks that are throttled t
15
15
gpu.clock.throttle_reasons.sw_thermal_slowdown,gauge,,,,GPU clocks that are throttled to avoid exceeding temperature limits,0,gpu,clock.throttle_reasons.sw_thermal_slowdown,,
16
16
gpu.clock.throttle_reasons.sync_boost,gauge,,,,GPU clocks that are throttled to match clock speed of another GPU in the current sync boost group,0,gpu,clock.throttle_reasons.sync_boost,,
17
17
gpu.core.limit,gauge,,core,,Number of GPU cores that the process/container/device has available,0,gpu,core.limit,,
18
-
gpu.core.usage,gauge,,core,,Average number of GPU cores that a process was using in the interval. Only emitted when processes are active.,0,gpu,core.usage,,
19
18
gpu.decoder_utilization,gauge,,percent,,Percentage of time the decoder was active,0,gpu,decoder_utilization,,
20
19
gpu.device.total,gauge,,,,Number of devices active in the host,0,gpu,device.total,,
21
20
gpu.dram_active,gauge,,percent,,Percentage of time the DRAM was active,0,gpu,dram_active,,
@@ -29,9 +28,10 @@ gpu.integer_active,gauge,,percent,,Percentage of the time that the integer calcu
29
28
gpu.memory.bar1.free,gauge,,byte,,Unallocated BAR1 memory (in bytes),0,gpu,memory.bar1.free,,
30
29
gpu.memory.bar1.total,gauge,,byte,,Total BAR1 memory (in bytes).,0,gpu,memory.bar1.total,,
31
30
gpu.memory.bar1.used,gauge,,byte,,Allocated BAR1 memory (in bytes),0,gpu,memory.bar1.used,,
31
+
gpu.memory.free,gauge,,byte,,Unallocated device memory (in bytes).,0,gpu,memory.free,,
32
32
gpu.memory.limit,gauge,,byte,,The maximum amount of memory a process/container/device could allocate,0,gpu,memory.limit,,
33
+
gpu.memory.reserved,gauge,,byte,,Device memory (in bytes) reserved for system use (driver or firmware).,0,gpu,memory.reserved,,
33
34
gpu.memory.temperature,gauge,,degree celsius,,Temperature of the memory chip,0,gpu,memory.temperature,,
34
-
gpu.memory.usage,gauge,,byte,,The memory used by this process at the point the metric was given. Only emitted when processes are active.,0,gpu,memory.usage,,
35
35
gpu.nvlink.count.active,gauge,,,,Number of active nvlinks for the device,0,gpu,,,
36
36
gpu.nvlink.count.inactive,gauge,,,,Number of inactive nvlinks for the device,0,gpu,,,
37
37
gpu.nvlink.count.total,gauge,,,,Number of total nvlinks for the device,0,gpu,,,
@@ -52,9 +52,11 @@ gpu.pci.throughput.tx,gauge,,byte,second,Bytes transmitted through PCI to the GP
52
52
gpu.performance_state,gauge,,,,Returns the current performance state of the device,0,gpu,performance_state,,
53
53
gpu.power.management_limit,gauge,,milliwatt,,Upper boundary for the device power draw.,0,gpu,power.management_limit,,
54
54
gpu.power.usage,gauge,,milliwatt,,"Power usage for the GPU device. On GA100 and older architectures this is the instantaneous power at that moment, in newer ones it represents the average power draw over one second",0,gpu,power.usage,,
55
+
gpu.process.core.usage,gauge,,core,,Average number of GPU cores that a process was using in the interval. Only emitted when processes are active.,0,gpu,process.core.usage,,
55
56
gpu.process.decoder_utilization,gauge,,percent,,Percentage of time the decoder was active for a specific process,0,gpu,process.decoder_utilization,,
56
57
gpu.process.dram_active,gauge,,percent,,Percentage of time the DRAM was active for a specific process,0,gpu,process.dram_active,,
57
58
gpu.process.encoder_utilization,gauge,,percent,,Percentage of time the encoder was active for a specific process,0,gpu,process.encoder_utilization,,
59
+
gpu.process.memory.usage,gauge,,byte,,The memory used by this process at the point the metric was given. Only emitted when processes are active.,0,gpu,process.memory.usage,,
58
60
gpu.process.sm_active,gauge,,percent,,Percentage of time the streaming multiprocessor was active for a specific process,0,gpu,process.sm_active,,
59
61
gpu.remapped_rows.correctable,count,,,,Number of rows remapped due to correctable errors,0,gpu,remapped_rows.correctable,,
60
62
gpu.remapped_rows.failed,count,,,,Number of rows that failed remapping,0,gpu,remapped_rows.failed,,
0 commit comments