@@ -69,7 +69,6 @@ local dcgm_metrics = [
6969 { name: 'DCGM_FI_DEV_MEM_COPY_UTIL' , title: 'Memory Copy Utilization' , unit: 'percent' },
7070 { name: 'DCGM_FI_DEV_ENC_UTIL' , title: 'Encoder Utilization' , unit: 'percent' },
7171 { name: 'DCGM_FI_DEV_DEC_UTIL' , title: 'Decoder Utilization' , unit: 'percent' },
72- { name: 'DCGM_FI_DEV_XID_ERRORS' , title: 'Value of the last XID error encountered' , unit: 'none' },
7372 { name: 'DCGM_FI_DEV_FB_FREE' , title: 'Framebuffer memory free (in MiB)' , unit: 'megabytes' },
7473 { name: 'DCGM_FI_DEV_FB_USED' , title: 'Framebuffer memory used (in MiB)' , unit: 'megabytes' },
7574 { name: 'DCGM_FI_DEV_NVLINK_BANDWIDTH_TOTAL' , title: 'Total number of NVLink bandwidth counters for all lanes' , unit: 'none' },
@@ -83,6 +82,7 @@ local dcgm_errors = [
8382 { name: 'DCGM_FI_DEV_UNCORRECTABLE_REMAPPED_ROWS' , title: 'Number of remapped rows for uncorrectable errors' , unit: 'cps' },
8483 { name: 'DCGM_FI_DEV_CORRECTABLE_REMAPPED_ROWS' , title: 'Number of remapped rows for correctable errors' , unit: 'cps' },
8584 { name: 'DCGM_FI_DEV_ROW_REMAP_FAILURE' , title: 'Whether remapping of rows has failed' , unit: 'cps' },
85+ { name: 'DCGM_FI_DEV_XID_ERRORS' , title: 'Value of the last XID error encountered' , unit: 'none' },
8686];
8787
8888local nvlink_metrics = [
0 commit comments