Skip to content

FCPSE-3679: Add error counts / dimm channel for edac collector #3571

Open
Manognagrandhi wants to merge 1 commit into prometheus:master from
Manognagrandhi:FCPSE-3679
Open

FCPSE-3679: Add error counts / dimm channel for edac collector #3571
Manognagrandhi wants to merge 1 commit into prometheus:master from
Manognagrandhi:FCPSE-3679

Conversation

@Manognagrandhi
Copy link

@Manognagrandhi Manognagrandhi commented Mar 4, 2026

# TYPE node_edac_correctable_errors_total counter
node_edac_correctable_errors_total{controller="0"} 0
node_edac_correctable_errors_total{controller="1"} 0
node_edac_correctable_errors_total{controller="2"} 0
node_edac_correctable_errors_total{controller="3"} 0
# HELP node_edac_dimm_correctable_errors_total Total correctable memory errors for this dimm.
# TYPE node_edac_dimm_correctable_errors_total counter
node_edac_dimm_correctable_errors_total{controller="0",dimm="0"} 0
node_edac_dimm_correctable_errors_total{controller="0",dimm="1"} 0
node_edac_dimm_correctable_errors_total{controller="0",dimm="2"} 0
node_edac_dimm_correctable_errors_total{controller="0",dimm="3"} 0
node_edac_dimm_correctable_errors_total{controller="1",dimm="0"} 0
node_edac_dimm_correctable_errors_total{controller="1",dimm="1"} 0
node_edac_dimm_correctable_errors_total{controller="1",dimm="2"} 0
node_edac_dimm_correctable_errors_total{controller="1",dimm="3"} 0
node_edac_dimm_correctable_errors_total{controller="2",dimm="0"} 0
node_edac_dimm_correctable_errors_total{controller="2",dimm="1"} 0
node_edac_dimm_correctable_errors_total{controller="2",dimm="2"} 0
node_edac_dimm_correctable_errors_total{controller="2",dimm="3"} 0
node_edac_dimm_correctable_errors_total{controller="3",dimm="0"} 0
node_edac_dimm_correctable_errors_total{controller="3",dimm="1"} 0
node_edac_dimm_correctable_errors_total{controller="3",dimm="2"} 0
node_edac_dimm_correctable_errors_total{controller="3",dimm="3"} 0
# HELP node_edac_dimm_label Label of the dimm.
# TYPE node_edac_dimm_label gauge
node_edac_dimm_label{channel="0",controller="0",dimm="0",label="CPU_SrcID#0_MC#0_Chan#0_DIMM#0"} 1
node_edac_dimm_label{channel="0",controller="0",dimm="1",label="CPU_SrcID#0_MC#0_Chan#0_DIMM#1"} 1
node_edac_dimm_label{channel="0",controller="1",dimm="0",label="CPU_SrcID#0_MC#1_Chan#0_DIMM#0"} 1
node_edac_dimm_label{channel="0",controller="1",dimm="1",label="CPU_SrcID#0_MC#1_Chan#0_DIMM#1"} 1
node_edac_dimm_label{channel="0",controller="2",dimm="0",label="CPU_SrcID#1_MC#0_Chan#0_DIMM#0"} 1
node_edac_dimm_label{channel="0",controller="2",dimm="1",label="CPU_SrcID#1_MC#0_Chan#0_DIMM#1"} 1
node_edac_dimm_label{channel="0",controller="3",dimm="0",label="CPU_SrcID#1_MC#1_Chan#0_DIMM#0"} 1
node_edac_dimm_label{channel="0",controller="3",dimm="1",label="CPU_SrcID#1_MC#1_Chan#0_DIMM#1"} 1
node_edac_dimm_label{channel="1",controller="0",dimm="2",label="CPU_SrcID#0_MC#0_Chan#1_DIMM#0"} 1
node_edac_dimm_label{channel="1",controller="0",dimm="3",label="CPU_SrcID#0_MC#0_Chan#1_DIMM#1"} 1
node_edac_dimm_label{channel="1",controller="1",dimm="2",label="CPU_SrcID#0_MC#1_Chan#1_DIMM#0"} 1
node_edac_dimm_label{channel="1",controller="1",dimm="3",label="CPU_SrcID#0_MC#1_Chan#1_DIMM#1"} 1
node_edac_dimm_label{channel="1",controller="2",dimm="2",label="CPU_SrcID#1_MC#0_Chan#1_DIMM#0"} 1
node_edac_dimm_label{channel="1",controller="2",dimm="3",label="CPU_SrcID#1_MC#0_Chan#1_DIMM#1"} 1
node_edac_dimm_label{channel="1",controller="3",dimm="2",label="CPU_SrcID#1_MC#1_Chan#1_DIMM#0"} 1
node_edac_dimm_label{channel="1",controller="3",dimm="3",label="CPU_SrcID#1_MC#1_Chan#1_DIMM#1"} 1
# HELP node_edac_dimm_uncorrectable_errors_total Total uncorrectable memory errors for this dimm.
# TYPE node_edac_dimm_uncorrectable_errors_total counter
node_edac_dimm_uncorrectable_errors_total{controller="0",dimm="0"} 0
node_edac_dimm_uncorrectable_errors_total{controller="0",dimm="1"} 0
node_edac_dimm_uncorrectable_errors_total{controller="0",dimm="2"} 0
node_edac_dimm_uncorrectable_errors_total{controller="0",dimm="3"} 0
node_edac_dimm_uncorrectable_errors_total{controller="1",dimm="0"} 0
node_edac_dimm_uncorrectable_errors_total{controller="1",dimm="1"} 0
node_edac_dimm_uncorrectable_errors_total{controller="1",dimm="2"} 0
node_edac_dimm_uncorrectable_errors_total{controller="1",dimm="3"} 0
node_edac_dimm_uncorrectable_errors_total{controller="2",dimm="0"} 0
node_edac_dimm_uncorrectable_errors_total{controller="2",dimm="1"} 0
node_edac_dimm_uncorrectable_errors_total{controller="2",dimm="2"} 0
node_edac_dimm_uncorrectable_errors_total{controller="2",dimm="3"} 0
node_edac_dimm_uncorrectable_errors_total{controller="3",dimm="0"} 0
node_edac_dimm_uncorrectable_errors_total{controller="3",dimm="1"} 0
node_edac_dimm_uncorrectable_errors_total{controller="3",dimm="2"} 0
node_edac_dimm_uncorrectable_errors_total{controller="3",dimm="3"} 0
# HELP node_edac_uncorrectable_errors_total Total uncorrectable memory errors.
# TYPE node_edac_uncorrectable_errors_total counter
node_edac_uncorrectable_errors_total{controller="0"} 0
node_edac_uncorrectable_errors_total{controller="1"} 0
node_edac_uncorrectable_errors_total{controller="2"} 0
node_edac_uncorrectable_errors_total{controller="3"} 0

@Manognagrandhi Manognagrandhi changed the title from "add error counts / dimm channel for edac collector" to "FCPSE-3679: Add error counts / dimm channel for edac collector" Mar 4, 2026
@SuperQ
Copy link
Member

SuperQ commented Mar 4, 2026

This needs a DCO sign-off. You can use `git commit -s --amend` to add it.

Copy link
Member

@SuperQ SuperQ left a comment

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Tests don't pass.

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment

Labels

None yet

Projects

None yet

Development

Successfully merging this pull request may close these issues.

2 participants