linux-kernel.vger.kernel.org archive mirror
 help / color / mirror / Atom feed
From: Robert Richter <rrichter@marvell.com>
To: Borislav Petkov <bp@alien8.de>, James Morse <james.morse@arm.com>,
	"Mauro Carvalho Chehab" <mchehab@kernel.org>
Cc: "linux-edac@vger.kernel.org" <linux-edac@vger.kernel.org>,
	"linux-kernel@vger.kernel.org" <linux-kernel@vger.kernel.org>,
	Robert Richter <rrichter@marvell.com>
Subject: [PATCH v2 17/24] EDAC, ghes: Create one memory controller device per node
Date: Mon, 24 Jun 2019 15:09:29 +0000	[thread overview]
Message-ID: <20190624150758.6695-18-rrichter@marvell.com> (raw)
In-Reply-To: <20190624150758.6695-1-rrichter@marvell.com>

Most systems have one EDAC memory controller device per node.
Implement the same for the ghes driver: create multiple mc devices
and map the DIMMs to them based on the node id.

At least one mc device is needed as a fallback in case no node
information is available in the error report. The first registered
node's mc device is used for that.

Here is a complete and consistent error report from a ThunderX2 system
(zero counter values dropped):

 # find /sys/devices/system/edac/mc/ -name \*count | sort -V | xargs grep . | sed -e '/:0/d'
 /sys/devices/system/edac/mc/mc0/ce_count:11
 /sys/devices/system/edac/mc/mc0/ce_noinfo_count:1
 /sys/devices/system/edac/mc/mc0/csrow2/ce_count:5
 /sys/devices/system/edac/mc/mc0/csrow2/ch0_ce_count:5
 /sys/devices/system/edac/mc/mc0/csrow3/ce_count:3
 /sys/devices/system/edac/mc/mc0/csrow3/ch0_ce_count:3
 /sys/devices/system/edac/mc/mc0/csrow4/ce_count:2
 /sys/devices/system/edac/mc/mc0/csrow4/ch0_ce_count:2
 /sys/devices/system/edac/mc/mc0/dimm2/dimm_ce_count:5
 /sys/devices/system/edac/mc/mc0/dimm3/dimm_ce_count:3
 /sys/devices/system/edac/mc/mc0/dimm4/dimm_ce_count:2
 /sys/devices/system/edac/mc/mc1/ce_count:7
 /sys/devices/system/edac/mc/mc1/csrow2/ce_count:4
 /sys/devices/system/edac/mc/mc1/csrow2/ch0_ce_count:4
 /sys/devices/system/edac/mc/mc1/csrow3/ce_count:1
 /sys/devices/system/edac/mc/mc1/csrow3/ch0_ce_count:1
 /sys/devices/system/edac/mc/mc1/csrow6/ce_count:2
 /sys/devices/system/edac/mc/mc1/csrow6/ch0_ce_count:2
 /sys/devices/system/edac/mc/mc1/dimm2/dimm_ce_count:4
 /sys/devices/system/edac/mc/mc1/dimm3/dimm_ce_count:1
 /sys/devices/system/edac/mc/mc1/dimm6/dimm_ce_count:2

Signed-off-by: Robert Richter <rrichter@marvell.com>
---
 drivers/edac/ghes_edac.c | 126 ++++++++++++++++++++++++++++++++-------
 1 file changed, 104 insertions(+), 22 deletions(-)

diff --git a/drivers/edac/ghes_edac.c b/drivers/edac/ghes_edac.c
index 13b74368ad81..63de11654649 100644
--- a/drivers/edac/ghes_edac.c
+++ b/drivers/edac/ghes_edac.c
@@ -16,6 +16,7 @@
 #include <ras/ras_event.h>
 
 struct ghes_edac_pvt {
+	struct device dev;
 	struct list_head list;
 	struct ghes *ghes;
 	struct mem_ctl_info *mci;
@@ -26,7 +27,7 @@ struct ghes_edac_pvt {
 };
 
 static atomic_t ghes_init = ATOMIC_INIT(0);
-static struct ghes_edac_pvt *ghes_pvt;
+struct mem_ctl_info *fallback;
 
 /*
  * Sync with other, potentially concurrent callers of
@@ -172,15 +173,15 @@ static void ghes_edac_set_nid(const struct dmi_header *dh, void *arg)
 	}
 }
 
-static int get_dimm_smbios_index(u16 handle)
+static int get_dimm_smbios_index(struct mem_ctl_info *mci, u16 handle)
 {
-	struct mem_ctl_info *mci = ghes_pvt->mci;
 	struct dimm_info *dimm;
 
 	mci_for_each_dimm(mci, dimm) {
 		if (dimm->smbios_handle == handle)
 			return dimm->idx;
 	}
+
 	return -1;
 }
 
@@ -364,6 +365,9 @@ static void mem_info_prepare_mci(struct mem_ctl_info *mci)
 	int index = 0;
 
 	for_each_dimm(dimm) {
+		if (mci->mc_idx != dimm->numa_node)
+			continue;
+
 		dmi_dimm = &dimm->dimm_info;
 		mci_dimm = edac_get_dimm_by_index(mci, index);
 
@@ -384,17 +388,35 @@ static void mem_info_prepare_mci(struct mem_ctl_info *mci)
 			index, mci->tot_dimms);
 }
 
+static struct mem_ctl_info *get_mc_by_node(int nid)
+{
+	struct mem_ctl_info *mci = edac_mc_find(nid);
+
+	if (mci)
+		return mci;
+
+	if (num_possible_nodes() > 1) {
+		edac_mc_printk(fallback, KERN_WARNING,
+			"Invalid or no node information, falling back to first node: %s",
+			fallback->dev_name);
+	}
+
+	return fallback;
+}
+
 void ghes_edac_report_mem_error(int sev, struct cper_sec_mem_err *mem_err)
 {
 	struct dimm_info *dimm_info;
 	enum hw_event_mc_err_type type;
 	struct edac_raw_error_desc *e;
 	struct mem_ctl_info *mci;
-	struct ghes_edac_pvt *pvt = ghes_pvt;
+	struct ghes_edac_pvt *pvt;
 	unsigned long flags;
 	char *p;
+	int nid = NUMA_NO_NODE;
 
-	if (!pvt)
+	/* We need at least one mc */
+	if (WARN_ON_ONCE(!fallback))
 		return;
 
 	/*
@@ -407,7 +429,11 @@ void ghes_edac_report_mem_error(int sev, struct cper_sec_mem_err *mem_err)
 
 	spin_lock_irqsave(&ghes_lock, flags);
 
-	mci = pvt->mci;
+	/* select the node's mc device */
+	if (mem_err->validation_bits & CPER_MEM_VALID_NODE)
+		nid = mem_err->node;
+	mci = get_mc_by_node(nid);
+	pvt = mci->pvt_info;
 	e = &mci->error_desc;
 
 	/* Cleans the error report buffer */
@@ -541,7 +567,7 @@ void ghes_edac_report_mem_error(int sev, struct cper_sec_mem_err *mem_err)
 			p += sprintf(p, "DIMM DMI handle: 0x%.4x ",
 				     mem_err->mem_dev_handle);
 
-		index = get_dimm_smbios_index(mem_err->mem_dev_handle);
+		index = get_dimm_smbios_index(mci, mem_err->mem_dev_handle);
 		if (index >= 0)
 			e->top_layer = index;
 	}
@@ -640,15 +666,29 @@ static struct acpi_platform_list plat_list[] = {
 	{ } /* End */
 };
 
+void ghes_edac_release(struct device *dev)
+{
+	struct ghes_edac_pvt *ghes_pvt;
+	struct mem_ctl_info *mci;
+
+	ghes_pvt = container_of(dev, struct ghes_edac_pvt, dev);
+
+	mci = ghes_pvt->mci;
+	edac_mc_del_mc(mci->pdev);
+	edac_mc_free(mci);
+}
+
 static int
 ghes_edac_register_one(int nid, struct ghes *ghes, struct device *parent)
 {
+	struct device *dev;
+	struct ghes_edac_pvt *ghes_pvt;
 	int rc;
 	struct mem_ctl_info *mci;
 	struct edac_mc_layer layers[1];
 
 	layers[0].type = EDAC_MC_LAYER_ALL_MEM;
-	layers[0].size = mem_info.num_dimm;
+	layers[0].size = mem_info.dimms_per_node[nid];
 	layers[0].is_virt_csrow = true;
 
 	mci = edac_mc_alloc(nid, ARRAY_SIZE(layers), layers,
@@ -662,43 +702,69 @@ ghes_edac_register_one(int nid, struct ghes *ghes, struct device *parent)
 	ghes_pvt->ghes	= ghes;
 	ghes_pvt->mci	= mci;
 
-	mci->pdev = parent;
+	dev		= &ghes_pvt->dev;
+	dev->parent	= parent;
+	dev->release	= ghes_edac_release;
+	dev_set_name(dev, "ghes_mc%d", nid);
+
+	rc = device_register(dev);
+	if (rc) {
+		pr_err("Can't create EDAC device (%d)\n", rc);
+		goto fail;
+	}
+
+	mci->pdev = dev;
 	mci->mtype_cap = MEM_FLAG_EMPTY;
 	mci->edac_ctl_cap = EDAC_FLAG_NONE;
 	mci->edac_cap = EDAC_FLAG_NONE;
 	mci->mod_name = "ghes_edac.c";
-	mci->ctl_name = "ghes_edac";
-	mci->dev_name = "ghes";
+	mci->ctl_name = "ghes_mc";
+	mci->dev_name = dev_name(dev);
 
 	mem_info_prepare_mci(mci);
 
 	rc = edac_mc_add_mc(mci);
 	if (rc < 0) {
-		pr_err("Can't register at EDAC core\n");
-		edac_mc_free(mci);
-		return -ENODEV;
+		pr_err("Can't register at EDAC core (%d)\n", rc);
+		goto fail;
 	}
+
 	return 0;
+fail:
+	put_device(dev);
+	return rc;
+}
+
+static void ghes_edac_unregister_one(struct mem_ctl_info *mci)
+{
+	struct ghes_edac_pvt *pvt = mci->pvt_info;
+
+	put_device(&pvt->dev);
 }
 
 void ghes_edac_unregister(struct ghes *ghes)
 {
 	struct mem_ctl_info *mci;
+	int nid;
 
-	if (!ghes_pvt)
-		return;
-
-	mci = ghes_pvt->mci;
-	edac_mc_del_mc(mci->pdev);
-	edac_mc_free(mci);
+	for_each_node(nid) {
+		mci = edac_mc_find(nid);
+		/* stop fallback at last */
+		if (mci && mci != fallback)
+			ghes_edac_unregister_one(mci);
+	}
 
+	ghes_edac_unregister_one(fallback);
+	fallback = NULL;
 	kfree(mem_info.dimms);
+	atomic_dec(&ghes_init);
 }
 
 int ghes_edac_register(struct ghes *ghes, struct device *dev)
 {
 	bool fake = false;
 	int rc;
+	int nid;
 	int idx = -1;
 
 	if (IS_ENABLED(CONFIG_X86)) {
@@ -738,7 +804,23 @@ int ghes_edac_register(struct ghes *ghes, struct device *dev)
 		pr_info("This system has %d DIMM sockets.\n", mem_info.num_dimm);
 	}
 
-	rc = ghes_edac_register_one(0, ghes, dev);
+	for_each_node(nid) {
+		if (!mem_info.dimms_per_node[nid])
+			continue;
 
-	return rc;
+		rc = ghes_edac_register_one(nid, ghes, dev);
+		if (rc) {
+			ghes_edac_unregister(ghes);
+			return rc;
+		}
+
+		/*
+		 * use the first node's mc as fallback in case we can
+		 * not detect the node from the error information
+		 */
+		if (!fallback)
+			fallback = edac_mc_find(nid);
+	}
+
+	return 0;
 }
-- 
2.20.1


  parent reply	other threads:[~2019-06-24 15:09 UTC|newest]

Thread overview: 52+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2019-06-24 15:08 [PATCH v2 00/24] EDAC, mc, ghes: Fixes and updates to improve memory error reporting Robert Richter
2019-06-24 15:08 ` [PATCH v2 01/24] EDAC, mc: Fix grain_bits calculation Robert Richter
2019-08-03 10:08   ` Borislav Petkov
2019-06-24 15:08 ` [PATCH v2 02/24] EDAC, ghes: Fix grain calculation Robert Richter
2019-08-09 13:15   ` Borislav Petkov
2019-08-12  6:42     ` Robert Richter
2019-08-12  7:32       ` Borislav Petkov
2019-08-12 12:05         ` Robert Richter
2019-08-12 12:38           ` Borislav Petkov
2019-06-24 15:08 ` [PATCH v2 03/24] EDAC, ghes: Remove pvt->detail_location string Robert Richter
2019-08-02 17:04   ` James Morse
2019-08-07  9:00     ` Robert Richter
2019-08-13  8:09   ` Borislav Petkov
2019-06-24 15:09 ` [PATCH v2 04/24] EDAC, ghes: Unify trace_mc_event() code with edac_mc driver Robert Richter
2019-06-24 15:09 ` [PATCH v2 05/24] EDAC, mc: Fix and improve sysfs init functions Robert Richter
2019-08-13  8:26   ` Borislav Petkov
2019-06-24 15:09 ` [PATCH v2 06/24] EDAC: Kill EDAC_DIMM_PTR() macro Robert Richter
2019-08-13 14:59   ` Borislav Petkov
2019-08-27 12:20     ` Robert Richter
2019-06-24 15:09 ` [PATCH v2 07/24] EDAC: Kill EDAC_DIMM_OFF() macro Robert Richter
2019-08-14 14:52   ` Borislav Petkov
2019-06-24 15:09 ` [PATCH v2 08/24] EDAC: Introduce mci_for_each_dimm() iterator Robert Richter
2019-08-14 15:18   ` Borislav Petkov
2019-08-28  8:18     ` Robert Richter
2019-06-24 15:09 ` [PATCH v2 09/24] EDAC, mc: Cleanup _edac_mc_free() code Robert Richter
2019-08-14 16:31   ` Borislav Petkov
2019-06-24 15:09 ` [PATCH v2 10/24] EDAC, mc: Remove per layer counters Robert Richter
2019-08-16  9:24   ` Borislav Petkov
2019-06-24 15:09 ` [PATCH v2 11/24] EDAC, mc: Rework edac_raw_mc_handle_error() to use struct dimm_info Robert Richter
2019-06-24 15:09 ` [PATCH v2 12/24] EDAC, ghes: Use standard kernel macros for page calculations Robert Richter
2019-08-02 17:04   ` James Morse
2019-08-07  9:52     ` Robert Richter
2019-06-24 15:09 ` [PATCH v2 13/24] EDAC, ghes: Add support for legacy API counters Robert Richter
2019-08-16  9:55   ` Borislav Petkov
2019-08-30  9:35     ` Robert Richter
2019-06-24 15:09 ` [PATCH v2 14/24] EDAC, ghes: Rework memory hierarchy detection Robert Richter
2019-08-20  8:56   ` Borislav Petkov
2019-06-24 15:09 ` [PATCH v2 15/24] EDAC, ghes: Extract numa node information for each dimm Robert Richter
2019-08-02 17:05   ` James Morse
2019-08-09 13:09     ` Robert Richter
2019-06-24 15:09 ` [PATCH v2 16/24] EDAC, ghes: Moving code around ghes_edac_register() Robert Richter
2019-06-24 15:09 ` Robert Richter [this message]
2019-06-24 15:09 ` [PATCH v2 18/24] EDAC, ghes: Fill sysfs with the DMI DIMM label information Robert Richter
2019-06-24 15:09 ` [PATCH v2 19/24] EDAC, mc: Introduce edac_mc_alloc_by_dimm() for per dimm allocation Robert Richter
2019-06-24 15:09 ` [PATCH v2 20/24] EDAC, ghes: Identify dimm by node, card, module and handle Robert Richter
2019-06-24 15:09 ` [PATCH v2 21/24] EDAC, ghes: Enable per-layer reporting based on card/module Robert Richter
2019-06-24 15:09 ` [PATCH v2 22/24] EDAC, ghes: Move struct member smbios_handle to struct ghes_dimm_info Robert Richter
2019-06-24 15:09 ` [PATCH v2 23/24] EDAC, Documentation: Describe CPER module definition and DIMM ranks Robert Richter
2019-06-24 15:09 ` [PATCH v2 24/24] EDAC, ghes: Disable legacy API for ARM64 Robert Richter
2019-06-26  9:33   ` James Morse
2019-06-26 10:11     ` Robert Richter
2019-08-02  7:58 ` [PATCH v2 00/24] EDAC, mc, ghes: Fixes and updates to improve memory error reporting Robert Richter

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=20190624150758.6695-18-rrichter@marvell.com \
    --to=rrichter@marvell.com \
    --cc=bp@alien8.de \
    --cc=james.morse@arm.com \
    --cc=linux-edac@vger.kernel.org \
    --cc=linux-kernel@vger.kernel.org \
    --cc=mchehab@kernel.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).