[PATCH 2/2] EDAC: add ARM Cortex A15 L2 internal asynchronous error detection driver

From: Wiebe, Wladislav (Nokia - DE/Ulm)
Date: Tue Jan 08 2019 - 03:10:54 EST


This driver adds support for L2 internal asynchronous error detection
caused by L2 RAM double-bit ECC error or illegal writes to the
Interrupt Controller memory-map region on the Cortex A15.

Signed-off-by: Wladislav Wiebe <wladislav.wiebe@xxxxxxxxx>
---
MAINTAINERS | 1 +
drivers/edac/Kconfig | 11 +++
drivers/edac/Makefile | 1 +
drivers/edac/cortex_a15_l2_async_edac.c | 134 ++++++++++++++++++++++++++++++++
4 files changed, 147 insertions(+)
create mode 100644 drivers/edac/cortex_a15_l2_async_edac.c

diff --git a/MAINTAINERS b/MAINTAINERS
index 0796ad6e6490..84dc501b2582 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -1100,6 +1100,7 @@ L: linux-edac@xxxxxxxxxxxxxxx
L: linux-arm-kernel@xxxxxxxxxxxxxxxxxxx (moderated for non-subscribers)
S: Supported
F: Documentation/devicetree/bindings/edac/cortex_a15_l2_async_edac.txt
+F: drivers/edac/cortex_a15_l2_async_edac.c

ARM INTEGRATOR, VERSATILE AND REALVIEW SUPPORT
M: Linus Walleij <linus.walleij@xxxxxxxxxx>
diff --git a/drivers/edac/Kconfig b/drivers/edac/Kconfig
index 41c9ccdd20d6..8722203948e0 100644
--- a/drivers/edac/Kconfig
+++ b/drivers/edac/Kconfig
@@ -475,4 +475,15 @@ config EDAC_QCOM
For debugging issues having to do with stability and overall system
health, you should probably say 'Y' here.

+config EDAC_CORTEX_A15_L2_ASYNC
+ tristate "Cortex A15 ASYNC L2 & illegal GIC write error detection"
+ depends on ARM
+ help
+ Support for L2 internal asynchronous error detection caused by L2 RAM
+ double-bit ECC error or illegal writes to the Interrupt Controller
+ memory-map region on the Cortex A15.
+
+ This driver works in interrupt mode triggered by the nINTERRIRQ and
+ reports only uncorrectable errors.
+
endif # EDAC
diff --git a/drivers/edac/Makefile b/drivers/edac/Makefile
index 716096d08ea0..12d15cf5ff4e 100644
--- a/drivers/edac/Makefile
+++ b/drivers/edac/Makefile
@@ -78,3 +78,4 @@ obj-$(CONFIG_EDAC_SYNOPSYS) += synopsys_edac.o
obj-$(CONFIG_EDAC_XGENE) += xgene_edac.o
obj-$(CONFIG_EDAC_TI) += ti_edac.o
obj-$(CONFIG_EDAC_QCOM) += qcom_edac.o
+obj-$(CONFIG_EDAC_CORTEX_A15_L2_ASYNC) += cortex_a15_l2_async_edac.o
diff --git a/drivers/edac/cortex_a15_l2_async_edac.c b/drivers/edac/cortex_a15_l2_async_edac.c
new file mode 100644
index 000000000000..26252568e961
--- /dev/null
+++ b/drivers/edac/cortex_a15_l2_async_edac.c
@@ -0,0 +1,134 @@
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * Copyright (C) 2018 Nokia Corporation
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
+ * more details.
+ *
+ * You should have received a copy of the GNU General Public License along with
+ * this program. If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#include <linux/module.h>
+#include <linux/interrupt.h>
+#include <linux/platform_device.h>
+#include <linux/of.h>
+
+#include "edac_module.h"
+
+#define DRIVER_NAME "cortex_a15_l2_async_edac"
+
+#define L2ECTLR_L2_ASYNC_ERR BIT(30)
+
+static irqreturn_t cortex_a15_l2_async_edac_err_handler(int irq, void *dev_id)
+{
+ struct edac_device_ctl_info *dci = dev_id;
+ u32 status = 0;
+
+ /*
+ * Read and clear L2ECTLR L2 ASYNC error bit caused by INTERRIRQ.
+ * Reason could be a L2 RAM double-bit ECC error or illegal writes
+ * to the Interrupt Controller memory-map region.
+ */
+ asm("mrc p15, 1, %0, c9, c0, 3" : "=r" (status));
+ if (status & L2ECTLR_L2_ASYNC_ERR) {
+ status &= ~L2ECTLR_L2_ASYNC_ERR;
+ asm("mcr p15, 1, %0, c9, c0, 3" : : "r" (status));
+ edac_printk(KERN_EMERG, DRIVER_NAME,
+ "L2 internal asynchronous error occurred!\n");
+ edac_device_handle_ue(dci, 0, 0, dci->ctl_name);
+
+ return IRQ_HANDLED;
+ }
+
+ return IRQ_NONE;
+}
+
+static int cortex_a15_l2_async_edac_probe(struct platform_device *pdev)
+{
+ struct edac_device_ctl_info *dci;
+ struct device_node *np = pdev->dev.of_node;
+ char *ctl_name = (char *)np->name;
+ int i = 0, ret = 0, err_irq = 0, irq_count = 0;
+
+ /* We can have multiple CPU clusters with one INTERRIRQ per cluster */
+ irq_count = platform_irq_count(pdev);
+ if (irq_count < 0) {
+ edac_printk(KERN_ERR, DRIVER_NAME,
+ "No L2 ASYNC error IRQ found!\n");
+ return -EINVAL;
+ }
+
+ dci = edac_device_alloc_ctl_info(0, ctl_name, 1, ctl_name,
+ irq_count, 0, NULL, 0,
+ edac_device_alloc_index());
+ if (!dci)
+ return -ENOMEM;
+
+ dci->dev = &pdev->dev;
+ dci->mod_name = DRIVER_NAME;
+ dci->ctl_name = ctl_name;
+ dci->dev_name = dev_name(&pdev->dev);
+ platform_set_drvdata(pdev, dci);
+
+ if (edac_device_add_device(dci))
+ goto err;
+
+ for (i = 0; i < irq_count; i++) {
+ err_irq = platform_get_irq(pdev, i);
+ ret = devm_request_irq(&pdev->dev, err_irq,
+ cortex_a15_l2_async_edac_err_handler, 0,
+ dev_name(&pdev->dev), dci);
+
+ if (ret < 0) {
+ edac_printk(KERN_ERR, DRIVER_NAME,
+ "Failed to register L2 ASYNC error IRQ %d\n",
+ err_irq);
+ goto err2;
+ }
+ }
+
+ return 0;
+err2:
+ edac_device_del_device(&pdev->dev);
+err:
+ edac_device_free_ctl_info(dci);
+
+ return ret;
+}
+
+static int cortex_a15_l2_async_edac_remove(struct platform_device *pdev)
+{
+ struct edac_device_ctl_info *dci = platform_get_drvdata(pdev);
+
+ edac_device_del_device(&pdev->dev);
+ edac_device_free_ctl_info(dci);
+
+ return 0;
+}
+
+static const struct of_device_id cortex_a15_l2_async_edac_of_match[] = {
+ { .compatible = "arm,cortex-a15-l2-async-edac", },
+ {},
+};
+MODULE_DEVICE_TABLE(of, cortex_a15_l2_async_edac_of_match);
+
+static struct platform_driver cortex_a15_l2_async_edac_driver = {
+ .probe = cortex_a15_l2_async_edac_probe,
+ .remove = cortex_a15_l2_async_edac_remove,
+ .driver = {
+ .name = DRIVER_NAME,
+ .of_match_table = cortex_a15_l2_async_edac_of_match,
+ },
+};
+module_platform_driver(cortex_a15_l2_async_edac_driver);
+
+MODULE_AUTHOR("Wladislav Wiebe <wladislav.wiebe@xxxxxxxxx>");
+MODULE_DESCRIPTION("ARM Cortex A15 L2 internal asynchronous error detection");
+MODULE_LICENSE("GPL v2");
--
2.16.1