On Mon, Aug 07, 2017 at 09:39:25AM +0200, Michal Simek wrote:
> From: Naga Sureshkumar Relli <naga.sureshkumar.re...@xilinx.com>
> 
> This patch adds EDAC ECC support for ZynqMP DDRC IP

It does much more and the commit message could talk about it.

> Signed-off-by: Naga Sureshkumar Relli <nagas...@xilinx.com>
> Signed-off-by: Michal Simek <michal.si...@xilinx.com>
> ---
> 
> Changes in v2:
> - Add binding doc to this series to resolve checkpatch warning
> - Rebased on the top of
>   https://git.kernel.org/pub/scm/linux/kernel/git/bp/bp.git/log/?h=for-next
>   and resolve conflict caused by "EDAC: Get rid of mci->mod_ver" patch
> - Add changes done in previous patch
> 
>  drivers/edac/Kconfig         |   2 +-
>  drivers/edac/synopsys_edac.c | 305 
> ++++++++++++++++++++++++++++++++++++++++++-
>  2 files changed, 302 insertions(+), 5 deletions(-)
> 
> diff --git a/drivers/edac/Kconfig b/drivers/edac/Kconfig
> index 96afb2aeed18..e2f62dda8944 100644
> --- a/drivers/edac/Kconfig
> +++ b/drivers/edac/Kconfig
> @@ -445,7 +445,7 @@ config EDAC_ALTERA_SDMMC
>  
>  config EDAC_SYNOPSYS
>       tristate "Synopsys DDR Memory Controller"
> -     depends on ARCH_ZYNQ
> +     depends on ARCH_ZYNQ || ARM64

This is an unrelated change and it needs a separate patch and a commit
message explaining that you're enabling the driver on arm64 now too.

>       help
>         Support for error detection and correction on the Synopsys DDR
>         memory controller.
> diff --git a/drivers/edac/synopsys_edac.c b/drivers/edac/synopsys_edac.c
> index 293380f884fe..11016cd13a08 100644
> --- a/drivers/edac/synopsys_edac.c
> +++ b/drivers/edac/synopsys_edac.c
> @@ -22,6 +22,7 @@
>  #include <linux/edac.h>
>  #include <linux/module.h>
>  #include <linux/platform_device.h>
> +#include <linux/interrupt.h>
>  #include <linux/of.h>
>  
>  #include "edac_module.h"
> @@ -99,6 +100,87 @@
>  /* DDR ECC Quirks */
>  #define DDR_ECC_INTR_SUPPORT         BIT(0)
>  
> +/* ZynqMP Enhanced DDR memory controller registers that are relevant to ECC 
> */
> +/* ECC Configuration Registers */
> +#define ECC_CFG0_OFST        0x70
> +#define ECC_CFG1_OFST        0x74
> +
> +/* ECC Status Register */
> +#define ECC_STAT_OFST        0x78
> +
> +/* ECC Clear Register */
> +#define ECC_CLR_OFST 0x7C
> +
> +/* ECC Error count Register */
> +#define ECC_ERRCNT_OFST      0x80

Some of those are unused. Kill them if they remain unused.

> +
> +/* ECC Corrected Error Address Register */
> +#define ECC_CEADDR0_OFST     0x84
> +#define ECC_CEADDR1_OFST     0x88
> +
> +/* ECC Syndrome Registers */
> +#define ECC_CSYND0_OFST      0x8C
> +#define ECC_CSYND1_OFST      0x90
> +#define ECC_CSYND2_OFST      0x94
> +
> +/* ECC Bit Mask0 Address Register */
> +#define ECC_BITMASK0_OFST    0x98
> +#define ECC_BITMASK1_OFST    0x9C
> +#define ECC_BITMASK2_OFST    0xA0
> +
> +/* ECC UnCorrected Error Address Register */
> +#define ECC_UEADDR0_OFST     0xA4
> +#define ECC_UEADDR1_OFST     0xA8
> +
> +/* ECC Syndrome Registers */
> +#define ECC_UESYND0_OFST     0xAC
> +#define ECC_UESYND1_OFST     0xB0
> +#define ECC_UESYND2_OFST     0xB4
> +
> +/* ECC Poison Address Reg */
> +#define ECC_POISON0_OFST     0xB8
> +#define ECC_POISON1_OFST     0xBC
> +
> +/* Control register bitfield definitions */
> +#define ECC_CTRL_BUSWIDTH_MASK       0x3000
> +#define ECC_CTRL_BUSWIDTH_SHIFT      12
> +#define ECC_CTRL_CLR_CE_ERRCNT       BIT(2)
> +#define ECC_CTRL_CLR_UE_ERRCNT       BIT(3)
> +
> +/* DDR Control Register width definitions  */
> +#define DDRCTL_EWDTH_16              2
> +#define DDRCTL_EWDTH_32              1
> +#define DDRCTL_EWDTH_64              0
> +
> +/* ECC status register definitions */
> +#define ECC_STAT_UECNT_MASK  0xF0000
> +#define ECC_STAT_UECNT_SHIFT 16
> +#define ECC_STAT_CECNT_MASK  0xF00
> +#define ECC_STAT_CECNT_SHIFT 8
> +#define ECC_STAT_BITNUM_MASK 0x7F
> +
> +/* DDR QOS Interrupt register definitions */
> +#define DDR_QOS_IRQ_STAT_OFST        0x20200
> +#define DDR_QOSUE_MASK               0x4
> +#define DDR_QOSCE_MASK               0x2
> +#define ECC_CE_UE_INTR_MASK  0x6
> +
> +/* ECC Corrected Error Register Mask and Shifts*/
> +#define ECC_CEADDR0_RW_MASK  0x3FFFF
> +#define ECC_CEADDR0_RNK_MASK BIT(24)
> +#define ECC_CEADDR1_BNKGRP_MASK      0x3000000
> +#define ECC_CEADDR1_BNKNR_MASK       0x70000
> +#define ECC_CEADDR1_BLKNR_MASK       0xFFF
> +#define ECC_CEADDR1_BNKGRP_SHIFT     24
> +#define ECC_CEADDR1_BNKNR_SHIFT      16
> +
> +/* DDR Memory type defines */
> +#define MEM_TYPE_DDR3        0x1
> +#define MEM_TYPE_LPDDR3      0x1
> +#define MEM_TYPE_DDR2        0x4
> +#define MEM_TYPE_DDR4        0x10
> +#define MEM_TYPE_LPDDR4      0x10
> +
>  /**
>   * struct ecc_error_info - ECC error log information
>   * @row:     Row number
> @@ -106,6 +188,8 @@
>   * @bank:    Bank number
>   * @bitpos:  Bit position
>   * @data:    Data causing the error
> + * @bankgrpnr:       Bank group number
> + * @blknr:   Block number
>   */
>  struct ecc_error_info {
>       u32 row;
> @@ -113,6 +197,8 @@ struct ecc_error_info {
>       u32 bank;
>       u32 bitpos;
>       u32 data;
> +     u32 bankgrpnr;
> +     u32 blknr;

u32? Can those fit in a smaller integer?

>  };
>  
>  /**
> @@ -171,7 +257,7 @@ struct synps_platform_data {
>   *
>   * Determines there is any ecc error or not
>   *
> - * Return: one if there is no error otherwise returns zero
> + * Return: 1 if there is no error otherwise returns 0

So you corrected this to use numbers (1 and 0) which is as arbitrary
change as any...

>   */
>  static int synps_edac_geterror_info(void __iomem *base,
>                                   struct synps_ecc_status *p)
> @@ -219,6 +305,65 @@ static int synps_edac_geterror_info(void __iomem *base,
>  }
>  
>  /**
> + * synps_enh_edac_geterror_info - Get the current ecc error info
> + * @base:    Pointer to the base address of the ddr memory controller
> + * @p:               Pointer to the synopsys ecc status structure
> + *
> + * Determines there is any ecc error or not
> + *
> + * Return: one if there is no error otherwise returns zero

... and yet copied the old text and didn't change it here. Looks like
this needs making up mind.

> + */
> +static int synps_enh_edac_geterror_info(void __iomem *base,
> +                                     struct synps_ecc_status *p)

And you have "_edac_" in all those functions which are static and which
only encumbers readability. I think naming scheme like

        get_error_info
        zynq_mp_get_error_info
        ...

should be much easier on the eyes.

> +{
> +     u32 regval, clearval = 0;
> +
> +     regval = readl(base + ECC_STAT_OFST);
> +     if (!regval)
> +             return 1;
> +
> +     p->ce_cnt = (regval & ECC_STAT_CECNT_MASK) >> ECC_STAT_CECNT_SHIFT;
> +     p->ue_cnt = (regval & ECC_STAT_UECNT_MASK) >> ECC_STAT_UECNT_SHIFT;
> +     p->ceinfo.bitpos = (regval & ECC_STAT_BITNUM_MASK);
> +
> +     regval = readl(base + ECC_CEADDR0_OFST);
> +     if (!(p->ce_cnt))
> +             goto ue_err;
> +
> +     p->ceinfo.row = (regval & ECC_CEADDR0_RW_MASK);
> +     regval = readl(base + ECC_CEADDR1_OFST);
> +     p->ceinfo.bank = (regval & ECC_CEADDR1_BNKNR_MASK) >>
> +                                     ECC_CEADDR1_BNKNR_SHIFT;
> +     p->ceinfo.bankgrpnr = (regval & ECC_CEADDR1_BNKGRP_MASK) >>
> +                                     ECC_CEADDR1_BNKGRP_SHIFT;
> +     p->ceinfo.blknr = (regval & ECC_CEADDR1_BLKNR_MASK);
> +     p->ceinfo.data = readl(base + ECC_CSYND0_OFST);

Align vertically and let it stick out for better readability, like this:

        p->ceinfo.bank      = (regval & ECC_CEADDR1_BNKNR_MASK) >> 
ECC_CEADDR1_BNKNR_SHIFT;
        p->ceinfo.bankgrpnr = (regval & ECC_CEADDR1_BNKGRP_MASK) >> 
ECC_CEADDR1_BNKGRP_SHIFT;
        p->ceinfo.blknr     = (regval & ECC_CEADDR1_BLKNR_MASK);
        p->ceinfo.data      = readl(base + ECC_CSYND0_OFST);

> +     edac_dbg(3, "ce bit position: %d data: %d\n", p->ceinfo.bitpos,
> +              p->ceinfo.data);
> +
> +ue_err:
> +     regval = readl(base + ECC_UEADDR0_OFST);
> +     if (!(p->ue_cnt))
> +             goto out;
> +
> +     p->ueinfo.row = (regval & ECC_CEADDR0_RW_MASK);
> +     regval = readl(base + ECC_UEADDR1_OFST);
> +     p->ueinfo.bankgrpnr = (regval & ECC_CEADDR1_BNKGRP_MASK) >>
> +                                     ECC_CEADDR1_BNKGRP_SHIFT;
> +     p->ueinfo.bank = (regval & ECC_CEADDR1_BNKNR_MASK) >>
> +                                     ECC_CEADDR1_BNKNR_SHIFT;
> +     p->ueinfo.blknr = (regval & ECC_CEADDR1_BLKNR_MASK);
> +     p->ueinfo.data = readl(base + ECC_UESYND0_OFST);

Ditto.

> +out:
> +     clearval = ECC_CTRL_CLR_CE_ERR | ECC_CTRL_CLR_CE_ERRCNT;
> +     clearval |= ECC_CTRL_CLR_UE_ERR | ECC_CTRL_CLR_UE_ERRCNT;
> +     writel(clearval, base + ECC_CLR_OFST);
> +     writel(0x0, base + ECC_CLR_OFST);
> +
> +     return 0;
> +}
> +
> +/**
>   * synps_edac_handle_error - Handle controller error types CE and UE
>   * @mci:     Pointer to the edac memory controller instance
>   * @p:               Pointer to the synopsys ecc status structure
> @@ -255,6 +400,41 @@ static void synps_edac_handle_error(struct mem_ctl_info 
> *mci,
>  }
>  
>  /**
> + * synps_edac_intr_handler - synps edac isr
> + * @irq:     irq number
> + * @dev_id:  device id poniter
> + *
> + * This is the Isr routine called by edac core interrupt thread.

s/[iI]sr/ISR/g

> + * Used to check and post ECC errors.
> + *
> + * Return: IRQ_NONE, if interrupt not set or IRQ_HANDLED otherwise
> + */
> +static irqreturn_t synps_edac_intr_handler(int irq, void *dev_id)
> +{
> +     struct mem_ctl_info *mci = dev_id;
> +     struct synps_edac_priv *priv = mci->pvt_info;
> +     int status, regval;
> +
> +     regval = readl(priv->baseaddr + DDR_QOS_IRQ_STAT_OFST) &
> +                     (DDR_QOSCE_MASK | DDR_QOSUE_MASK);
> +     if (!(regval & ECC_CE_UE_INTR_MASK))
> +             return IRQ_NONE;

newline.

> +     status = priv->p_data->edac_geterror_info(priv->baseaddr,
> +                                               &priv->stat);

Let it stick out.

> +     if (status)
> +             return IRQ_NONE;
> +
> +     priv->ce_cnt += priv->stat.ce_cnt;
> +     priv->ue_cnt += priv->stat.ue_cnt;
> +     synps_edac_handle_error(mci, &priv->stat);
> +
> +     edac_dbg(3, "Total error count ce %d ue %d\n",
> +              priv->ce_cnt, priv->ue_cnt);
> +     writel(regval, priv->baseaddr + DDR_QOS_IRQ_STAT_OFST);
> +     return IRQ_HANDLED;
> +}
> +
> +/**
>   * synps_edac_check - Check controller for ECC errors
>   * @mci:     Pointer to the edac memory controller instance
>   *
> @@ -310,6 +490,40 @@ static enum dev_type synps_edac_get_dtype(const void 
> __iomem *base)
>  }
>  
>  /**
> + * synps_enh_edac_get_dtype - Return the controller memory width
> + * @base:    Pointer to the ddr memory controller base address
> + *
> + * Get the EDAC device type width appropriate for the current controller
> + * configuration.
> + *
> + * Return: a device type width enumeration.

"... or unknown."

> + */
> +static enum dev_type synps_enh_edac_get_dtype(const void __iomem *base)
> +{
> +     enum dev_type dt;
> +     u32 width;
> +
> +     width = readl(base + CTRL_OFST);
> +     width = (width & ECC_CTRL_BUSWIDTH_MASK) >>
> +             ECC_CTRL_BUSWIDTH_SHIFT;

Let it stick out - the 80 cols rule is not a hard one.

> +     switch (width) {
> +     case DDRCTL_EWDTH_16:
> +             dt = DEV_X2;

You can save yourself the assignment if you do

                return DEV_X2;

here and below, respectively.

> +             break;
> +     case DDRCTL_EWDTH_32:
> +             dt = DEV_X4;
> +             break;
> +     case DDRCTL_EWDTH_64:
> +             dt = DEV_X8;
> +             break;
> +     default:
> +             dt = DEV_UNKNOWN;
> +     }
> +
> +     return dt;
> +}
> +
> +/**
>   * synps_edac_get_eccstate - Return the controller ecc enable/disable status
>   * @base:    Pointer to the ddr memory controller base address
>   *
> @@ -335,6 +549,32 @@ static bool synps_edac_get_eccstate(void __iomem *base)
>  }
>  
>  /**
> + * synps_enh_edac_get_eccstate - Return the controller ecc enable/disable 
> status

s/ecc/ECC/g

> + * @base:    Pointer to the ddr memory controller base address
> + *
> + * Get the ECC enable/disable status for the controller
> + *
> + * Return: a ecc status boolean i.e true/false - enabled/disabled.
> + */
> +static bool synps_enh_edac_get_eccstate(void __iomem *base)
> +{
> +     enum dev_type dt;
> +     u32 ecctype;
> +     bool state = false;
> +
> +     dt = synps_enh_edac_get_dtype(base);
> +     if (dt == DEV_UNKNOWN)
> +             return state;
> +
> +     ecctype = readl(base + ECC_CFG0_OFST) & SCRUB_MODE_MASK;
> +     if ((ecctype == SCRUB_MODE_SECDED) &&
> +         ((dt == DEV_X2) || (dt == DEV_X4) || (dt == DEV_X8)))
> +             state = true;
> +
> +     return state;

Ditto: you don't need the assignment here - just return the boolean value.

> +}
> +
> +/**
>   * synps_edac_get_memsize - reads the size of the attached memory device
>   *
>   * Return: the memory size in bytes
> @@ -373,6 +613,32 @@ static enum mem_type synps_edac_get_mtype(const void 
> __iomem *base)
>  }
>  
>  /**
> + * synps_enh_edac_get_mtype - Returns controller memory type
> + * @base:    pointer to the synopsys ecc status structure
> + *
> + * Get the EDAC memory type appropriate for the current controller
> + * configuration.
> + *
> + * Return: a memory type enumeration.
> + */
> +static enum mem_type synps_enh_edac_get_mtype(const void __iomem *base)
> +{
> +     enum mem_type mt = MEM_UNKNOWN;
> +     u32 memtype;
> +
> +     memtype = readl(base + CTRL_OFST);
> +
> +     if ((memtype & MEM_TYPE_DDR3) || (memtype & MEM_TYPE_LPDDR3))
> +             mt = MEM_DDR3;
> +     else if (memtype & MEM_TYPE_DDR2)
> +             mt = MEM_RDDR2;
> +     else if ((memtype & MEM_TYPE_LPDDR4) || (memtype & MEM_TYPE_DDR4))
> +             mt = MEM_DDR4;
> +
> +     return mt;

Ditto.

> +}
> +
> +/**
>   * synps_edac_init_csrows - Initialize the cs row data
>   * @mci:     Pointer to the edac memory controller instance
>   *
> @@ -440,8 +706,12 @@ static int synps_edac_mc_init(struct mem_ctl_info *mci,
>       mci->dev_name = SYNPS_EDAC_MOD_STRING;
>       mci->mod_name = SYNPS_EDAC_MOD_VER;
>  
> -     edac_op_state = EDAC_OPSTATE_POLL;
> -     mci->edac_check = synps_edac_check;
> +     if (priv->p_data->quirks & DDR_ECC_INTR_SUPPORT) {
> +             edac_op_state = EDAC_OPSTATE_INT;
> +     } else {
> +             edac_op_state = EDAC_OPSTATE_POLL;
> +             mci->edac_check = synps_edac_check;
> +     }
>       mci->ctl_page_to_phys = NULL;
>  
>       status = synps_edac_init_csrows(mci);
> @@ -457,8 +727,18 @@ static int synps_edac_mc_init(struct mem_ctl_info *mci,
>       .quirks                 = 0,
>  };
>  
> +static const struct synps_platform_data zynqmp_enh_edac_def = {
> +     .edac_geterror_info     = synps_enh_edac_geterror_info,
> +     .edac_get_mtype         = synps_enh_edac_get_mtype,
> +     .edac_get_dtype         = synps_enh_edac_get_dtype,
> +     .edac_get_eccstate      = synps_enh_edac_get_eccstate,
> +     .quirks                 = DDR_ECC_INTR_SUPPORT,
> +};
> +
>  static const struct of_device_id synps_edac_match[] = {
>       { .compatible = "xlnx,zynq-ddrc-a05", .data = (void *)&zynq_edac_def },
> +     { .compatible = "xlnx,zynqmp-ddrc-2.40a",
> +                             .data = (void *)&zynqmp_enh_edac_def},
>       { /* end of table */ }
>  };
>  
> @@ -478,7 +758,7 @@ static int synps_edac_mc_probe(struct platform_device 
> *pdev)
>       struct mem_ctl_info *mci;
>       struct edac_mc_layer layers[2];
>       struct synps_edac_priv *priv;
> -     int rc;
> +     int rc, irq, status;
>       struct resource *res;
>       void __iomem *baseaddr;
>       const struct of_device_id *match;
> @@ -527,6 +807,23 @@ static int synps_edac_mc_probe(struct platform_device 
> *pdev)
>               goto free_edac_mc;
>       }
>  
> +     if (priv->p_data->quirks & DDR_ECC_INTR_SUPPORT) {
> +             irq = platform_get_irq(pdev, 0);
> +             if (irq < 0) {
> +                     edac_printk(KERN_ERR, EDAC_MC,
> +                                 "No irq %d in DT\n", irq);
> +                     return -ENODEV;

If you return here, you're leaking memory.

> +             }
> +
> +             status = devm_request_irq(&pdev->dev, irq,
> +                                       synps_edac_intr_handler,
> +                                       0, dev_name(&pdev->dev), mci);
> +             if (status < 0) {
> +                     edac_printk(KERN_ERR, EDAC_MC, "Failed to request 
> Irq\n");
> +                     goto free_edac_mc;
> +             }
> +     }
> +
>       rc = edac_mc_add_mc(mci);
>       if (rc) {
>               edac_printk(KERN_ERR, EDAC_MC,
> -- 
> 1.9.1
> 

-- 
Regards/Gruss,
    Boris.

ECO tip #101: Trim your mails when you reply.
--

Reply via email to