1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * Cell MIC driver for ECC counting
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * Copyright 2007 Benjamin Herrenschmidt, IBM Corp.
5*4882a593Smuzhiyun * <benh@kernel.crashing.org>
6*4882a593Smuzhiyun *
7*4882a593Smuzhiyun * This file may be distributed under the terms of the
8*4882a593Smuzhiyun * GNU General Public License.
9*4882a593Smuzhiyun */
10*4882a593Smuzhiyun #undef DEBUG
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun #include <linux/edac.h>
13*4882a593Smuzhiyun #include <linux/module.h>
14*4882a593Smuzhiyun #include <linux/init.h>
15*4882a593Smuzhiyun #include <linux/platform_device.h>
16*4882a593Smuzhiyun #include <linux/stop_machine.h>
17*4882a593Smuzhiyun #include <linux/io.h>
18*4882a593Smuzhiyun #include <linux/of_address.h>
19*4882a593Smuzhiyun #include <asm/machdep.h>
20*4882a593Smuzhiyun #include <asm/cell-regs.h>
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun #include "edac_module.h"
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun struct cell_edac_priv
25*4882a593Smuzhiyun {
26*4882a593Smuzhiyun struct cbe_mic_tm_regs __iomem *regs;
27*4882a593Smuzhiyun int node;
28*4882a593Smuzhiyun int chanmask;
29*4882a593Smuzhiyun #ifdef DEBUG
30*4882a593Smuzhiyun u64 prev_fir;
31*4882a593Smuzhiyun #endif
32*4882a593Smuzhiyun };
33*4882a593Smuzhiyun
cell_edac_count_ce(struct mem_ctl_info * mci,int chan,u64 ar)34*4882a593Smuzhiyun static void cell_edac_count_ce(struct mem_ctl_info *mci, int chan, u64 ar)
35*4882a593Smuzhiyun {
36*4882a593Smuzhiyun struct cell_edac_priv *priv = mci->pvt_info;
37*4882a593Smuzhiyun struct csrow_info *csrow = mci->csrows[0];
38*4882a593Smuzhiyun unsigned long address, pfn, offset, syndrome;
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun dev_dbg(mci->pdev, "ECC CE err on node %d, channel %d, ar = 0x%016llx\n",
41*4882a593Smuzhiyun priv->node, chan, ar);
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun /* Address decoding is likely a bit bogus, to dbl check */
44*4882a593Smuzhiyun address = (ar & 0xffffffffe0000000ul) >> 29;
45*4882a593Smuzhiyun if (priv->chanmask == 0x3)
46*4882a593Smuzhiyun address = (address << 1) | chan;
47*4882a593Smuzhiyun pfn = address >> PAGE_SHIFT;
48*4882a593Smuzhiyun offset = address & ~PAGE_MASK;
49*4882a593Smuzhiyun syndrome = (ar & 0x000000001fe00000ul) >> 21;
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun /* TODO: Decoding of the error address */
52*4882a593Smuzhiyun edac_mc_handle_error(HW_EVENT_ERR_CORRECTED, mci, 1,
53*4882a593Smuzhiyun csrow->first_page + pfn, offset, syndrome,
54*4882a593Smuzhiyun 0, chan, -1, "", "");
55*4882a593Smuzhiyun }
56*4882a593Smuzhiyun
cell_edac_count_ue(struct mem_ctl_info * mci,int chan,u64 ar)57*4882a593Smuzhiyun static void cell_edac_count_ue(struct mem_ctl_info *mci, int chan, u64 ar)
58*4882a593Smuzhiyun {
59*4882a593Smuzhiyun struct cell_edac_priv *priv = mci->pvt_info;
60*4882a593Smuzhiyun struct csrow_info *csrow = mci->csrows[0];
61*4882a593Smuzhiyun unsigned long address, pfn, offset;
62*4882a593Smuzhiyun
63*4882a593Smuzhiyun dev_dbg(mci->pdev, "ECC UE err on node %d, channel %d, ar = 0x%016llx\n",
64*4882a593Smuzhiyun priv->node, chan, ar);
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun /* Address decoding is likely a bit bogus, to dbl check */
67*4882a593Smuzhiyun address = (ar & 0xffffffffe0000000ul) >> 29;
68*4882a593Smuzhiyun if (priv->chanmask == 0x3)
69*4882a593Smuzhiyun address = (address << 1) | chan;
70*4882a593Smuzhiyun pfn = address >> PAGE_SHIFT;
71*4882a593Smuzhiyun offset = address & ~PAGE_MASK;
72*4882a593Smuzhiyun
73*4882a593Smuzhiyun /* TODO: Decoding of the error address */
74*4882a593Smuzhiyun edac_mc_handle_error(HW_EVENT_ERR_UNCORRECTED, mci, 1,
75*4882a593Smuzhiyun csrow->first_page + pfn, offset, 0,
76*4882a593Smuzhiyun 0, chan, -1, "", "");
77*4882a593Smuzhiyun }
78*4882a593Smuzhiyun
cell_edac_check(struct mem_ctl_info * mci)79*4882a593Smuzhiyun static void cell_edac_check(struct mem_ctl_info *mci)
80*4882a593Smuzhiyun {
81*4882a593Smuzhiyun struct cell_edac_priv *priv = mci->pvt_info;
82*4882a593Smuzhiyun u64 fir, addreg, clear = 0;
83*4882a593Smuzhiyun
84*4882a593Smuzhiyun fir = in_be64(&priv->regs->mic_fir);
85*4882a593Smuzhiyun #ifdef DEBUG
86*4882a593Smuzhiyun if (fir != priv->prev_fir) {
87*4882a593Smuzhiyun dev_dbg(mci->pdev, "fir change : 0x%016lx\n", fir);
88*4882a593Smuzhiyun priv->prev_fir = fir;
89*4882a593Smuzhiyun }
90*4882a593Smuzhiyun #endif
91*4882a593Smuzhiyun if ((priv->chanmask & 0x1) && (fir & CBE_MIC_FIR_ECC_SINGLE_0_ERR)) {
92*4882a593Smuzhiyun addreg = in_be64(&priv->regs->mic_df_ecc_address_0);
93*4882a593Smuzhiyun clear |= CBE_MIC_FIR_ECC_SINGLE_0_RESET;
94*4882a593Smuzhiyun cell_edac_count_ce(mci, 0, addreg);
95*4882a593Smuzhiyun }
96*4882a593Smuzhiyun if ((priv->chanmask & 0x2) && (fir & CBE_MIC_FIR_ECC_SINGLE_1_ERR)) {
97*4882a593Smuzhiyun addreg = in_be64(&priv->regs->mic_df_ecc_address_1);
98*4882a593Smuzhiyun clear |= CBE_MIC_FIR_ECC_SINGLE_1_RESET;
99*4882a593Smuzhiyun cell_edac_count_ce(mci, 1, addreg);
100*4882a593Smuzhiyun }
101*4882a593Smuzhiyun if ((priv->chanmask & 0x1) && (fir & CBE_MIC_FIR_ECC_MULTI_0_ERR)) {
102*4882a593Smuzhiyun addreg = in_be64(&priv->regs->mic_df_ecc_address_0);
103*4882a593Smuzhiyun clear |= CBE_MIC_FIR_ECC_MULTI_0_RESET;
104*4882a593Smuzhiyun cell_edac_count_ue(mci, 0, addreg);
105*4882a593Smuzhiyun }
106*4882a593Smuzhiyun if ((priv->chanmask & 0x2) && (fir & CBE_MIC_FIR_ECC_MULTI_1_ERR)) {
107*4882a593Smuzhiyun addreg = in_be64(&priv->regs->mic_df_ecc_address_1);
108*4882a593Smuzhiyun clear |= CBE_MIC_FIR_ECC_MULTI_1_RESET;
109*4882a593Smuzhiyun cell_edac_count_ue(mci, 1, addreg);
110*4882a593Smuzhiyun }
111*4882a593Smuzhiyun
112*4882a593Smuzhiyun /* The procedure for clearing FIR bits is a bit ... weird */
113*4882a593Smuzhiyun if (clear) {
114*4882a593Smuzhiyun fir &= ~(CBE_MIC_FIR_ECC_ERR_MASK | CBE_MIC_FIR_ECC_SET_MASK);
115*4882a593Smuzhiyun fir |= CBE_MIC_FIR_ECC_RESET_MASK;
116*4882a593Smuzhiyun fir &= ~clear;
117*4882a593Smuzhiyun out_be64(&priv->regs->mic_fir, fir);
118*4882a593Smuzhiyun (void)in_be64(&priv->regs->mic_fir);
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun mb(); /* sync up */
121*4882a593Smuzhiyun #ifdef DEBUG
122*4882a593Smuzhiyun fir = in_be64(&priv->regs->mic_fir);
123*4882a593Smuzhiyun dev_dbg(mci->pdev, "fir clear : 0x%016lx\n", fir);
124*4882a593Smuzhiyun #endif
125*4882a593Smuzhiyun }
126*4882a593Smuzhiyun }
127*4882a593Smuzhiyun
cell_edac_init_csrows(struct mem_ctl_info * mci)128*4882a593Smuzhiyun static void cell_edac_init_csrows(struct mem_ctl_info *mci)
129*4882a593Smuzhiyun {
130*4882a593Smuzhiyun struct csrow_info *csrow = mci->csrows[0];
131*4882a593Smuzhiyun struct dimm_info *dimm;
132*4882a593Smuzhiyun struct cell_edac_priv *priv = mci->pvt_info;
133*4882a593Smuzhiyun struct device_node *np;
134*4882a593Smuzhiyun int j;
135*4882a593Smuzhiyun u32 nr_pages;
136*4882a593Smuzhiyun
137*4882a593Smuzhiyun for_each_node_by_name(np, "memory") {
138*4882a593Smuzhiyun struct resource r;
139*4882a593Smuzhiyun
140*4882a593Smuzhiyun /* We "know" that the Cell firmware only creates one entry
141*4882a593Smuzhiyun * in the "memory" nodes. If that changes, this code will
142*4882a593Smuzhiyun * need to be adapted.
143*4882a593Smuzhiyun */
144*4882a593Smuzhiyun if (of_address_to_resource(np, 0, &r))
145*4882a593Smuzhiyun continue;
146*4882a593Smuzhiyun if (of_node_to_nid(np) != priv->node)
147*4882a593Smuzhiyun continue;
148*4882a593Smuzhiyun csrow->first_page = r.start >> PAGE_SHIFT;
149*4882a593Smuzhiyun nr_pages = resource_size(&r) >> PAGE_SHIFT;
150*4882a593Smuzhiyun csrow->last_page = csrow->first_page + nr_pages - 1;
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun for (j = 0; j < csrow->nr_channels; j++) {
153*4882a593Smuzhiyun dimm = csrow->channels[j]->dimm;
154*4882a593Smuzhiyun dimm->mtype = MEM_XDR;
155*4882a593Smuzhiyun dimm->edac_mode = EDAC_SECDED;
156*4882a593Smuzhiyun dimm->nr_pages = nr_pages / csrow->nr_channels;
157*4882a593Smuzhiyun }
158*4882a593Smuzhiyun dev_dbg(mci->pdev,
159*4882a593Smuzhiyun "Initialized on node %d, chanmask=0x%x,"
160*4882a593Smuzhiyun " first_page=0x%lx, nr_pages=0x%x\n",
161*4882a593Smuzhiyun priv->node, priv->chanmask,
162*4882a593Smuzhiyun csrow->first_page, nr_pages);
163*4882a593Smuzhiyun break;
164*4882a593Smuzhiyun }
165*4882a593Smuzhiyun of_node_put(np);
166*4882a593Smuzhiyun }
167*4882a593Smuzhiyun
cell_edac_probe(struct platform_device * pdev)168*4882a593Smuzhiyun static int cell_edac_probe(struct platform_device *pdev)
169*4882a593Smuzhiyun {
170*4882a593Smuzhiyun struct cbe_mic_tm_regs __iomem *regs;
171*4882a593Smuzhiyun struct mem_ctl_info *mci;
172*4882a593Smuzhiyun struct edac_mc_layer layers[2];
173*4882a593Smuzhiyun struct cell_edac_priv *priv;
174*4882a593Smuzhiyun u64 reg;
175*4882a593Smuzhiyun int rc, chanmask, num_chans;
176*4882a593Smuzhiyun
177*4882a593Smuzhiyun regs = cbe_get_cpu_mic_tm_regs(cbe_node_to_cpu(pdev->id));
178*4882a593Smuzhiyun if (regs == NULL)
179*4882a593Smuzhiyun return -ENODEV;
180*4882a593Smuzhiyun
181*4882a593Smuzhiyun edac_op_state = EDAC_OPSTATE_POLL;
182*4882a593Smuzhiyun
183*4882a593Smuzhiyun /* Get channel population */
184*4882a593Smuzhiyun reg = in_be64(®s->mic_mnt_cfg);
185*4882a593Smuzhiyun dev_dbg(&pdev->dev, "MIC_MNT_CFG = 0x%016llx\n", reg);
186*4882a593Smuzhiyun chanmask = 0;
187*4882a593Smuzhiyun if (reg & CBE_MIC_MNT_CFG_CHAN_0_POP)
188*4882a593Smuzhiyun chanmask |= 0x1;
189*4882a593Smuzhiyun if (reg & CBE_MIC_MNT_CFG_CHAN_1_POP)
190*4882a593Smuzhiyun chanmask |= 0x2;
191*4882a593Smuzhiyun if (chanmask == 0) {
192*4882a593Smuzhiyun dev_warn(&pdev->dev,
193*4882a593Smuzhiyun "Yuck ! No channel populated ? Aborting !\n");
194*4882a593Smuzhiyun return -ENODEV;
195*4882a593Smuzhiyun }
196*4882a593Smuzhiyun dev_dbg(&pdev->dev, "Initial FIR = 0x%016llx\n",
197*4882a593Smuzhiyun in_be64(®s->mic_fir));
198*4882a593Smuzhiyun
199*4882a593Smuzhiyun /* Allocate & init EDAC MC data structure */
200*4882a593Smuzhiyun num_chans = chanmask == 3 ? 2 : 1;
201*4882a593Smuzhiyun
202*4882a593Smuzhiyun layers[0].type = EDAC_MC_LAYER_CHIP_SELECT;
203*4882a593Smuzhiyun layers[0].size = 1;
204*4882a593Smuzhiyun layers[0].is_virt_csrow = true;
205*4882a593Smuzhiyun layers[1].type = EDAC_MC_LAYER_CHANNEL;
206*4882a593Smuzhiyun layers[1].size = num_chans;
207*4882a593Smuzhiyun layers[1].is_virt_csrow = false;
208*4882a593Smuzhiyun mci = edac_mc_alloc(pdev->id, ARRAY_SIZE(layers), layers,
209*4882a593Smuzhiyun sizeof(struct cell_edac_priv));
210*4882a593Smuzhiyun if (mci == NULL)
211*4882a593Smuzhiyun return -ENOMEM;
212*4882a593Smuzhiyun priv = mci->pvt_info;
213*4882a593Smuzhiyun priv->regs = regs;
214*4882a593Smuzhiyun priv->node = pdev->id;
215*4882a593Smuzhiyun priv->chanmask = chanmask;
216*4882a593Smuzhiyun mci->pdev = &pdev->dev;
217*4882a593Smuzhiyun mci->mtype_cap = MEM_FLAG_XDR;
218*4882a593Smuzhiyun mci->edac_ctl_cap = EDAC_FLAG_NONE | EDAC_FLAG_EC | EDAC_FLAG_SECDED;
219*4882a593Smuzhiyun mci->edac_cap = EDAC_FLAG_EC | EDAC_FLAG_SECDED;
220*4882a593Smuzhiyun mci->mod_name = "cell_edac";
221*4882a593Smuzhiyun mci->ctl_name = "MIC";
222*4882a593Smuzhiyun mci->dev_name = dev_name(&pdev->dev);
223*4882a593Smuzhiyun mci->edac_check = cell_edac_check;
224*4882a593Smuzhiyun cell_edac_init_csrows(mci);
225*4882a593Smuzhiyun
226*4882a593Smuzhiyun /* Register with EDAC core */
227*4882a593Smuzhiyun rc = edac_mc_add_mc(mci);
228*4882a593Smuzhiyun if (rc) {
229*4882a593Smuzhiyun dev_err(&pdev->dev, "failed to register with EDAC core\n");
230*4882a593Smuzhiyun edac_mc_free(mci);
231*4882a593Smuzhiyun return rc;
232*4882a593Smuzhiyun }
233*4882a593Smuzhiyun
234*4882a593Smuzhiyun return 0;
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun
cell_edac_remove(struct platform_device * pdev)237*4882a593Smuzhiyun static int cell_edac_remove(struct platform_device *pdev)
238*4882a593Smuzhiyun {
239*4882a593Smuzhiyun struct mem_ctl_info *mci = edac_mc_del_mc(&pdev->dev);
240*4882a593Smuzhiyun if (mci)
241*4882a593Smuzhiyun edac_mc_free(mci);
242*4882a593Smuzhiyun return 0;
243*4882a593Smuzhiyun }
244*4882a593Smuzhiyun
245*4882a593Smuzhiyun static struct platform_driver cell_edac_driver = {
246*4882a593Smuzhiyun .driver = {
247*4882a593Smuzhiyun .name = "cbe-mic",
248*4882a593Smuzhiyun },
249*4882a593Smuzhiyun .probe = cell_edac_probe,
250*4882a593Smuzhiyun .remove = cell_edac_remove,
251*4882a593Smuzhiyun };
252*4882a593Smuzhiyun
cell_edac_init(void)253*4882a593Smuzhiyun static int __init cell_edac_init(void)
254*4882a593Smuzhiyun {
255*4882a593Smuzhiyun /* Sanity check registers data structure */
256*4882a593Smuzhiyun BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
257*4882a593Smuzhiyun mic_df_ecc_address_0) != 0xf8);
258*4882a593Smuzhiyun BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
259*4882a593Smuzhiyun mic_df_ecc_address_1) != 0x1b8);
260*4882a593Smuzhiyun BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
261*4882a593Smuzhiyun mic_df_config) != 0x218);
262*4882a593Smuzhiyun BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
263*4882a593Smuzhiyun mic_fir) != 0x230);
264*4882a593Smuzhiyun BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
265*4882a593Smuzhiyun mic_mnt_cfg) != 0x210);
266*4882a593Smuzhiyun BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
267*4882a593Smuzhiyun mic_exc) != 0x208);
268*4882a593Smuzhiyun
269*4882a593Smuzhiyun return platform_driver_register(&cell_edac_driver);
270*4882a593Smuzhiyun }
271*4882a593Smuzhiyun
cell_edac_exit(void)272*4882a593Smuzhiyun static void __exit cell_edac_exit(void)
273*4882a593Smuzhiyun {
274*4882a593Smuzhiyun platform_driver_unregister(&cell_edac_driver);
275*4882a593Smuzhiyun }
276*4882a593Smuzhiyun
277*4882a593Smuzhiyun module_init(cell_edac_init);
278*4882a593Smuzhiyun module_exit(cell_edac_exit);
279*4882a593Smuzhiyun
280*4882a593Smuzhiyun MODULE_LICENSE("GPL");
281*4882a593Smuzhiyun MODULE_AUTHOR("Benjamin Herrenschmidt <benh@kernel.crashing.org>");
282*4882a593Smuzhiyun MODULE_DESCRIPTION("ECC counting for Cell MIC");
283