xref: /OK3568_Linux_fs/kernel/drivers/edac/cell_edac.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * Cell MIC driver for ECC counting
3*4882a593Smuzhiyun  *
4*4882a593Smuzhiyun  * Copyright 2007 Benjamin Herrenschmidt, IBM Corp.
5*4882a593Smuzhiyun  *                <benh@kernel.crashing.org>
6*4882a593Smuzhiyun  *
7*4882a593Smuzhiyun  * This file may be distributed under the terms of the
8*4882a593Smuzhiyun  * GNU General Public License.
9*4882a593Smuzhiyun  */
10*4882a593Smuzhiyun #undef DEBUG
11*4882a593Smuzhiyun 
12*4882a593Smuzhiyun #include <linux/edac.h>
13*4882a593Smuzhiyun #include <linux/module.h>
14*4882a593Smuzhiyun #include <linux/init.h>
15*4882a593Smuzhiyun #include <linux/platform_device.h>
16*4882a593Smuzhiyun #include <linux/stop_machine.h>
17*4882a593Smuzhiyun #include <linux/io.h>
18*4882a593Smuzhiyun #include <linux/of_address.h>
19*4882a593Smuzhiyun #include <asm/machdep.h>
20*4882a593Smuzhiyun #include <asm/cell-regs.h>
21*4882a593Smuzhiyun 
22*4882a593Smuzhiyun #include "edac_module.h"
23*4882a593Smuzhiyun 
24*4882a593Smuzhiyun struct cell_edac_priv
25*4882a593Smuzhiyun {
26*4882a593Smuzhiyun 	struct cbe_mic_tm_regs __iomem	*regs;
27*4882a593Smuzhiyun 	int				node;
28*4882a593Smuzhiyun 	int				chanmask;
29*4882a593Smuzhiyun #ifdef DEBUG
30*4882a593Smuzhiyun 	u64				prev_fir;
31*4882a593Smuzhiyun #endif
32*4882a593Smuzhiyun };
33*4882a593Smuzhiyun 
cell_edac_count_ce(struct mem_ctl_info * mci,int chan,u64 ar)34*4882a593Smuzhiyun static void cell_edac_count_ce(struct mem_ctl_info *mci, int chan, u64 ar)
35*4882a593Smuzhiyun {
36*4882a593Smuzhiyun 	struct cell_edac_priv		*priv = mci->pvt_info;
37*4882a593Smuzhiyun 	struct csrow_info		*csrow = mci->csrows[0];
38*4882a593Smuzhiyun 	unsigned long			address, pfn, offset, syndrome;
39*4882a593Smuzhiyun 
40*4882a593Smuzhiyun 	dev_dbg(mci->pdev, "ECC CE err on node %d, channel %d, ar = 0x%016llx\n",
41*4882a593Smuzhiyun 		priv->node, chan, ar);
42*4882a593Smuzhiyun 
43*4882a593Smuzhiyun 	/* Address decoding is likely a bit bogus, to dbl check */
44*4882a593Smuzhiyun 	address = (ar & 0xffffffffe0000000ul) >> 29;
45*4882a593Smuzhiyun 	if (priv->chanmask == 0x3)
46*4882a593Smuzhiyun 		address = (address << 1) | chan;
47*4882a593Smuzhiyun 	pfn = address >> PAGE_SHIFT;
48*4882a593Smuzhiyun 	offset = address & ~PAGE_MASK;
49*4882a593Smuzhiyun 	syndrome = (ar & 0x000000001fe00000ul) >> 21;
50*4882a593Smuzhiyun 
51*4882a593Smuzhiyun 	/* TODO: Decoding of the error address */
52*4882a593Smuzhiyun 	edac_mc_handle_error(HW_EVENT_ERR_CORRECTED, mci, 1,
53*4882a593Smuzhiyun 			     csrow->first_page + pfn, offset, syndrome,
54*4882a593Smuzhiyun 			     0, chan, -1, "", "");
55*4882a593Smuzhiyun }
56*4882a593Smuzhiyun 
cell_edac_count_ue(struct mem_ctl_info * mci,int chan,u64 ar)57*4882a593Smuzhiyun static void cell_edac_count_ue(struct mem_ctl_info *mci, int chan, u64 ar)
58*4882a593Smuzhiyun {
59*4882a593Smuzhiyun 	struct cell_edac_priv		*priv = mci->pvt_info;
60*4882a593Smuzhiyun 	struct csrow_info		*csrow = mci->csrows[0];
61*4882a593Smuzhiyun 	unsigned long			address, pfn, offset;
62*4882a593Smuzhiyun 
63*4882a593Smuzhiyun 	dev_dbg(mci->pdev, "ECC UE err on node %d, channel %d, ar = 0x%016llx\n",
64*4882a593Smuzhiyun 		priv->node, chan, ar);
65*4882a593Smuzhiyun 
66*4882a593Smuzhiyun 	/* Address decoding is likely a bit bogus, to dbl check */
67*4882a593Smuzhiyun 	address = (ar & 0xffffffffe0000000ul) >> 29;
68*4882a593Smuzhiyun 	if (priv->chanmask == 0x3)
69*4882a593Smuzhiyun 		address = (address << 1) | chan;
70*4882a593Smuzhiyun 	pfn = address >> PAGE_SHIFT;
71*4882a593Smuzhiyun 	offset = address & ~PAGE_MASK;
72*4882a593Smuzhiyun 
73*4882a593Smuzhiyun 	/* TODO: Decoding of the error address */
74*4882a593Smuzhiyun 	edac_mc_handle_error(HW_EVENT_ERR_UNCORRECTED, mci, 1,
75*4882a593Smuzhiyun 			     csrow->first_page + pfn, offset, 0,
76*4882a593Smuzhiyun 			     0, chan, -1, "", "");
77*4882a593Smuzhiyun }
78*4882a593Smuzhiyun 
cell_edac_check(struct mem_ctl_info * mci)79*4882a593Smuzhiyun static void cell_edac_check(struct mem_ctl_info *mci)
80*4882a593Smuzhiyun {
81*4882a593Smuzhiyun 	struct cell_edac_priv		*priv = mci->pvt_info;
82*4882a593Smuzhiyun 	u64				fir, addreg, clear = 0;
83*4882a593Smuzhiyun 
84*4882a593Smuzhiyun 	fir = in_be64(&priv->regs->mic_fir);
85*4882a593Smuzhiyun #ifdef DEBUG
86*4882a593Smuzhiyun 	if (fir != priv->prev_fir) {
87*4882a593Smuzhiyun 		dev_dbg(mci->pdev, "fir change : 0x%016lx\n", fir);
88*4882a593Smuzhiyun 		priv->prev_fir = fir;
89*4882a593Smuzhiyun 	}
90*4882a593Smuzhiyun #endif
91*4882a593Smuzhiyun 	if ((priv->chanmask & 0x1) && (fir & CBE_MIC_FIR_ECC_SINGLE_0_ERR)) {
92*4882a593Smuzhiyun 		addreg = in_be64(&priv->regs->mic_df_ecc_address_0);
93*4882a593Smuzhiyun 		clear |= CBE_MIC_FIR_ECC_SINGLE_0_RESET;
94*4882a593Smuzhiyun 		cell_edac_count_ce(mci, 0, addreg);
95*4882a593Smuzhiyun 	}
96*4882a593Smuzhiyun 	if ((priv->chanmask & 0x2) && (fir & CBE_MIC_FIR_ECC_SINGLE_1_ERR)) {
97*4882a593Smuzhiyun 		addreg = in_be64(&priv->regs->mic_df_ecc_address_1);
98*4882a593Smuzhiyun 		clear |= CBE_MIC_FIR_ECC_SINGLE_1_RESET;
99*4882a593Smuzhiyun 		cell_edac_count_ce(mci, 1, addreg);
100*4882a593Smuzhiyun 	}
101*4882a593Smuzhiyun 	if ((priv->chanmask & 0x1) && (fir & CBE_MIC_FIR_ECC_MULTI_0_ERR)) {
102*4882a593Smuzhiyun 		addreg = in_be64(&priv->regs->mic_df_ecc_address_0);
103*4882a593Smuzhiyun 		clear |= CBE_MIC_FIR_ECC_MULTI_0_RESET;
104*4882a593Smuzhiyun 		cell_edac_count_ue(mci, 0, addreg);
105*4882a593Smuzhiyun 	}
106*4882a593Smuzhiyun 	if ((priv->chanmask & 0x2) && (fir & CBE_MIC_FIR_ECC_MULTI_1_ERR)) {
107*4882a593Smuzhiyun 		addreg = in_be64(&priv->regs->mic_df_ecc_address_1);
108*4882a593Smuzhiyun 		clear |= CBE_MIC_FIR_ECC_MULTI_1_RESET;
109*4882a593Smuzhiyun 		cell_edac_count_ue(mci, 1, addreg);
110*4882a593Smuzhiyun 	}
111*4882a593Smuzhiyun 
112*4882a593Smuzhiyun 	/* The procedure for clearing FIR bits is a bit ... weird */
113*4882a593Smuzhiyun 	if (clear) {
114*4882a593Smuzhiyun 		fir &= ~(CBE_MIC_FIR_ECC_ERR_MASK | CBE_MIC_FIR_ECC_SET_MASK);
115*4882a593Smuzhiyun 		fir |= CBE_MIC_FIR_ECC_RESET_MASK;
116*4882a593Smuzhiyun 		fir &= ~clear;
117*4882a593Smuzhiyun 		out_be64(&priv->regs->mic_fir, fir);
118*4882a593Smuzhiyun 		(void)in_be64(&priv->regs->mic_fir);
119*4882a593Smuzhiyun 
120*4882a593Smuzhiyun 		mb();	/* sync up */
121*4882a593Smuzhiyun #ifdef DEBUG
122*4882a593Smuzhiyun 		fir = in_be64(&priv->regs->mic_fir);
123*4882a593Smuzhiyun 		dev_dbg(mci->pdev, "fir clear  : 0x%016lx\n", fir);
124*4882a593Smuzhiyun #endif
125*4882a593Smuzhiyun 	}
126*4882a593Smuzhiyun }
127*4882a593Smuzhiyun 
cell_edac_init_csrows(struct mem_ctl_info * mci)128*4882a593Smuzhiyun static void cell_edac_init_csrows(struct mem_ctl_info *mci)
129*4882a593Smuzhiyun {
130*4882a593Smuzhiyun 	struct csrow_info		*csrow = mci->csrows[0];
131*4882a593Smuzhiyun 	struct dimm_info		*dimm;
132*4882a593Smuzhiyun 	struct cell_edac_priv		*priv = mci->pvt_info;
133*4882a593Smuzhiyun 	struct device_node		*np;
134*4882a593Smuzhiyun 	int				j;
135*4882a593Smuzhiyun 	u32				nr_pages;
136*4882a593Smuzhiyun 
137*4882a593Smuzhiyun 	for_each_node_by_name(np, "memory") {
138*4882a593Smuzhiyun 		struct resource r;
139*4882a593Smuzhiyun 
140*4882a593Smuzhiyun 		/* We "know" that the Cell firmware only creates one entry
141*4882a593Smuzhiyun 		 * in the "memory" nodes. If that changes, this code will
142*4882a593Smuzhiyun 		 * need to be adapted.
143*4882a593Smuzhiyun 		 */
144*4882a593Smuzhiyun 		if (of_address_to_resource(np, 0, &r))
145*4882a593Smuzhiyun 			continue;
146*4882a593Smuzhiyun 		if (of_node_to_nid(np) != priv->node)
147*4882a593Smuzhiyun 			continue;
148*4882a593Smuzhiyun 		csrow->first_page = r.start >> PAGE_SHIFT;
149*4882a593Smuzhiyun 		nr_pages = resource_size(&r) >> PAGE_SHIFT;
150*4882a593Smuzhiyun 		csrow->last_page = csrow->first_page + nr_pages - 1;
151*4882a593Smuzhiyun 
152*4882a593Smuzhiyun 		for (j = 0; j < csrow->nr_channels; j++) {
153*4882a593Smuzhiyun 			dimm = csrow->channels[j]->dimm;
154*4882a593Smuzhiyun 			dimm->mtype = MEM_XDR;
155*4882a593Smuzhiyun 			dimm->edac_mode = EDAC_SECDED;
156*4882a593Smuzhiyun 			dimm->nr_pages = nr_pages / csrow->nr_channels;
157*4882a593Smuzhiyun 		}
158*4882a593Smuzhiyun 		dev_dbg(mci->pdev,
159*4882a593Smuzhiyun 			"Initialized on node %d, chanmask=0x%x,"
160*4882a593Smuzhiyun 			" first_page=0x%lx, nr_pages=0x%x\n",
161*4882a593Smuzhiyun 			priv->node, priv->chanmask,
162*4882a593Smuzhiyun 			csrow->first_page, nr_pages);
163*4882a593Smuzhiyun 		break;
164*4882a593Smuzhiyun 	}
165*4882a593Smuzhiyun 	of_node_put(np);
166*4882a593Smuzhiyun }
167*4882a593Smuzhiyun 
cell_edac_probe(struct platform_device * pdev)168*4882a593Smuzhiyun static int cell_edac_probe(struct platform_device *pdev)
169*4882a593Smuzhiyun {
170*4882a593Smuzhiyun 	struct cbe_mic_tm_regs __iomem	*regs;
171*4882a593Smuzhiyun 	struct mem_ctl_info		*mci;
172*4882a593Smuzhiyun 	struct edac_mc_layer		layers[2];
173*4882a593Smuzhiyun 	struct cell_edac_priv		*priv;
174*4882a593Smuzhiyun 	u64				reg;
175*4882a593Smuzhiyun 	int				rc, chanmask, num_chans;
176*4882a593Smuzhiyun 
177*4882a593Smuzhiyun 	regs = cbe_get_cpu_mic_tm_regs(cbe_node_to_cpu(pdev->id));
178*4882a593Smuzhiyun 	if (regs == NULL)
179*4882a593Smuzhiyun 		return -ENODEV;
180*4882a593Smuzhiyun 
181*4882a593Smuzhiyun 	edac_op_state = EDAC_OPSTATE_POLL;
182*4882a593Smuzhiyun 
183*4882a593Smuzhiyun 	/* Get channel population */
184*4882a593Smuzhiyun 	reg = in_be64(&regs->mic_mnt_cfg);
185*4882a593Smuzhiyun 	dev_dbg(&pdev->dev, "MIC_MNT_CFG = 0x%016llx\n", reg);
186*4882a593Smuzhiyun 	chanmask = 0;
187*4882a593Smuzhiyun 	if (reg & CBE_MIC_MNT_CFG_CHAN_0_POP)
188*4882a593Smuzhiyun 		chanmask |= 0x1;
189*4882a593Smuzhiyun 	if (reg & CBE_MIC_MNT_CFG_CHAN_1_POP)
190*4882a593Smuzhiyun 		chanmask |= 0x2;
191*4882a593Smuzhiyun 	if (chanmask == 0) {
192*4882a593Smuzhiyun 		dev_warn(&pdev->dev,
193*4882a593Smuzhiyun 			 "Yuck ! No channel populated ? Aborting !\n");
194*4882a593Smuzhiyun 		return -ENODEV;
195*4882a593Smuzhiyun 	}
196*4882a593Smuzhiyun 	dev_dbg(&pdev->dev, "Initial FIR = 0x%016llx\n",
197*4882a593Smuzhiyun 		in_be64(&regs->mic_fir));
198*4882a593Smuzhiyun 
199*4882a593Smuzhiyun 	/* Allocate & init EDAC MC data structure */
200*4882a593Smuzhiyun 	num_chans = chanmask == 3 ? 2 : 1;
201*4882a593Smuzhiyun 
202*4882a593Smuzhiyun 	layers[0].type = EDAC_MC_LAYER_CHIP_SELECT;
203*4882a593Smuzhiyun 	layers[0].size = 1;
204*4882a593Smuzhiyun 	layers[0].is_virt_csrow = true;
205*4882a593Smuzhiyun 	layers[1].type = EDAC_MC_LAYER_CHANNEL;
206*4882a593Smuzhiyun 	layers[1].size = num_chans;
207*4882a593Smuzhiyun 	layers[1].is_virt_csrow = false;
208*4882a593Smuzhiyun 	mci = edac_mc_alloc(pdev->id, ARRAY_SIZE(layers), layers,
209*4882a593Smuzhiyun 			    sizeof(struct cell_edac_priv));
210*4882a593Smuzhiyun 	if (mci == NULL)
211*4882a593Smuzhiyun 		return -ENOMEM;
212*4882a593Smuzhiyun 	priv = mci->pvt_info;
213*4882a593Smuzhiyun 	priv->regs = regs;
214*4882a593Smuzhiyun 	priv->node = pdev->id;
215*4882a593Smuzhiyun 	priv->chanmask = chanmask;
216*4882a593Smuzhiyun 	mci->pdev = &pdev->dev;
217*4882a593Smuzhiyun 	mci->mtype_cap = MEM_FLAG_XDR;
218*4882a593Smuzhiyun 	mci->edac_ctl_cap = EDAC_FLAG_NONE | EDAC_FLAG_EC | EDAC_FLAG_SECDED;
219*4882a593Smuzhiyun 	mci->edac_cap = EDAC_FLAG_EC | EDAC_FLAG_SECDED;
220*4882a593Smuzhiyun 	mci->mod_name = "cell_edac";
221*4882a593Smuzhiyun 	mci->ctl_name = "MIC";
222*4882a593Smuzhiyun 	mci->dev_name = dev_name(&pdev->dev);
223*4882a593Smuzhiyun 	mci->edac_check = cell_edac_check;
224*4882a593Smuzhiyun 	cell_edac_init_csrows(mci);
225*4882a593Smuzhiyun 
226*4882a593Smuzhiyun 	/* Register with EDAC core */
227*4882a593Smuzhiyun 	rc = edac_mc_add_mc(mci);
228*4882a593Smuzhiyun 	if (rc) {
229*4882a593Smuzhiyun 		dev_err(&pdev->dev, "failed to register with EDAC core\n");
230*4882a593Smuzhiyun 		edac_mc_free(mci);
231*4882a593Smuzhiyun 		return rc;
232*4882a593Smuzhiyun 	}
233*4882a593Smuzhiyun 
234*4882a593Smuzhiyun 	return 0;
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun 
cell_edac_remove(struct platform_device * pdev)237*4882a593Smuzhiyun static int cell_edac_remove(struct platform_device *pdev)
238*4882a593Smuzhiyun {
239*4882a593Smuzhiyun 	struct mem_ctl_info *mci = edac_mc_del_mc(&pdev->dev);
240*4882a593Smuzhiyun 	if (mci)
241*4882a593Smuzhiyun 		edac_mc_free(mci);
242*4882a593Smuzhiyun 	return 0;
243*4882a593Smuzhiyun }
244*4882a593Smuzhiyun 
245*4882a593Smuzhiyun static struct platform_driver cell_edac_driver = {
246*4882a593Smuzhiyun 	.driver		= {
247*4882a593Smuzhiyun 		.name	= "cbe-mic",
248*4882a593Smuzhiyun 	},
249*4882a593Smuzhiyun 	.probe		= cell_edac_probe,
250*4882a593Smuzhiyun 	.remove		= cell_edac_remove,
251*4882a593Smuzhiyun };
252*4882a593Smuzhiyun 
cell_edac_init(void)253*4882a593Smuzhiyun static int __init cell_edac_init(void)
254*4882a593Smuzhiyun {
255*4882a593Smuzhiyun 	/* Sanity check registers data structure */
256*4882a593Smuzhiyun 	BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
257*4882a593Smuzhiyun 			      mic_df_ecc_address_0) != 0xf8);
258*4882a593Smuzhiyun 	BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
259*4882a593Smuzhiyun 			      mic_df_ecc_address_1) != 0x1b8);
260*4882a593Smuzhiyun 	BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
261*4882a593Smuzhiyun 			      mic_df_config) != 0x218);
262*4882a593Smuzhiyun 	BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
263*4882a593Smuzhiyun 			      mic_fir) != 0x230);
264*4882a593Smuzhiyun 	BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
265*4882a593Smuzhiyun 			      mic_mnt_cfg) != 0x210);
266*4882a593Smuzhiyun 	BUILD_BUG_ON(offsetof(struct cbe_mic_tm_regs,
267*4882a593Smuzhiyun 			      mic_exc) != 0x208);
268*4882a593Smuzhiyun 
269*4882a593Smuzhiyun 	return platform_driver_register(&cell_edac_driver);
270*4882a593Smuzhiyun }
271*4882a593Smuzhiyun 
cell_edac_exit(void)272*4882a593Smuzhiyun static void __exit cell_edac_exit(void)
273*4882a593Smuzhiyun {
274*4882a593Smuzhiyun 	platform_driver_unregister(&cell_edac_driver);
275*4882a593Smuzhiyun }
276*4882a593Smuzhiyun 
277*4882a593Smuzhiyun module_init(cell_edac_init);
278*4882a593Smuzhiyun module_exit(cell_edac_exit);
279*4882a593Smuzhiyun 
280*4882a593Smuzhiyun MODULE_LICENSE("GPL");
281*4882a593Smuzhiyun MODULE_AUTHOR("Benjamin Herrenschmidt <benh@kernel.crashing.org>");
282*4882a593Smuzhiyun MODULE_DESCRIPTION("ECC counting for Cell MIC");
283