xref: /OK3568_Linux_fs/u-boot/arch/arm/mach-uniphier/dram/umc-pxs2.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * Copyright (C) 2015-2017 Socionext Inc.
3*4882a593Smuzhiyun  *   Author: Masahiro Yamada <yamada.masahiro@socionext.com>
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * based on commit 21b6e480f92ccc38fe0502e3116411d6509d3bf2 of Diag by:
6*4882a593Smuzhiyun  * Copyright (C) 2015 Socionext Inc.
7*4882a593Smuzhiyun  *
8*4882a593Smuzhiyun  * SPDX-License-Identifier:	GPL-2.0+
9*4882a593Smuzhiyun  */
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun #include <common.h>
12*4882a593Smuzhiyun #include <linux/errno.h>
13*4882a593Smuzhiyun #include <linux/io.h>
14*4882a593Smuzhiyun #include <linux/sizes.h>
15*4882a593Smuzhiyun #include <asm/processor.h>
16*4882a593Smuzhiyun 
17*4882a593Smuzhiyun #include "../init.h"
18*4882a593Smuzhiyun #include "../soc-info.h"
19*4882a593Smuzhiyun #include "ddrmphy-regs.h"
20*4882a593Smuzhiyun #include "umc-regs.h"
21*4882a593Smuzhiyun 
22*4882a593Smuzhiyun #define DRAM_CH_NR	3
23*4882a593Smuzhiyun 
24*4882a593Smuzhiyun enum dram_freq {
25*4882a593Smuzhiyun 	DRAM_FREQ_1866M,
26*4882a593Smuzhiyun 	DRAM_FREQ_2133M,
27*4882a593Smuzhiyun 	DRAM_FREQ_NR,
28*4882a593Smuzhiyun };
29*4882a593Smuzhiyun 
30*4882a593Smuzhiyun enum dram_size {
31*4882a593Smuzhiyun 	DRAM_SZ_256M,
32*4882a593Smuzhiyun 	DRAM_SZ_512M,
33*4882a593Smuzhiyun 	DRAM_SZ_NR,
34*4882a593Smuzhiyun };
35*4882a593Smuzhiyun 
36*4882a593Smuzhiyun /* PHY */
37*4882a593Smuzhiyun static u32 ddrphy_pgcr2[DRAM_FREQ_NR] = {0x00FC7E5D, 0x00FC90AB};
38*4882a593Smuzhiyun static u32 ddrphy_ptr0[DRAM_FREQ_NR] = {0x0EA09205, 0x10C0A6C6};
39*4882a593Smuzhiyun static u32 ddrphy_ptr1[DRAM_FREQ_NR] = {0x0DAC041B, 0x0FA104B1};
40*4882a593Smuzhiyun static u32 ddrphy_ptr3[DRAM_FREQ_NR] = {0x15171e45, 0x18182357};
41*4882a593Smuzhiyun static u32 ddrphy_ptr4[DRAM_FREQ_NR] = {0x0e9ad8e9, 0x10b34157};
42*4882a593Smuzhiyun static u32 ddrphy_dtpr0[DRAM_FREQ_NR] = {0x35a00d88, 0x39e40e88};
43*4882a593Smuzhiyun static u32 ddrphy_dtpr1[DRAM_FREQ_NR] = {0x2288cc2c, 0x228a04d0};
44*4882a593Smuzhiyun static u32 ddrphy_dtpr2[DRAM_FREQ_NR] = {0x50005e00, 0x50006a00};
45*4882a593Smuzhiyun static u32 ddrphy_dtpr3[DRAM_FREQ_NR] = {0x0010cb49, 0x0010ec89};
46*4882a593Smuzhiyun static u32 ddrphy_mr0[DRAM_FREQ_NR] = {0x00000115, 0x00000125};
47*4882a593Smuzhiyun static u32 ddrphy_mr2[DRAM_FREQ_NR] = {0x000002a0, 0x000002a8};
48*4882a593Smuzhiyun 
49*4882a593Smuzhiyun /* dependent on package and board design */
50*4882a593Smuzhiyun static u32 ddrphy_acbdlr0[DRAM_CH_NR] = {0x0000000c, 0x0000000c, 0x00000009};
51*4882a593Smuzhiyun 
52*4882a593Smuzhiyun /* DDR multiPHY */
ddrphy_get_rank(int dx)53*4882a593Smuzhiyun static inline int ddrphy_get_rank(int dx)
54*4882a593Smuzhiyun {
55*4882a593Smuzhiyun 	return dx / 2;
56*4882a593Smuzhiyun }
57*4882a593Smuzhiyun 
ddrphy_fifo_reset(void __iomem * phy_base)58*4882a593Smuzhiyun static void ddrphy_fifo_reset(void __iomem *phy_base)
59*4882a593Smuzhiyun {
60*4882a593Smuzhiyun 	u32 tmp;
61*4882a593Smuzhiyun 
62*4882a593Smuzhiyun 	tmp = readl(phy_base + MPHY_PGCR0);
63*4882a593Smuzhiyun 	tmp &= ~MPHY_PGCR0_PHYFRST;
64*4882a593Smuzhiyun 	writel(tmp, phy_base + MPHY_PGCR0);
65*4882a593Smuzhiyun 
66*4882a593Smuzhiyun 	udelay(1);
67*4882a593Smuzhiyun 
68*4882a593Smuzhiyun 	tmp |= MPHY_PGCR0_PHYFRST;
69*4882a593Smuzhiyun 	writel(tmp, phy_base + MPHY_PGCR0);
70*4882a593Smuzhiyun 
71*4882a593Smuzhiyun 	udelay(1);
72*4882a593Smuzhiyun }
73*4882a593Smuzhiyun 
ddrphy_vt_ctrl(void __iomem * phy_base,int enable)74*4882a593Smuzhiyun static void ddrphy_vt_ctrl(void __iomem *phy_base, int enable)
75*4882a593Smuzhiyun {
76*4882a593Smuzhiyun 	u32 tmp;
77*4882a593Smuzhiyun 
78*4882a593Smuzhiyun 	tmp = readl(phy_base + MPHY_PGCR1);
79*4882a593Smuzhiyun 
80*4882a593Smuzhiyun 	if (enable)
81*4882a593Smuzhiyun 		tmp &= ~MPHY_PGCR1_INHVT;
82*4882a593Smuzhiyun 	else
83*4882a593Smuzhiyun 		tmp |= MPHY_PGCR1_INHVT;
84*4882a593Smuzhiyun 
85*4882a593Smuzhiyun 	writel(tmp, phy_base + MPHY_PGCR1);
86*4882a593Smuzhiyun 
87*4882a593Smuzhiyun 	if (!enable) {
88*4882a593Smuzhiyun 		while (!(readl(phy_base + MPHY_PGSR1) & MPHY_PGSR1_VTSTOP))
89*4882a593Smuzhiyun 			cpu_relax();
90*4882a593Smuzhiyun 	}
91*4882a593Smuzhiyun }
92*4882a593Smuzhiyun 
ddrphy_dqs_delay_fixup(void __iomem * phy_base,int nr_dx,int step)93*4882a593Smuzhiyun static void ddrphy_dqs_delay_fixup(void __iomem *phy_base, int nr_dx, int step)
94*4882a593Smuzhiyun {
95*4882a593Smuzhiyun 	int dx;
96*4882a593Smuzhiyun 	u32 lcdlr1, rdqsd;
97*4882a593Smuzhiyun 	void __iomem *dx_base = phy_base + MPHY_DX_BASE;
98*4882a593Smuzhiyun 
99*4882a593Smuzhiyun 	ddrphy_vt_ctrl(phy_base, 0);
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun 	for (dx = 0; dx < nr_dx; dx++) {
102*4882a593Smuzhiyun 		lcdlr1 = readl(dx_base + MPHY_DX_LCDLR1);
103*4882a593Smuzhiyun 		rdqsd = (lcdlr1 >> 8) & 0xff;
104*4882a593Smuzhiyun 		rdqsd = clamp(rdqsd + step, 0U, 0xffU);
105*4882a593Smuzhiyun 		lcdlr1 = (lcdlr1 & ~(0xff << 8)) | (rdqsd << 8);
106*4882a593Smuzhiyun 		writel(lcdlr1, dx_base + MPHY_DX_LCDLR1);
107*4882a593Smuzhiyun 		readl(dx_base + MPHY_DX_LCDLR1); /* relax */
108*4882a593Smuzhiyun 		dx_base += MPHY_DX_STRIDE;
109*4882a593Smuzhiyun 	}
110*4882a593Smuzhiyun 
111*4882a593Smuzhiyun 	ddrphy_vt_ctrl(phy_base, 1);
112*4882a593Smuzhiyun }
113*4882a593Smuzhiyun 
ddrphy_get_system_latency(void __iomem * phy_base,int width)114*4882a593Smuzhiyun static int ddrphy_get_system_latency(void __iomem *phy_base, int width)
115*4882a593Smuzhiyun {
116*4882a593Smuzhiyun 	void __iomem *dx_base = phy_base + MPHY_DX_BASE;
117*4882a593Smuzhiyun 	const int nr_dx = width / 8;
118*4882a593Smuzhiyun 	int dx, rank;
119*4882a593Smuzhiyun 	u32 gtr;
120*4882a593Smuzhiyun 	int dgsl, dgsl_min = INT_MAX, dgsl_max = 0;
121*4882a593Smuzhiyun 
122*4882a593Smuzhiyun 	for (dx = 0; dx < nr_dx; dx++) {
123*4882a593Smuzhiyun 		gtr = readl(dx_base + MPHY_DX_GTR);
124*4882a593Smuzhiyun 		for (rank = 0; rank < 4; rank++) {
125*4882a593Smuzhiyun 			dgsl = gtr & 0x7;
126*4882a593Smuzhiyun 			/* if dgsl is zero, this rank was not trained. skip. */
127*4882a593Smuzhiyun 			if (dgsl) {
128*4882a593Smuzhiyun 				dgsl_min = min(dgsl_min, dgsl);
129*4882a593Smuzhiyun 				dgsl_max = max(dgsl_max, dgsl);
130*4882a593Smuzhiyun 			}
131*4882a593Smuzhiyun 			gtr >>= 3;
132*4882a593Smuzhiyun 		}
133*4882a593Smuzhiyun 		dx_base += MPHY_DX_STRIDE;
134*4882a593Smuzhiyun 	}
135*4882a593Smuzhiyun 
136*4882a593Smuzhiyun 	if (dgsl_min != dgsl_max)
137*4882a593Smuzhiyun 		printf("DQS Gateing System Latencies are not all leveled.\n");
138*4882a593Smuzhiyun 
139*4882a593Smuzhiyun 	return dgsl_max;
140*4882a593Smuzhiyun }
141*4882a593Smuzhiyun 
ddrphy_init(void __iomem * phy_base,enum dram_freq freq,int width,int ch)142*4882a593Smuzhiyun static void ddrphy_init(void __iomem *phy_base, enum dram_freq freq, int width,
143*4882a593Smuzhiyun 			int ch)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun 	u32 tmp;
146*4882a593Smuzhiyun 	void __iomem *zq_base, *dx_base;
147*4882a593Smuzhiyun 	int zq, dx;
148*4882a593Smuzhiyun 	int nr_dx;
149*4882a593Smuzhiyun 
150*4882a593Smuzhiyun 	nr_dx = width / 8;
151*4882a593Smuzhiyun 
152*4882a593Smuzhiyun 	writel(MPHY_PIR_ZCALBYP,        phy_base + MPHY_PIR);
153*4882a593Smuzhiyun 	/*
154*4882a593Smuzhiyun 	 * Disable RGLVT bit (Read DQS Gating LCDL Delay VT Compensation)
155*4882a593Smuzhiyun 	 * to avoid read error issue.
156*4882a593Smuzhiyun 	 */
157*4882a593Smuzhiyun 	writel(0x07d81e37, phy_base + MPHY_PGCR0);
158*4882a593Smuzhiyun 	writel(0x0200c4e0, phy_base + MPHY_PGCR1);
159*4882a593Smuzhiyun 
160*4882a593Smuzhiyun 	tmp = ddrphy_pgcr2[freq];
161*4882a593Smuzhiyun 	if (width >= 32)
162*4882a593Smuzhiyun 		tmp |= MPHY_PGCR2_DUALCHN | MPHY_PGCR2_ACPDDC;
163*4882a593Smuzhiyun 	writel(tmp, phy_base + MPHY_PGCR2);
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun 	writel(ddrphy_ptr0[freq], phy_base + MPHY_PTR0);
166*4882a593Smuzhiyun 	writel(ddrphy_ptr1[freq], phy_base + MPHY_PTR1);
167*4882a593Smuzhiyun 	writel(0x00083def, phy_base + MPHY_PTR2);
168*4882a593Smuzhiyun 	writel(ddrphy_ptr3[freq], phy_base + MPHY_PTR3);
169*4882a593Smuzhiyun 	writel(ddrphy_ptr4[freq], phy_base + MPHY_PTR4);
170*4882a593Smuzhiyun 
171*4882a593Smuzhiyun 	writel(ddrphy_acbdlr0[ch], phy_base + MPHY_ACBDLR0);
172*4882a593Smuzhiyun 
173*4882a593Smuzhiyun 	writel(0x55555555, phy_base + MPHY_ACIOCR1);
174*4882a593Smuzhiyun 	writel(0x00000000, phy_base + MPHY_ACIOCR2);
175*4882a593Smuzhiyun 	writel(0x55555555, phy_base + MPHY_ACIOCR3);
176*4882a593Smuzhiyun 	writel(0x00000000, phy_base + MPHY_ACIOCR4);
177*4882a593Smuzhiyun 	writel(0x00000055, phy_base + MPHY_ACIOCR5);
178*4882a593Smuzhiyun 	writel(0x00181aa4, phy_base + MPHY_DXCCR);
179*4882a593Smuzhiyun 
180*4882a593Smuzhiyun 	writel(0x0024641e, phy_base + MPHY_DSGCR);
181*4882a593Smuzhiyun 	writel(0x0000040b, phy_base + MPHY_DCR);
182*4882a593Smuzhiyun 	writel(ddrphy_dtpr0[freq], phy_base + MPHY_DTPR0);
183*4882a593Smuzhiyun 	writel(ddrphy_dtpr1[freq], phy_base + MPHY_DTPR1);
184*4882a593Smuzhiyun 	writel(ddrphy_dtpr2[freq], phy_base + MPHY_DTPR2);
185*4882a593Smuzhiyun 	writel(ddrphy_dtpr3[freq], phy_base + MPHY_DTPR3);
186*4882a593Smuzhiyun 	writel(ddrphy_mr0[freq], phy_base + MPHY_MR0);
187*4882a593Smuzhiyun 	writel(0x00000006, phy_base + MPHY_MR1);
188*4882a593Smuzhiyun 	writel(ddrphy_mr2[freq], phy_base + MPHY_MR2);
189*4882a593Smuzhiyun 	writel(0x00000000, phy_base + MPHY_MR3);
190*4882a593Smuzhiyun 
191*4882a593Smuzhiyun 	tmp = 0;
192*4882a593Smuzhiyun 	for (dx = 0; dx < nr_dx; dx++)
193*4882a593Smuzhiyun 		tmp |= BIT(MPHY_DTCR_RANKEN_SHIFT + ddrphy_get_rank(dx));
194*4882a593Smuzhiyun 	writel(0x90003087 | tmp, phy_base + MPHY_DTCR);
195*4882a593Smuzhiyun 
196*4882a593Smuzhiyun 	writel(0x00000000, phy_base + MPHY_DTAR0);
197*4882a593Smuzhiyun 	writel(0x00000008, phy_base + MPHY_DTAR1);
198*4882a593Smuzhiyun 	writel(0x00000010, phy_base + MPHY_DTAR2);
199*4882a593Smuzhiyun 	writel(0x00000018, phy_base + MPHY_DTAR3);
200*4882a593Smuzhiyun 	writel(0xdd22ee11, phy_base + MPHY_DTDR0);
201*4882a593Smuzhiyun 	writel(0x7788bb44, phy_base + MPHY_DTDR1);
202*4882a593Smuzhiyun 
203*4882a593Smuzhiyun 	/* impedance control settings */
204*4882a593Smuzhiyun 	writel(0x04048900, phy_base + MPHY_ZQCR);
205*4882a593Smuzhiyun 
206*4882a593Smuzhiyun 	zq_base = phy_base + MPHY_ZQ_BASE;
207*4882a593Smuzhiyun 	for (zq = 0; zq < 4; zq++) {
208*4882a593Smuzhiyun 		/*
209*4882a593Smuzhiyun 		 * board-dependent
210*4882a593Smuzhiyun 		 * PXS2: CH0ZQ0=0x5B, CH1ZQ0=0x5B, CH2ZQ0=0x59, others=0x5D
211*4882a593Smuzhiyun 		 */
212*4882a593Smuzhiyun 		writel(0x0007BB5D, zq_base + MPHY_ZQ_PR);
213*4882a593Smuzhiyun 		zq_base += MPHY_ZQ_STRIDE;
214*4882a593Smuzhiyun 	}
215*4882a593Smuzhiyun 
216*4882a593Smuzhiyun 	/* DATX8 settings */
217*4882a593Smuzhiyun 	dx_base = phy_base + MPHY_DX_BASE;
218*4882a593Smuzhiyun 	for (dx = 0; dx < 4; dx++) {
219*4882a593Smuzhiyun 		tmp = readl(dx_base + MPHY_DX_GCR0);
220*4882a593Smuzhiyun 		tmp &= ~MPHY_DX_GCR0_WLRKEN_MASK;
221*4882a593Smuzhiyun 		tmp |= BIT(MPHY_DX_GCR0_WLRKEN_SHIFT + ddrphy_get_rank(dx)) &
222*4882a593Smuzhiyun 						MPHY_DX_GCR0_WLRKEN_MASK;
223*4882a593Smuzhiyun 		writel(tmp, dx_base + MPHY_DX_GCR0);
224*4882a593Smuzhiyun 
225*4882a593Smuzhiyun 		writel(0x00000000, dx_base + MPHY_DX_GCR1);
226*4882a593Smuzhiyun 		writel(0x00000000, dx_base + MPHY_DX_GCR2);
227*4882a593Smuzhiyun 		writel(0x00000000, dx_base + MPHY_DX_GCR3);
228*4882a593Smuzhiyun 		dx_base += MPHY_DX_STRIDE;
229*4882a593Smuzhiyun 	}
230*4882a593Smuzhiyun 
231*4882a593Smuzhiyun 	while (!(readl(phy_base + MPHY_PGSR0) & MPHY_PGSR0_IDONE))
232*4882a593Smuzhiyun 		cpu_relax();
233*4882a593Smuzhiyun 
234*4882a593Smuzhiyun 	ddrphy_dqs_delay_fixup(phy_base, nr_dx, -4);
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun 
237*4882a593Smuzhiyun struct ddrphy_init_sequence {
238*4882a593Smuzhiyun 	char *description;
239*4882a593Smuzhiyun 	u32 init_flag;
240*4882a593Smuzhiyun 	u32 done_flag;
241*4882a593Smuzhiyun 	u32 err_flag;
242*4882a593Smuzhiyun };
243*4882a593Smuzhiyun 
244*4882a593Smuzhiyun static const struct ddrphy_init_sequence impedance_calibration_sequence[] = {
245*4882a593Smuzhiyun 	{
246*4882a593Smuzhiyun 		"Impedance Calibration",
247*4882a593Smuzhiyun 		MPHY_PIR_ZCAL,
248*4882a593Smuzhiyun 		MPHY_PGSR0_ZCDONE,
249*4882a593Smuzhiyun 		MPHY_PGSR0_ZCERR,
250*4882a593Smuzhiyun 	},
251*4882a593Smuzhiyun 	{ /* sentinel */ }
252*4882a593Smuzhiyun };
253*4882a593Smuzhiyun 
254*4882a593Smuzhiyun static const struct ddrphy_init_sequence dram_init_sequence[] = {
255*4882a593Smuzhiyun 	{
256*4882a593Smuzhiyun 		"DRAM Initialization",
257*4882a593Smuzhiyun 		MPHY_PIR_DRAMRST | MPHY_PIR_DRAMINIT,
258*4882a593Smuzhiyun 		MPHY_PGSR0_DIDONE,
259*4882a593Smuzhiyun 		0,
260*4882a593Smuzhiyun 	},
261*4882a593Smuzhiyun 	{ /* sentinel */ }
262*4882a593Smuzhiyun };
263*4882a593Smuzhiyun 
264*4882a593Smuzhiyun static const struct ddrphy_init_sequence training_sequence[] = {
265*4882a593Smuzhiyun 	{
266*4882a593Smuzhiyun 		"Write Leveling",
267*4882a593Smuzhiyun 		MPHY_PIR_WL,
268*4882a593Smuzhiyun 		MPHY_PGSR0_WLDONE,
269*4882a593Smuzhiyun 		MPHY_PGSR0_WLERR,
270*4882a593Smuzhiyun 	},
271*4882a593Smuzhiyun 	{
272*4882a593Smuzhiyun 		"Read DQS Gate Training",
273*4882a593Smuzhiyun 		MPHY_PIR_QSGATE,
274*4882a593Smuzhiyun 		MPHY_PGSR0_QSGDONE,
275*4882a593Smuzhiyun 		MPHY_PGSR0_QSGERR,
276*4882a593Smuzhiyun 	},
277*4882a593Smuzhiyun 	{
278*4882a593Smuzhiyun 		"Write Leveling Adjustment",
279*4882a593Smuzhiyun 		MPHY_PIR_WLADJ,
280*4882a593Smuzhiyun 		MPHY_PGSR0_WLADONE,
281*4882a593Smuzhiyun 		MPHY_PGSR0_WLAERR,
282*4882a593Smuzhiyun 	},
283*4882a593Smuzhiyun 	{
284*4882a593Smuzhiyun 		"Read Bit Deskew",
285*4882a593Smuzhiyun 		MPHY_PIR_RDDSKW,
286*4882a593Smuzhiyun 		MPHY_PGSR0_RDDONE,
287*4882a593Smuzhiyun 		MPHY_PGSR0_RDERR,
288*4882a593Smuzhiyun 	},
289*4882a593Smuzhiyun 	{
290*4882a593Smuzhiyun 		"Write Bit Deskew",
291*4882a593Smuzhiyun 		MPHY_PIR_WRDSKW,
292*4882a593Smuzhiyun 		MPHY_PGSR0_WDDONE,
293*4882a593Smuzhiyun 		MPHY_PGSR0_WDERR,
294*4882a593Smuzhiyun 	},
295*4882a593Smuzhiyun 	{
296*4882a593Smuzhiyun 		"Read Eye Training",
297*4882a593Smuzhiyun 		MPHY_PIR_RDEYE,
298*4882a593Smuzhiyun 		MPHY_PGSR0_REDONE,
299*4882a593Smuzhiyun 		MPHY_PGSR0_REERR,
300*4882a593Smuzhiyun 	},
301*4882a593Smuzhiyun 	{
302*4882a593Smuzhiyun 		"Write Eye Training",
303*4882a593Smuzhiyun 		MPHY_PIR_WREYE,
304*4882a593Smuzhiyun 		MPHY_PGSR0_WEDONE,
305*4882a593Smuzhiyun 		MPHY_PGSR0_WEERR,
306*4882a593Smuzhiyun 	},
307*4882a593Smuzhiyun 	{ /* sentinel */ }
308*4882a593Smuzhiyun };
309*4882a593Smuzhiyun 
__ddrphy_training(void __iomem * phy_base,const struct ddrphy_init_sequence * seq)310*4882a593Smuzhiyun static int __ddrphy_training(void __iomem *phy_base,
311*4882a593Smuzhiyun 			     const struct ddrphy_init_sequence *seq)
312*4882a593Smuzhiyun {
313*4882a593Smuzhiyun 	const struct ddrphy_init_sequence *s;
314*4882a593Smuzhiyun 	u32 pgsr0;
315*4882a593Smuzhiyun 	u32 init_flag = MPHY_PIR_INIT;
316*4882a593Smuzhiyun 	u32 done_flag = MPHY_PGSR0_IDONE;
317*4882a593Smuzhiyun 	int timeout = 50000; /* 50 msec is long enough */
318*4882a593Smuzhiyun #ifdef DISPLAY_ELAPSED_TIME
319*4882a593Smuzhiyun 	ulong start = get_timer(0);
320*4882a593Smuzhiyun #endif
321*4882a593Smuzhiyun 
322*4882a593Smuzhiyun 	for (s = seq; s->description; s++) {
323*4882a593Smuzhiyun 		init_flag |= s->init_flag;
324*4882a593Smuzhiyun 		done_flag |= s->done_flag;
325*4882a593Smuzhiyun 	}
326*4882a593Smuzhiyun 
327*4882a593Smuzhiyun 	writel(init_flag, phy_base + MPHY_PIR);
328*4882a593Smuzhiyun 
329*4882a593Smuzhiyun 	do {
330*4882a593Smuzhiyun 		if (--timeout < 0) {
331*4882a593Smuzhiyun 			pr_err("%s: error: timeout during DDR training\n",
332*4882a593Smuzhiyun 			       __func__);
333*4882a593Smuzhiyun 			return -ETIMEDOUT;
334*4882a593Smuzhiyun 		}
335*4882a593Smuzhiyun 		udelay(1);
336*4882a593Smuzhiyun 		pgsr0 = readl(phy_base + MPHY_PGSR0);
337*4882a593Smuzhiyun 	} while ((pgsr0 & done_flag) != done_flag);
338*4882a593Smuzhiyun 
339*4882a593Smuzhiyun 	for (s = seq; s->description; s++) {
340*4882a593Smuzhiyun 		if (pgsr0 & s->err_flag) {
341*4882a593Smuzhiyun 			pr_err("%s: error: %s failed\n", __func__,
342*4882a593Smuzhiyun 			       s->description);
343*4882a593Smuzhiyun 			return -EIO;
344*4882a593Smuzhiyun 		}
345*4882a593Smuzhiyun 	}
346*4882a593Smuzhiyun 
347*4882a593Smuzhiyun #ifdef DISPLAY_ELAPSED_TIME
348*4882a593Smuzhiyun 	printf("%s: info: elapsed time %ld msec\n", get_timer(start));
349*4882a593Smuzhiyun #endif
350*4882a593Smuzhiyun 
351*4882a593Smuzhiyun 	return 0;
352*4882a593Smuzhiyun }
353*4882a593Smuzhiyun 
ddrphy_impedance_calibration(void __iomem * phy_base)354*4882a593Smuzhiyun static int ddrphy_impedance_calibration(void __iomem *phy_base)
355*4882a593Smuzhiyun {
356*4882a593Smuzhiyun 	int ret;
357*4882a593Smuzhiyun 	u32 tmp;
358*4882a593Smuzhiyun 
359*4882a593Smuzhiyun 	ret = __ddrphy_training(phy_base, impedance_calibration_sequence);
360*4882a593Smuzhiyun 	if (ret)
361*4882a593Smuzhiyun 		return ret;
362*4882a593Smuzhiyun 
363*4882a593Smuzhiyun 	/*
364*4882a593Smuzhiyun 	 * Because of a hardware bug, IDONE flag is set when the first ZQ block
365*4882a593Smuzhiyun 	 * is calibrated.  The flag does not guarantee the completion for all
366*4882a593Smuzhiyun 	 * the ZQ blocks.  Wait a little more just in case.
367*4882a593Smuzhiyun 	 */
368*4882a593Smuzhiyun 	udelay(1);
369*4882a593Smuzhiyun 
370*4882a593Smuzhiyun 	/* reflect ZQ settings and enable average algorithm*/
371*4882a593Smuzhiyun 	tmp = readl(phy_base + MPHY_ZQCR);
372*4882a593Smuzhiyun 	tmp |= MPHY_ZQCR_FORCE_ZCAL_VT_UPDATE;
373*4882a593Smuzhiyun 	writel(tmp, phy_base + MPHY_ZQCR);
374*4882a593Smuzhiyun 	tmp &= ~MPHY_ZQCR_FORCE_ZCAL_VT_UPDATE;
375*4882a593Smuzhiyun 	tmp |= MPHY_ZQCR_AVGEN;
376*4882a593Smuzhiyun 	writel(tmp, phy_base + MPHY_ZQCR);
377*4882a593Smuzhiyun 
378*4882a593Smuzhiyun 	return 0;
379*4882a593Smuzhiyun }
380*4882a593Smuzhiyun 
ddrphy_dram_init(void __iomem * phy_base)381*4882a593Smuzhiyun static int ddrphy_dram_init(void __iomem *phy_base)
382*4882a593Smuzhiyun {
383*4882a593Smuzhiyun 	return __ddrphy_training(phy_base, dram_init_sequence);
384*4882a593Smuzhiyun }
385*4882a593Smuzhiyun 
ddrphy_training(void __iomem * phy_base)386*4882a593Smuzhiyun static int ddrphy_training(void __iomem *phy_base)
387*4882a593Smuzhiyun {
388*4882a593Smuzhiyun 	return __ddrphy_training(phy_base, training_sequence);
389*4882a593Smuzhiyun }
390*4882a593Smuzhiyun 
391*4882a593Smuzhiyun /* UMC */
392*4882a593Smuzhiyun static u32 umc_cmdctla[DRAM_FREQ_NR] = {0x66DD131D, 0x77EE1722};
393*4882a593Smuzhiyun /*
394*4882a593Smuzhiyun  * The ch2 is a different generation UMC core.
395*4882a593Smuzhiyun  * The register spec is different, unfortunately.
396*4882a593Smuzhiyun  */
397*4882a593Smuzhiyun static u32 umc_cmdctlb_ch01[DRAM_FREQ_NR] = {0x13E87C44, 0x18F88C44};
398*4882a593Smuzhiyun static u32 umc_cmdctlb_ch2[DRAM_FREQ_NR] = {0x19E8DC44, 0x1EF8EC44};
399*4882a593Smuzhiyun static u32 umc_spcctla[DRAM_FREQ_NR][DRAM_SZ_NR] = {
400*4882a593Smuzhiyun 	{0x004A071D, 0x0078071D},
401*4882a593Smuzhiyun 	{0x0055081E, 0x0089081E},
402*4882a593Smuzhiyun };
403*4882a593Smuzhiyun 
404*4882a593Smuzhiyun static u32 umc_spcctlb[] = {0x00FF000A, 0x00FF000B};
405*4882a593Smuzhiyun /* The ch2 is different for some reason only hardware guys know... */
406*4882a593Smuzhiyun static u32 umc_flowctla_ch01[] = {0x0800001E, 0x08000022};
407*4882a593Smuzhiyun static u32 umc_flowctla_ch2[] = {0x0800001E, 0x0800001E};
408*4882a593Smuzhiyun 
umc_set_system_latency(void __iomem * dc_base,int phy_latency)409*4882a593Smuzhiyun static void umc_set_system_latency(void __iomem *dc_base, int phy_latency)
410*4882a593Smuzhiyun {
411*4882a593Smuzhiyun 	u32 val;
412*4882a593Smuzhiyun 	int latency;
413*4882a593Smuzhiyun 
414*4882a593Smuzhiyun 	val = readl(dc_base + UMC_RDATACTL_D0);
415*4882a593Smuzhiyun 	latency = (val & UMC_RDATACTL_RADLTY_MASK) >> UMC_RDATACTL_RADLTY_SHIFT;
416*4882a593Smuzhiyun 	latency += (val & UMC_RDATACTL_RAD2LTY_MASK) >>
417*4882a593Smuzhiyun 						UMC_RDATACTL_RAD2LTY_SHIFT;
418*4882a593Smuzhiyun 	/*
419*4882a593Smuzhiyun 	 * UMC works at the half clock rate of the PHY.
420*4882a593Smuzhiyun 	 * The LSB of latency is ignored
421*4882a593Smuzhiyun 	 */
422*4882a593Smuzhiyun 	latency += phy_latency & ~1;
423*4882a593Smuzhiyun 
424*4882a593Smuzhiyun 	val &= ~(UMC_RDATACTL_RADLTY_MASK | UMC_RDATACTL_RAD2LTY_MASK);
425*4882a593Smuzhiyun 	if (latency > 0xf) {
426*4882a593Smuzhiyun 		val |= 0xf << UMC_RDATACTL_RADLTY_SHIFT;
427*4882a593Smuzhiyun 		val |= (latency - 0xf) << UMC_RDATACTL_RAD2LTY_SHIFT;
428*4882a593Smuzhiyun 	} else {
429*4882a593Smuzhiyun 		val |= latency << UMC_RDATACTL_RADLTY_SHIFT;
430*4882a593Smuzhiyun 	}
431*4882a593Smuzhiyun 
432*4882a593Smuzhiyun 	writel(val, dc_base + UMC_RDATACTL_D0);
433*4882a593Smuzhiyun 	writel(val, dc_base + UMC_RDATACTL_D1);
434*4882a593Smuzhiyun 
435*4882a593Smuzhiyun 	readl(dc_base + UMC_RDATACTL_D1); /* relax */
436*4882a593Smuzhiyun }
437*4882a593Smuzhiyun 
438*4882a593Smuzhiyun /* enable/disable auto refresh */
umc_refresh_ctrl(void __iomem * dc_base,int enable)439*4882a593Smuzhiyun static void umc_refresh_ctrl(void __iomem *dc_base, int enable)
440*4882a593Smuzhiyun {
441*4882a593Smuzhiyun 	u32 tmp;
442*4882a593Smuzhiyun 
443*4882a593Smuzhiyun 	tmp = readl(dc_base + UMC_SPCSETB);
444*4882a593Smuzhiyun 	tmp &= ~UMC_SPCSETB_AREFMD_MASK;
445*4882a593Smuzhiyun 
446*4882a593Smuzhiyun 	if (enable)
447*4882a593Smuzhiyun 		tmp |= UMC_SPCSETB_AREFMD_ARB;
448*4882a593Smuzhiyun 	else
449*4882a593Smuzhiyun 		tmp |= UMC_SPCSETB_AREFMD_REG;
450*4882a593Smuzhiyun 
451*4882a593Smuzhiyun 	writel(tmp, dc_base + UMC_SPCSETB);
452*4882a593Smuzhiyun 	udelay(1);
453*4882a593Smuzhiyun }
454*4882a593Smuzhiyun 
umc_ud_init(void __iomem * umc_base,int ch)455*4882a593Smuzhiyun static void umc_ud_init(void __iomem *umc_base, int ch)
456*4882a593Smuzhiyun {
457*4882a593Smuzhiyun 	writel(0x00000003, umc_base + UMC_BITPERPIXELMODE_D0);
458*4882a593Smuzhiyun 
459*4882a593Smuzhiyun 	if (ch == 2)
460*4882a593Smuzhiyun 		writel(0x00000033, umc_base + UMC_PAIR1DOFF_D0);
461*4882a593Smuzhiyun }
462*4882a593Smuzhiyun 
umc_dc_init(void __iomem * dc_base,enum dram_freq freq,unsigned long size,int width,int ch)463*4882a593Smuzhiyun static int umc_dc_init(void __iomem *dc_base, enum dram_freq freq,
464*4882a593Smuzhiyun 		       unsigned long size, int width, int ch)
465*4882a593Smuzhiyun {
466*4882a593Smuzhiyun 	enum dram_size size_e;
467*4882a593Smuzhiyun 	int latency;
468*4882a593Smuzhiyun 	u32 val;
469*4882a593Smuzhiyun 
470*4882a593Smuzhiyun 	switch (size) {
471*4882a593Smuzhiyun 	case 0:
472*4882a593Smuzhiyun 		return 0;
473*4882a593Smuzhiyun 	case SZ_256M:
474*4882a593Smuzhiyun 		size_e = DRAM_SZ_256M;
475*4882a593Smuzhiyun 		break;
476*4882a593Smuzhiyun 	case SZ_512M:
477*4882a593Smuzhiyun 		size_e = DRAM_SZ_512M;
478*4882a593Smuzhiyun 		break;
479*4882a593Smuzhiyun 	default:
480*4882a593Smuzhiyun 		pr_err("unsupported DRAM size 0x%08lx (per 16bit) for ch%d\n",
481*4882a593Smuzhiyun 		       size, ch);
482*4882a593Smuzhiyun 		return -EINVAL;
483*4882a593Smuzhiyun 	}
484*4882a593Smuzhiyun 
485*4882a593Smuzhiyun 	writel(umc_cmdctla[freq], dc_base + UMC_CMDCTLA);
486*4882a593Smuzhiyun 
487*4882a593Smuzhiyun 	writel(ch == 2 ? umc_cmdctlb_ch2[freq] : umc_cmdctlb_ch01[freq],
488*4882a593Smuzhiyun 	       dc_base + UMC_CMDCTLB);
489*4882a593Smuzhiyun 
490*4882a593Smuzhiyun 	writel(umc_spcctla[freq][size_e], dc_base + UMC_SPCCTLA);
491*4882a593Smuzhiyun 	writel(umc_spcctlb[freq], dc_base + UMC_SPCCTLB);
492*4882a593Smuzhiyun 
493*4882a593Smuzhiyun 	val = 0x000e000e;
494*4882a593Smuzhiyun 	latency = 12;
495*4882a593Smuzhiyun 	/* ES2 inserted one more FF to the logic. */
496*4882a593Smuzhiyun 	if (uniphier_get_soc_model() >= 2)
497*4882a593Smuzhiyun 		latency += 2;
498*4882a593Smuzhiyun 
499*4882a593Smuzhiyun 	if (latency > 0xf) {
500*4882a593Smuzhiyun 		val |= 0xf << UMC_RDATACTL_RADLTY_SHIFT;
501*4882a593Smuzhiyun 		val |= (latency - 0xf) << UMC_RDATACTL_RAD2LTY_SHIFT;
502*4882a593Smuzhiyun 	} else {
503*4882a593Smuzhiyun 		val |= latency << UMC_RDATACTL_RADLTY_SHIFT;
504*4882a593Smuzhiyun 	}
505*4882a593Smuzhiyun 
506*4882a593Smuzhiyun 	writel(val, dc_base + UMC_RDATACTL_D0);
507*4882a593Smuzhiyun 	if (width >= 32)
508*4882a593Smuzhiyun 		writel(val, dc_base + UMC_RDATACTL_D1);
509*4882a593Smuzhiyun 
510*4882a593Smuzhiyun 	writel(0x04060A02, dc_base + UMC_WDATACTL_D0);
511*4882a593Smuzhiyun 	if (width >= 32)
512*4882a593Smuzhiyun 		writel(0x04060A02, dc_base + UMC_WDATACTL_D1);
513*4882a593Smuzhiyun 	writel(0x04000000, dc_base + UMC_DATASET);
514*4882a593Smuzhiyun 	writel(0x00400020, dc_base + UMC_DCCGCTL);
515*4882a593Smuzhiyun 	writel(0x00000084, dc_base + UMC_FLOWCTLG);
516*4882a593Smuzhiyun 	writel(0x00000000, dc_base + UMC_ACSSETA);
517*4882a593Smuzhiyun 
518*4882a593Smuzhiyun 	writel(ch == 2 ? umc_flowctla_ch2[freq] : umc_flowctla_ch01[freq],
519*4882a593Smuzhiyun 	       dc_base + UMC_FLOWCTLA);
520*4882a593Smuzhiyun 
521*4882a593Smuzhiyun 	writel(0x00004400, dc_base + UMC_FLOWCTLC);
522*4882a593Smuzhiyun 	writel(0x200A0A00, dc_base + UMC_SPCSETB);
523*4882a593Smuzhiyun 	writel(0x00000520, dc_base + UMC_DFICUPDCTLA);
524*4882a593Smuzhiyun 	writel(0x0000000D, dc_base + UMC_RESPCTL);
525*4882a593Smuzhiyun 
526*4882a593Smuzhiyun 	if (ch != 2) {
527*4882a593Smuzhiyun 		writel(0x00202000, dc_base + UMC_FLOWCTLB);
528*4882a593Smuzhiyun 		writel(0xFDBFFFFF, dc_base + UMC_FLOWCTLOB0);
529*4882a593Smuzhiyun 		writel(0xFFFFFFFF, dc_base + UMC_FLOWCTLOB1);
530*4882a593Smuzhiyun 		writel(0x00080700, dc_base + UMC_BSICMAPSET);
531*4882a593Smuzhiyun 	} else {
532*4882a593Smuzhiyun 		writel(0x00200000, dc_base + UMC_FLOWCTLB);
533*4882a593Smuzhiyun 		writel(0x00000000, dc_base + UMC_BSICMAPSET);
534*4882a593Smuzhiyun 	}
535*4882a593Smuzhiyun 
536*4882a593Smuzhiyun 	writel(0x00000000, dc_base + UMC_ERRMASKA);
537*4882a593Smuzhiyun 	writel(0x00000000, dc_base + UMC_ERRMASKB);
538*4882a593Smuzhiyun 
539*4882a593Smuzhiyun 	return 0;
540*4882a593Smuzhiyun }
541*4882a593Smuzhiyun 
umc_ch_init(void __iomem * umc_ch_base,enum dram_freq freq,unsigned long size,unsigned int width,int ch)542*4882a593Smuzhiyun static int umc_ch_init(void __iomem *umc_ch_base, enum dram_freq freq,
543*4882a593Smuzhiyun 		       unsigned long size, unsigned int width, int ch)
544*4882a593Smuzhiyun {
545*4882a593Smuzhiyun 	void __iomem *dc_base = umc_ch_base + 0x00011000;
546*4882a593Smuzhiyun 	void __iomem *phy_base = umc_ch_base + 0x00030000;
547*4882a593Smuzhiyun 	int ret;
548*4882a593Smuzhiyun 
549*4882a593Smuzhiyun 	writel(0x00000002, dc_base + UMC_INITSET);
550*4882a593Smuzhiyun 	while (readl(dc_base + UMC_INITSTAT) & BIT(2))
551*4882a593Smuzhiyun 		cpu_relax();
552*4882a593Smuzhiyun 
553*4882a593Smuzhiyun 	/* deassert PHY reset signals */
554*4882a593Smuzhiyun 	writel(UMC_DIOCTLA_CTL_NRST | UMC_DIOCTLA_CFG_NRST,
555*4882a593Smuzhiyun 	       dc_base + UMC_DIOCTLA);
556*4882a593Smuzhiyun 
557*4882a593Smuzhiyun 	ddrphy_init(phy_base, freq, width, ch);
558*4882a593Smuzhiyun 
559*4882a593Smuzhiyun 	ret = ddrphy_impedance_calibration(phy_base);
560*4882a593Smuzhiyun 	if (ret)
561*4882a593Smuzhiyun 		return ret;
562*4882a593Smuzhiyun 
563*4882a593Smuzhiyun 	ddrphy_dram_init(phy_base);
564*4882a593Smuzhiyun 	if (ret)
565*4882a593Smuzhiyun 		return ret;
566*4882a593Smuzhiyun 
567*4882a593Smuzhiyun 	ret = umc_dc_init(dc_base, freq, size, width, ch);
568*4882a593Smuzhiyun 	if (ret)
569*4882a593Smuzhiyun 		return ret;
570*4882a593Smuzhiyun 
571*4882a593Smuzhiyun 	umc_ud_init(umc_ch_base, ch);
572*4882a593Smuzhiyun 
573*4882a593Smuzhiyun 	ret = ddrphy_training(phy_base);
574*4882a593Smuzhiyun 	if (ret)
575*4882a593Smuzhiyun 		return ret;
576*4882a593Smuzhiyun 
577*4882a593Smuzhiyun 	udelay(1);
578*4882a593Smuzhiyun 
579*4882a593Smuzhiyun 	/* match the system latency between UMC and PHY */
580*4882a593Smuzhiyun 	umc_set_system_latency(dc_base,
581*4882a593Smuzhiyun 			       ddrphy_get_system_latency(phy_base, width));
582*4882a593Smuzhiyun 
583*4882a593Smuzhiyun 	udelay(1);
584*4882a593Smuzhiyun 
585*4882a593Smuzhiyun 	/* stop auto refresh before clearing FIFO in PHY */
586*4882a593Smuzhiyun 	umc_refresh_ctrl(dc_base, 0);
587*4882a593Smuzhiyun 	ddrphy_fifo_reset(phy_base);
588*4882a593Smuzhiyun 	umc_refresh_ctrl(dc_base, 1);
589*4882a593Smuzhiyun 
590*4882a593Smuzhiyun 	udelay(10);
591*4882a593Smuzhiyun 
592*4882a593Smuzhiyun 	return 0;
593*4882a593Smuzhiyun }
594*4882a593Smuzhiyun 
um_init(void __iomem * um_base)595*4882a593Smuzhiyun static void um_init(void __iomem *um_base)
596*4882a593Smuzhiyun {
597*4882a593Smuzhiyun 	writel(0x000000ff, um_base + UMC_MBUS0);
598*4882a593Smuzhiyun 	writel(0x000000ff, um_base + UMC_MBUS1);
599*4882a593Smuzhiyun 	writel(0x000000ff, um_base + UMC_MBUS2);
600*4882a593Smuzhiyun 	writel(0x000000ff, um_base + UMC_MBUS3);
601*4882a593Smuzhiyun }
602*4882a593Smuzhiyun 
uniphier_pxs2_umc_init(const struct uniphier_board_data * bd)603*4882a593Smuzhiyun int uniphier_pxs2_umc_init(const struct uniphier_board_data *bd)
604*4882a593Smuzhiyun {
605*4882a593Smuzhiyun 	void __iomem *um_base = (void __iomem *)0x5b600000;
606*4882a593Smuzhiyun 	void __iomem *umc_ch_base = (void __iomem *)0x5b800000;
607*4882a593Smuzhiyun 	enum dram_freq freq;
608*4882a593Smuzhiyun 	int ch, ret;
609*4882a593Smuzhiyun 
610*4882a593Smuzhiyun 	switch (bd->dram_freq) {
611*4882a593Smuzhiyun 	case 1866:
612*4882a593Smuzhiyun 		freq = DRAM_FREQ_1866M;
613*4882a593Smuzhiyun 		break;
614*4882a593Smuzhiyun 	case 2133:
615*4882a593Smuzhiyun 		freq = DRAM_FREQ_2133M;
616*4882a593Smuzhiyun 		break;
617*4882a593Smuzhiyun 	default:
618*4882a593Smuzhiyun 		pr_err("unsupported DRAM frequency %d MHz\n", bd->dram_freq);
619*4882a593Smuzhiyun 		return -EINVAL;
620*4882a593Smuzhiyun 	}
621*4882a593Smuzhiyun 
622*4882a593Smuzhiyun 	for (ch = 0; ch < DRAM_CH_NR; ch++) {
623*4882a593Smuzhiyun 		unsigned long size = bd->dram_ch[ch].size;
624*4882a593Smuzhiyun 		unsigned int width = bd->dram_ch[ch].width;
625*4882a593Smuzhiyun 
626*4882a593Smuzhiyun 		if (size) {
627*4882a593Smuzhiyun 			ret = umc_ch_init(umc_ch_base, freq,
628*4882a593Smuzhiyun 					  size / (width / 16), width, ch);
629*4882a593Smuzhiyun 			if (ret) {
630*4882a593Smuzhiyun 				pr_err("failed to initialize UMC ch%d\n", ch);
631*4882a593Smuzhiyun 				return ret;
632*4882a593Smuzhiyun 			}
633*4882a593Smuzhiyun 		}
634*4882a593Smuzhiyun 
635*4882a593Smuzhiyun 		umc_ch_base += 0x00200000;
636*4882a593Smuzhiyun 	}
637*4882a593Smuzhiyun 
638*4882a593Smuzhiyun 	um_init(um_base);
639*4882a593Smuzhiyun 
640*4882a593Smuzhiyun 	return 0;
641*4882a593Smuzhiyun }
642