xref: /rk3399_ARM-atf/plat/rockchip/rk3399/drivers/dram/suspend.c (revision 2831bc3a5f5dd9cdd6f272044f9f916e68797ff1)
1*2831bc3aSCaesar Wang /*
2*2831bc3aSCaesar Wang  * Copyright (c) 2016, ARM Limited and Contributors. All rights reserved.
3*2831bc3aSCaesar Wang  *
4*2831bc3aSCaesar Wang  * Redistribution and use in source and binary forms, with or without
5*2831bc3aSCaesar Wang  * modification, are permitted provided that the following conditions are met:
6*2831bc3aSCaesar Wang  *
7*2831bc3aSCaesar Wang  * Redistributions of source code must retain the above copyright notice, this
8*2831bc3aSCaesar Wang  * list of conditions and the following disclaimer.
9*2831bc3aSCaesar Wang  *
10*2831bc3aSCaesar Wang  * Redistributions in binary form must reproduce the above copyright notice,
11*2831bc3aSCaesar Wang  * this list of conditions and the following disclaimer in the documentation
12*2831bc3aSCaesar Wang  * and/or other materials provided with the distribution.
13*2831bc3aSCaesar Wang  *
14*2831bc3aSCaesar Wang  * Neither the name of ARM nor the names of its contributors may be used
15*2831bc3aSCaesar Wang  * to endorse or promote products derived from this software without specific
16*2831bc3aSCaesar Wang  * prior written permission.
17*2831bc3aSCaesar Wang  *
18*2831bc3aSCaesar Wang  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19*2831bc3aSCaesar Wang  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20*2831bc3aSCaesar Wang  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21*2831bc3aSCaesar Wang  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
22*2831bc3aSCaesar Wang  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
23*2831bc3aSCaesar Wang  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
24*2831bc3aSCaesar Wang  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
25*2831bc3aSCaesar Wang  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
26*2831bc3aSCaesar Wang  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
27*2831bc3aSCaesar Wang  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
28*2831bc3aSCaesar Wang  * POSSIBILITY OF SUCH DAMAGE.
29*2831bc3aSCaesar Wang  */
30*2831bc3aSCaesar Wang #include <debug.h>
31*2831bc3aSCaesar Wang #include <arch_helpers.h>
32*2831bc3aSCaesar Wang #include <platform_def.h>
33*2831bc3aSCaesar Wang #include <plat_private.h>
34*2831bc3aSCaesar Wang #include <dram.h>
35*2831bc3aSCaesar Wang #include <pmu_regs.h>
36*2831bc3aSCaesar Wang #include <rk3399_def.h>
37*2831bc3aSCaesar Wang #include <soc.h>
38*2831bc3aSCaesar Wang #include <suspend.h>
39*2831bc3aSCaesar Wang 
40*2831bc3aSCaesar Wang #define PMUGRF_OS_REG0			0x300
41*2831bc3aSCaesar Wang #define PMUGRF_OS_REG1			0x304
42*2831bc3aSCaesar Wang #define PMUGRF_OS_REG2			0x308
43*2831bc3aSCaesar Wang #define PMUGRF_OS_REG3			0x30c
44*2831bc3aSCaesar Wang 
45*2831bc3aSCaesar Wang #define CRU_SFTRST_DDR_CTRL(ch, n)	((0x1 << (8 + 16 + (ch) * 4)) | \
46*2831bc3aSCaesar Wang 					 ((n) << (8 + (ch) * 4)))
47*2831bc3aSCaesar Wang #define CRU_SFTRST_DDR_PHY(ch, n)	((0x1 << (9 + 16 + (ch) * 4)) | \
48*2831bc3aSCaesar Wang 					 ((n) << (9 + (ch) * 4)))
49*2831bc3aSCaesar Wang 
50*2831bc3aSCaesar Wang #define FBDIV_ENC(n)			((n) << 16)
51*2831bc3aSCaesar Wang #define FBDIV_DEC(n)			(((n) >> 16) & 0xfff)
52*2831bc3aSCaesar Wang #define POSTDIV2_ENC(n)			((n) << 12)
53*2831bc3aSCaesar Wang #define POSTDIV2_DEC(n)			(((n) >> 12) & 0x7)
54*2831bc3aSCaesar Wang #define POSTDIV1_ENC(n)			((n) << 8)
55*2831bc3aSCaesar Wang #define POSTDIV1_DEC(n)			(((n) >> 8) & 0x7)
56*2831bc3aSCaesar Wang #define REFDIV_ENC(n)			(n)
57*2831bc3aSCaesar Wang #define REFDIV_DEC(n)			((n) & 0x3f)
58*2831bc3aSCaesar Wang 
59*2831bc3aSCaesar Wang /* PMU CRU */
60*2831bc3aSCaesar Wang #define PMUCRU_RSTNHOLD_CON0		0x120
61*2831bc3aSCaesar Wang #define PMUCRU_RSTNHOLD_CON1		0x124
62*2831bc3aSCaesar Wang 
63*2831bc3aSCaesar Wang #define PRESET_GPIO0_HOLD(n)		(((n) << 7) | WMSK_BIT(7))
64*2831bc3aSCaesar Wang #define PRESET_GPIO1_HOLD(n)		(((n) << 8) | WMSK_BIT(8))
65*2831bc3aSCaesar Wang 
66*2831bc3aSCaesar Wang #define SYS_COUNTER_FREQ_IN_MHZ		(SYS_COUNTER_FREQ_IN_TICKS / 1000000)
67*2831bc3aSCaesar Wang 
68*2831bc3aSCaesar Wang /*
69*2831bc3aSCaesar Wang  * Copy @num registers from @src to @dst
70*2831bc3aSCaesar Wang  */
71*2831bc3aSCaesar Wang __sramfunc void sram_regcpy(uintptr_t dst, uintptr_t src, uint32_t num)
72*2831bc3aSCaesar Wang {
73*2831bc3aSCaesar Wang 	while (num--) {
74*2831bc3aSCaesar Wang 		mmio_write_32(dst, mmio_read_32(src));
75*2831bc3aSCaesar Wang 		dst += sizeof(uint32_t);
76*2831bc3aSCaesar Wang 		src += sizeof(uint32_t);
77*2831bc3aSCaesar Wang 	}
78*2831bc3aSCaesar Wang }
79*2831bc3aSCaesar Wang 
80*2831bc3aSCaesar Wang static __sramfunc uint32_t sram_get_timer_value(void)
81*2831bc3aSCaesar Wang {
82*2831bc3aSCaesar Wang 	/*
83*2831bc3aSCaesar Wang 	 * Generic delay timer implementation expects the timer to be a down
84*2831bc3aSCaesar Wang 	 * counter. We apply bitwise NOT operator to the tick values returned
85*2831bc3aSCaesar Wang 	 * by read_cntpct_el0() to simulate the down counter.
86*2831bc3aSCaesar Wang 	 */
87*2831bc3aSCaesar Wang 	return (uint32_t)(~read_cntpct_el0());
88*2831bc3aSCaesar Wang }
89*2831bc3aSCaesar Wang 
90*2831bc3aSCaesar Wang static __sramfunc void sram_udelay(uint32_t usec)
91*2831bc3aSCaesar Wang {
92*2831bc3aSCaesar Wang 	uint32_t start, cnt, delta, delta_us;
93*2831bc3aSCaesar Wang 
94*2831bc3aSCaesar Wang 	/* counter is decreasing */
95*2831bc3aSCaesar Wang 	start = sram_get_timer_value();
96*2831bc3aSCaesar Wang 	do {
97*2831bc3aSCaesar Wang 		cnt = sram_get_timer_value();
98*2831bc3aSCaesar Wang 		if (cnt > start) {
99*2831bc3aSCaesar Wang 			delta = UINT32_MAX - cnt;
100*2831bc3aSCaesar Wang 			delta += start;
101*2831bc3aSCaesar Wang 		} else
102*2831bc3aSCaesar Wang 			delta = start - cnt;
103*2831bc3aSCaesar Wang 		delta_us = (delta * SYS_COUNTER_FREQ_IN_MHZ);
104*2831bc3aSCaesar Wang 	} while (delta_us < usec);
105*2831bc3aSCaesar Wang }
106*2831bc3aSCaesar Wang 
107*2831bc3aSCaesar Wang static __sramfunc void configure_sgrf(void)
108*2831bc3aSCaesar Wang {
109*2831bc3aSCaesar Wang 	/*
110*2831bc3aSCaesar Wang 	 * SGRF_DDR_RGN_DPLL_CLK and SGRF_DDR_RGN_RTC_CLK:
111*2831bc3aSCaesar Wang 	 * IC ECO bug, need to set this register.
112*2831bc3aSCaesar Wang 	 *
113*2831bc3aSCaesar Wang 	 * SGRF_DDR_RGN_BYPS:
114*2831bc3aSCaesar Wang 	 * After the PD_CENTER suspend/resume, the DDR region
115*2831bc3aSCaesar Wang 	 * related registers in the SGRF will be reset, we
116*2831bc3aSCaesar Wang 	 * need to re-initialize them.
117*2831bc3aSCaesar Wang 	 */
118*2831bc3aSCaesar Wang 	mmio_write_32(SGRF_BASE + SGRF_DDRRGN_CON0_16(16),
119*2831bc3aSCaesar Wang 		      SGRF_DDR_RGN_DPLL_CLK |
120*2831bc3aSCaesar Wang 		      SGRF_DDR_RGN_RTC_CLK |
121*2831bc3aSCaesar Wang 		      SGRF_DDR_RGN_BYPS);
122*2831bc3aSCaesar Wang }
123*2831bc3aSCaesar Wang 
124*2831bc3aSCaesar Wang static __sramfunc void rkclk_ddr_reset(uint32_t channel, uint32_t ctl,
125*2831bc3aSCaesar Wang 		uint32_t phy)
126*2831bc3aSCaesar Wang {
127*2831bc3aSCaesar Wang 	channel &= 0x1;
128*2831bc3aSCaesar Wang 	ctl &= 0x1;
129*2831bc3aSCaesar Wang 	phy &= 0x1;
130*2831bc3aSCaesar Wang 	mmio_write_32(CRU_BASE + CRU_SOFTRST_CON(4),
131*2831bc3aSCaesar Wang 		      CRU_SFTRST_DDR_CTRL(channel, ctl) |
132*2831bc3aSCaesar Wang 		      CRU_SFTRST_DDR_PHY(channel, phy));
133*2831bc3aSCaesar Wang }
134*2831bc3aSCaesar Wang 
135*2831bc3aSCaesar Wang static __sramfunc void phy_pctrl_reset(uint32_t ch)
136*2831bc3aSCaesar Wang {
137*2831bc3aSCaesar Wang 	rkclk_ddr_reset(ch, 1, 1);
138*2831bc3aSCaesar Wang 	sram_udelay(10);
139*2831bc3aSCaesar Wang 	rkclk_ddr_reset(ch, 1, 0);
140*2831bc3aSCaesar Wang 	sram_udelay(10);
141*2831bc3aSCaesar Wang 	rkclk_ddr_reset(ch, 0, 0);
142*2831bc3aSCaesar Wang 	sram_udelay(10);
143*2831bc3aSCaesar Wang }
144*2831bc3aSCaesar Wang 
145*2831bc3aSCaesar Wang static __sramfunc void phy_dll_bypass_set(uint32_t ch, uint32_t hz)
146*2831bc3aSCaesar Wang {
147*2831bc3aSCaesar Wang 	if (hz <= 125 * MHz) {
148*2831bc3aSCaesar Wang 		/* phy_sw_master_mode_X PHY_86/214/342/470 4bits offset_8 */
149*2831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 86), (0x3 << 2) << 8);
150*2831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 214), (0x3 << 2) << 8);
151*2831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 342), (0x3 << 2) << 8);
152*2831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 470), (0x3 << 2) << 8);
153*2831bc3aSCaesar Wang 		/* phy_adrctl_sw_master_mode PHY_547/675/803 4bits offset_16 */
154*2831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 547), (0x3 << 2) << 16);
155*2831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 675), (0x3 << 2) << 16);
156*2831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 803), (0x3 << 2) << 16);
157*2831bc3aSCaesar Wang 	} else {
158*2831bc3aSCaesar Wang 		/* phy_sw_master_mode_X PHY_86/214/342/470 4bits offset_8 */
159*2831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 86), (0x3 << 2) << 8);
160*2831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 214), (0x3 << 2) << 8);
161*2831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 342), (0x3 << 2) << 8);
162*2831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 470), (0x3 << 2) << 8);
163*2831bc3aSCaesar Wang 		/* phy_adrctl_sw_master_mode PHY_547/675/803 4bits offset_16 */
164*2831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 547), (0x3 << 2) << 16);
165*2831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 675), (0x3 << 2) << 16);
166*2831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 803), (0x3 << 2) << 16);
167*2831bc3aSCaesar Wang 	}
168*2831bc3aSCaesar Wang }
169*2831bc3aSCaesar Wang 
170*2831bc3aSCaesar Wang static __sramfunc void set_cs_training_index(uint32_t ch, uint32_t rank)
171*2831bc3aSCaesar Wang {
172*2831bc3aSCaesar Wang 	/* PHY_8/136/264/392 phy_per_cs_training_index_X 1bit offset_24 */
173*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 8), 0x1 << 24, rank << 24);
174*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 136), 0x1 << 24, rank << 24);
175*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 264), 0x1 << 24, rank << 24);
176*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 392), 0x1 << 24, rank << 24);
177*2831bc3aSCaesar Wang }
178*2831bc3aSCaesar Wang 
179*2831bc3aSCaesar Wang static __sramfunc void select_per_cs_training_index(uint32_t ch, uint32_t rank)
180*2831bc3aSCaesar Wang {
181*2831bc3aSCaesar Wang 	/* PHY_84 PHY_PER_CS_TRAINING_EN_0 1bit offset_16 */
182*2831bc3aSCaesar Wang 	if ((mmio_read_32(PHY_REG(ch, 84)) >> 16) & 1)
183*2831bc3aSCaesar Wang 		set_cs_training_index(ch, rank);
184*2831bc3aSCaesar Wang }
185*2831bc3aSCaesar Wang 
186*2831bc3aSCaesar Wang static void override_write_leveling_value(uint32_t ch)
187*2831bc3aSCaesar Wang {
188*2831bc3aSCaesar Wang 	uint32_t byte;
189*2831bc3aSCaesar Wang 
190*2831bc3aSCaesar Wang 	/* PHY_896 PHY_FREQ_SEL_MULTICAST_EN 1bit offset_0 */
191*2831bc3aSCaesar Wang 	mmio_setbits_32(PHY_REG(ch, 896), 1);
192*2831bc3aSCaesar Wang 
193*2831bc3aSCaesar Wang 	/*
194*2831bc3aSCaesar Wang 	 * PHY_8/136/264/392
195*2831bc3aSCaesar Wang 	 * phy_per_cs_training_multicast_en_X 1bit offset_16
196*2831bc3aSCaesar Wang 	 */
197*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 8), 0x1 << 16, 1 << 16);
198*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 136), 0x1 << 16, 1 << 16);
199*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 264), 0x1 << 16, 1 << 16);
200*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 392), 0x1 << 16, 1 << 16);
201*2831bc3aSCaesar Wang 
202*2831bc3aSCaesar Wang 	for (byte = 0; byte < 4; byte++)
203*2831bc3aSCaesar Wang 		mmio_clrsetbits_32(PHY_REG(ch, 63 + (128 * byte)),
204*2831bc3aSCaesar Wang 				   0xffff << 16,
205*2831bc3aSCaesar Wang 				   0x200 << 16);
206*2831bc3aSCaesar Wang 
207*2831bc3aSCaesar Wang 	/* PHY_896 PHY_FREQ_SEL_MULTICAST_EN 1bit offset_0 */
208*2831bc3aSCaesar Wang 	mmio_clrbits_32(PHY_REG(ch, 896), 1);
209*2831bc3aSCaesar Wang 
210*2831bc3aSCaesar Wang 	/* CTL_200 ctrlupd_req 1bit offset_8 */
211*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(CTL_REG(ch, 200), 0x1 << 8, 0x1 << 8);
212*2831bc3aSCaesar Wang }
213*2831bc3aSCaesar Wang 
214*2831bc3aSCaesar Wang static __sramfunc int data_training(uint32_t ch,
215*2831bc3aSCaesar Wang 		struct rk3399_sdram_params *sdram_params,
216*2831bc3aSCaesar Wang 		uint32_t training_flag)
217*2831bc3aSCaesar Wang {
218*2831bc3aSCaesar Wang 	uint32_t obs_0, obs_1, obs_2, obs_3, obs_err = 0;
219*2831bc3aSCaesar Wang 	uint32_t rank = sdram_params->ch[ch].rank;
220*2831bc3aSCaesar Wang 	uint32_t rank_mask;
221*2831bc3aSCaesar Wang 	uint32_t i, tmp;
222*2831bc3aSCaesar Wang 
223*2831bc3aSCaesar Wang 	if (sdram_params->dramtype == LPDDR4)
224*2831bc3aSCaesar Wang 		rank_mask = (rank == 1) ? 0x5 : 0xf;
225*2831bc3aSCaesar Wang 	else
226*2831bc3aSCaesar Wang 		rank_mask = (rank == 1) ? 0x1 : 0x3;
227*2831bc3aSCaesar Wang 
228*2831bc3aSCaesar Wang 	/* PHY_927 PHY_PAD_DQS_DRIVE  RPULL offset_22 */
229*2831bc3aSCaesar Wang 	mmio_setbits_32(PHY_REG(ch, 927), (1 << 22));
230*2831bc3aSCaesar Wang 
231*2831bc3aSCaesar Wang 	if (training_flag == PI_FULL_TRAINING) {
232*2831bc3aSCaesar Wang 		if (sdram_params->dramtype == LPDDR4) {
233*2831bc3aSCaesar Wang 			training_flag = PI_WRITE_LEVELING |
234*2831bc3aSCaesar Wang 					PI_READ_GATE_TRAINING |
235*2831bc3aSCaesar Wang 					PI_READ_LEVELING |
236*2831bc3aSCaesar Wang 					PI_WDQ_LEVELING;
237*2831bc3aSCaesar Wang 		} else if (sdram_params->dramtype == LPDDR3) {
238*2831bc3aSCaesar Wang 			training_flag = PI_CA_TRAINING | PI_WRITE_LEVELING |
239*2831bc3aSCaesar Wang 					PI_READ_GATE_TRAINING;
240*2831bc3aSCaesar Wang 		} else if (sdram_params->dramtype == DDR3) {
241*2831bc3aSCaesar Wang 			training_flag = PI_WRITE_LEVELING |
242*2831bc3aSCaesar Wang 					PI_READ_GATE_TRAINING |
243*2831bc3aSCaesar Wang 					PI_READ_LEVELING;
244*2831bc3aSCaesar Wang 		}
245*2831bc3aSCaesar Wang 	}
246*2831bc3aSCaesar Wang 
247*2831bc3aSCaesar Wang 	/* ca training(LPDDR4,LPDDR3 support) */
248*2831bc3aSCaesar Wang 	if ((training_flag & PI_CA_TRAINING) == PI_CA_TRAINING) {
249*2831bc3aSCaesar Wang 		for (i = 0; i < 4; i++) {
250*2831bc3aSCaesar Wang 			if (!(rank_mask & (1 << i)))
251*2831bc3aSCaesar Wang 				continue;
252*2831bc3aSCaesar Wang 
253*2831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
254*2831bc3aSCaesar Wang 			/* PI_100 PI_CALVL_EN:RW:8:2 */
255*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 100), 0x3 << 8, 0x2 << 8);
256*2831bc3aSCaesar Wang 
257*2831bc3aSCaesar Wang 			/* PI_92 PI_CALVL_REQ:WR:16:1,PI_CALVL_CS:RW:24:2 */
258*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 92),
259*2831bc3aSCaesar Wang 					   (0x1 << 16) | (0x3 << 24),
260*2831bc3aSCaesar Wang 					   (0x1 << 16) | (i << 24));
261*2831bc3aSCaesar Wang 			while (1) {
262*2831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
263*2831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
264*2831bc3aSCaesar Wang 
265*2831bc3aSCaesar Wang 				/*
266*2831bc3aSCaesar Wang 				 * check status obs
267*2831bc3aSCaesar Wang 				 * PHY_532/660/788 phy_adr_calvl_obs1_:0:32
268*2831bc3aSCaesar Wang 				 */
269*2831bc3aSCaesar Wang 				obs_0 = mmio_read_32(PHY_REG(ch, 532));
270*2831bc3aSCaesar Wang 				obs_1 = mmio_read_32(PHY_REG(ch, 660));
271*2831bc3aSCaesar Wang 				obs_2 = mmio_read_32(PHY_REG(ch, 788));
272*2831bc3aSCaesar Wang 				if (((obs_0 >> 30) & 0x3) ||
273*2831bc3aSCaesar Wang 				    ((obs_1 >> 30) & 0x3) ||
274*2831bc3aSCaesar Wang 				    ((obs_2 >> 30) & 0x3))
275*2831bc3aSCaesar Wang 					obs_err = 1;
276*2831bc3aSCaesar Wang 				if ((((tmp >> 11) & 0x1) == 0x1) &&
277*2831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
278*2831bc3aSCaesar Wang 				    (((tmp >> 5) & 0x1) == 0x0) &&
279*2831bc3aSCaesar Wang 				    (obs_err == 0))
280*2831bc3aSCaesar Wang 					break;
281*2831bc3aSCaesar Wang 				else if ((((tmp >> 5) & 0x1) == 0x1) ||
282*2831bc3aSCaesar Wang 					 (obs_err == 1))
283*2831bc3aSCaesar Wang 					return -1;
284*2831bc3aSCaesar Wang 			}
285*2831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
286*2831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
287*2831bc3aSCaesar Wang 		}
288*2831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 100), 0x3 << 8);
289*2831bc3aSCaesar Wang 	}
290*2831bc3aSCaesar Wang 
291*2831bc3aSCaesar Wang 	/* write leveling(LPDDR4,LPDDR3,DDR3 support) */
292*2831bc3aSCaesar Wang 	if ((training_flag & PI_WRITE_LEVELING) == PI_WRITE_LEVELING) {
293*2831bc3aSCaesar Wang 		for (i = 0; i < rank; i++) {
294*2831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
295*2831bc3aSCaesar Wang 			/* PI_60 PI_WRLVL_EN:RW:8:2 */
296*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 60), 0x3 << 8, 0x2 << 8);
297*2831bc3aSCaesar Wang 			/* PI_59 PI_WRLVL_REQ:WR:8:1,PI_WRLVL_CS:RW:16:2 */
298*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 59),
299*2831bc3aSCaesar Wang 					   (0x1 << 8) | (0x3 << 16),
300*2831bc3aSCaesar Wang 					   (0x1 << 8) | (i << 16));
301*2831bc3aSCaesar Wang 
302*2831bc3aSCaesar Wang 			while (1) {
303*2831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
304*2831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
305*2831bc3aSCaesar Wang 
306*2831bc3aSCaesar Wang 				/*
307*2831bc3aSCaesar Wang 				 * check status obs, if error maybe can not
308*2831bc3aSCaesar Wang 				 * get leveling done PHY_40/168/296/424
309*2831bc3aSCaesar Wang 				 * phy_wrlvl_status_obs_X:0:13
310*2831bc3aSCaesar Wang 				 */
311*2831bc3aSCaesar Wang 				obs_0 = mmio_read_32(PHY_REG(ch, 40));
312*2831bc3aSCaesar Wang 				obs_1 = mmio_read_32(PHY_REG(ch, 168));
313*2831bc3aSCaesar Wang 				obs_2 = mmio_read_32(PHY_REG(ch, 296));
314*2831bc3aSCaesar Wang 				obs_3 = mmio_read_32(PHY_REG(ch, 424));
315*2831bc3aSCaesar Wang 				if (((obs_0 >> 12) & 0x1) ||
316*2831bc3aSCaesar Wang 				    ((obs_1 >> 12) & 0x1) ||
317*2831bc3aSCaesar Wang 				    ((obs_2 >> 12) & 0x1) ||
318*2831bc3aSCaesar Wang 				    ((obs_3 >> 12) & 0x1))
319*2831bc3aSCaesar Wang 					obs_err = 1;
320*2831bc3aSCaesar Wang 				if ((((tmp >> 10) & 0x1) == 0x1) &&
321*2831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
322*2831bc3aSCaesar Wang 				    (((tmp >> 4) & 0x1) == 0x0) &&
323*2831bc3aSCaesar Wang 				    (obs_err == 0))
324*2831bc3aSCaesar Wang 					break;
325*2831bc3aSCaesar Wang 				else if ((((tmp >> 4) & 0x1) == 0x1) ||
326*2831bc3aSCaesar Wang 					 (obs_err == 1))
327*2831bc3aSCaesar Wang 					return -1;
328*2831bc3aSCaesar Wang 			}
329*2831bc3aSCaesar Wang 
330*2831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
331*2831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
332*2831bc3aSCaesar Wang 		}
333*2831bc3aSCaesar Wang 		override_write_leveling_value(ch);
334*2831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 60), 0x3 << 8);
335*2831bc3aSCaesar Wang 	}
336*2831bc3aSCaesar Wang 
337*2831bc3aSCaesar Wang 	/* read gate training(LPDDR4,LPDDR3,DDR3 support) */
338*2831bc3aSCaesar Wang 	if ((training_flag & PI_READ_GATE_TRAINING) == PI_READ_GATE_TRAINING) {
339*2831bc3aSCaesar Wang 		for (i = 0; i < rank; i++) {
340*2831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
341*2831bc3aSCaesar Wang 			/* PI_80 PI_RDLVL_GATE_EN:RW:24:2 */
342*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 80), 0x3 << 24,
343*2831bc3aSCaesar Wang 					   0x2 << 24);
344*2831bc3aSCaesar Wang 			/*
345*2831bc3aSCaesar Wang 			 * PI_74 PI_RDLVL_GATE_REQ:WR:16:1
346*2831bc3aSCaesar Wang 			 * PI_RDLVL_CS:RW:24:2
347*2831bc3aSCaesar Wang 			 */
348*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 74),
349*2831bc3aSCaesar Wang 					   (0x1 << 16) | (0x3 << 24),
350*2831bc3aSCaesar Wang 					   (0x1 << 16) | (i << 24));
351*2831bc3aSCaesar Wang 
352*2831bc3aSCaesar Wang 			while (1) {
353*2831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
354*2831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
355*2831bc3aSCaesar Wang 
356*2831bc3aSCaesar Wang 				/*
357*2831bc3aSCaesar Wang 				 * check status obs
358*2831bc3aSCaesar Wang 				 * PHY_43/171/299/427
359*2831bc3aSCaesar Wang 				 *     PHY_GTLVL_STATUS_OBS_x:16:8
360*2831bc3aSCaesar Wang 				 */
361*2831bc3aSCaesar Wang 				obs_0 = mmio_read_32(PHY_REG(ch, 43));
362*2831bc3aSCaesar Wang 				obs_1 = mmio_read_32(PHY_REG(ch, 171));
363*2831bc3aSCaesar Wang 				obs_2 = mmio_read_32(PHY_REG(ch, 299));
364*2831bc3aSCaesar Wang 				obs_3 = mmio_read_32(PHY_REG(ch, 427));
365*2831bc3aSCaesar Wang 				if (((obs_0 >> (16 + 6)) & 0x3) ||
366*2831bc3aSCaesar Wang 				    ((obs_1 >> (16 + 6)) & 0x3) ||
367*2831bc3aSCaesar Wang 				    ((obs_2 >> (16 + 6)) & 0x3) ||
368*2831bc3aSCaesar Wang 				    ((obs_3 >> (16 + 6)) & 0x3))
369*2831bc3aSCaesar Wang 					obs_err = 1;
370*2831bc3aSCaesar Wang 				if ((((tmp >> 9) & 0x1) == 0x1) &&
371*2831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
372*2831bc3aSCaesar Wang 				    (((tmp >> 3) & 0x1) == 0x0) &&
373*2831bc3aSCaesar Wang 				    (obs_err == 0))
374*2831bc3aSCaesar Wang 					break;
375*2831bc3aSCaesar Wang 				else if ((((tmp >> 3) & 0x1) == 0x1) ||
376*2831bc3aSCaesar Wang 					 (obs_err == 1))
377*2831bc3aSCaesar Wang 					return -1;
378*2831bc3aSCaesar Wang 			}
379*2831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
380*2831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
381*2831bc3aSCaesar Wang 		}
382*2831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 80), 0x3 << 24);
383*2831bc3aSCaesar Wang 	}
384*2831bc3aSCaesar Wang 
385*2831bc3aSCaesar Wang 	/* read leveling(LPDDR4,LPDDR3,DDR3 support) */
386*2831bc3aSCaesar Wang 	if ((training_flag & PI_READ_LEVELING) == PI_READ_LEVELING) {
387*2831bc3aSCaesar Wang 		for (i = 0; i < rank; i++) {
388*2831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
389*2831bc3aSCaesar Wang 			/* PI_80 PI_RDLVL_EN:RW:16:2 */
390*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 80), 0x3 << 16,
391*2831bc3aSCaesar Wang 					   0x2 << 16);
392*2831bc3aSCaesar Wang 			/* PI_74 PI_RDLVL_REQ:WR:8:1,PI_RDLVL_CS:RW:24:2 */
393*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 74),
394*2831bc3aSCaesar Wang 					   (0x1 << 8) | (0x3 << 24),
395*2831bc3aSCaesar Wang 					   (0x1 << 8) | (i << 24));
396*2831bc3aSCaesar Wang 			while (1) {
397*2831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
398*2831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
399*2831bc3aSCaesar Wang 
400*2831bc3aSCaesar Wang 				/*
401*2831bc3aSCaesar Wang 				 * make sure status obs not report error bit
402*2831bc3aSCaesar Wang 				 * PHY_46/174/302/430
403*2831bc3aSCaesar Wang 				 *     phy_rdlvl_status_obs_X:16:8
404*2831bc3aSCaesar Wang 				 */
405*2831bc3aSCaesar Wang 				if ((((tmp >> 8) & 0x1) == 0x1) &&
406*2831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
407*2831bc3aSCaesar Wang 				    (((tmp >> 2) & 0x1) == 0x0))
408*2831bc3aSCaesar Wang 					break;
409*2831bc3aSCaesar Wang 				else if (((tmp >> 2) & 0x1) == 0x1)
410*2831bc3aSCaesar Wang 					return -1;
411*2831bc3aSCaesar Wang 			}
412*2831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
413*2831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
414*2831bc3aSCaesar Wang 		}
415*2831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 80), 0x3 << 16);
416*2831bc3aSCaesar Wang 	}
417*2831bc3aSCaesar Wang 
418*2831bc3aSCaesar Wang 	/* wdq leveling(LPDDR4 support) */
419*2831bc3aSCaesar Wang 	if ((training_flag & PI_WDQ_LEVELING) == PI_WDQ_LEVELING) {
420*2831bc3aSCaesar Wang 		for (i = 0; i < 4; i++) {
421*2831bc3aSCaesar Wang 			if (!(rank_mask & (1 << i)))
422*2831bc3aSCaesar Wang 				continue;
423*2831bc3aSCaesar Wang 
424*2831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
425*2831bc3aSCaesar Wang 			/*
426*2831bc3aSCaesar Wang 			 * disable PI_WDQLVL_VREF_EN before wdq leveling?
427*2831bc3aSCaesar Wang 			 * PI_181 PI_WDQLVL_VREF_EN:RW:8:1
428*2831bc3aSCaesar Wang 			 */
429*2831bc3aSCaesar Wang 			mmio_clrbits_32(PI_REG(ch, 181), 0x1 << 8);
430*2831bc3aSCaesar Wang 			/* PI_124 PI_WDQLVL_EN:RW:16:2 */
431*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 124), 0x3 << 16,
432*2831bc3aSCaesar Wang 					   0x2 << 16);
433*2831bc3aSCaesar Wang 			/* PI_121 PI_WDQLVL_REQ:WR:8:1,PI_WDQLVL_CS:RW:16:2 */
434*2831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 121),
435*2831bc3aSCaesar Wang 					   (0x1 << 8) | (0x3 << 16),
436*2831bc3aSCaesar Wang 					   (0x1 << 8) | (i << 16));
437*2831bc3aSCaesar Wang 			while (1) {
438*2831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
439*2831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
440*2831bc3aSCaesar Wang 				if ((((tmp >> 12) & 0x1) == 0x1) &&
441*2831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
442*2831bc3aSCaesar Wang 				    (((tmp >> 6) & 0x1) == 0x0))
443*2831bc3aSCaesar Wang 					break;
444*2831bc3aSCaesar Wang 				else if (((tmp >> 6) & 0x1) == 0x1)
445*2831bc3aSCaesar Wang 					return -1;
446*2831bc3aSCaesar Wang 			}
447*2831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
448*2831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
449*2831bc3aSCaesar Wang 		}
450*2831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 124), 0x3 << 16);
451*2831bc3aSCaesar Wang 	}
452*2831bc3aSCaesar Wang 
453*2831bc3aSCaesar Wang 	/* PHY_927 PHY_PAD_DQS_DRIVE  RPULL offset_22 */
454*2831bc3aSCaesar Wang 	mmio_clrbits_32(PHY_REG(ch, 927), (1 << 22));
455*2831bc3aSCaesar Wang 
456*2831bc3aSCaesar Wang 	return 0;
457*2831bc3aSCaesar Wang }
458*2831bc3aSCaesar Wang 
459*2831bc3aSCaesar Wang static __sramfunc void set_ddrconfig(struct rk3399_sdram_params *sdram_params,
460*2831bc3aSCaesar Wang 		unsigned char channel, uint32_t ddrconfig)
461*2831bc3aSCaesar Wang {
462*2831bc3aSCaesar Wang 	/* only need to set ddrconfig */
463*2831bc3aSCaesar Wang 	struct rk3399_sdram_channel *ch = &sdram_params->ch[channel];
464*2831bc3aSCaesar Wang 	unsigned int cs0_cap = 0;
465*2831bc3aSCaesar Wang 	unsigned int cs1_cap = 0;
466*2831bc3aSCaesar Wang 
467*2831bc3aSCaesar Wang 	cs0_cap = (1 << (ch->cs0_row + ch->col + ch->bk + ch->bw - 20));
468*2831bc3aSCaesar Wang 	if (ch->rank > 1)
469*2831bc3aSCaesar Wang 		cs1_cap = cs0_cap >> (ch->cs0_row - ch->cs1_row);
470*2831bc3aSCaesar Wang 	if (ch->row_3_4) {
471*2831bc3aSCaesar Wang 		cs0_cap = cs0_cap * 3 / 4;
472*2831bc3aSCaesar Wang 		cs1_cap = cs1_cap * 3 / 4;
473*2831bc3aSCaesar Wang 	}
474*2831bc3aSCaesar Wang 
475*2831bc3aSCaesar Wang 	mmio_write_32(MSCH_BASE(channel) + MSCH_DEVICECONF,
476*2831bc3aSCaesar Wang 		      ddrconfig | (ddrconfig << 6));
477*2831bc3aSCaesar Wang 	mmio_write_32(MSCH_BASE(channel) + MSCH_DEVICESIZE,
478*2831bc3aSCaesar Wang 		      ((cs0_cap / 32) & 0xff) | (((cs1_cap / 32) & 0xff) << 8));
479*2831bc3aSCaesar Wang }
480*2831bc3aSCaesar Wang 
481*2831bc3aSCaesar Wang static __sramfunc void dram_all_config(struct rk3399_sdram_params *sdram_params)
482*2831bc3aSCaesar Wang {
483*2831bc3aSCaesar Wang 	unsigned int i;
484*2831bc3aSCaesar Wang 
485*2831bc3aSCaesar Wang 	for (i = 0; i < 2; i++) {
486*2831bc3aSCaesar Wang 		struct rk3399_sdram_channel *info = &sdram_params->ch[i];
487*2831bc3aSCaesar Wang 		struct rk3399_msch_timings *noc = &info->noc_timings;
488*2831bc3aSCaesar Wang 
489*2831bc3aSCaesar Wang 		if (sdram_params->ch[i].col == 0)
490*2831bc3aSCaesar Wang 			continue;
491*2831bc3aSCaesar Wang 
492*2831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DDRTIMINGA0,
493*2831bc3aSCaesar Wang 			      noc->ddrtiminga0.d32);
494*2831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DDRTIMINGB0,
495*2831bc3aSCaesar Wang 			      noc->ddrtimingb0.d32);
496*2831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DDRTIMINGC0,
497*2831bc3aSCaesar Wang 			      noc->ddrtimingc0.d32);
498*2831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DEVTODEV0,
499*2831bc3aSCaesar Wang 			      noc->devtodev0.d32);
500*2831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DDRMODE, noc->ddrmode.d32);
501*2831bc3aSCaesar Wang 
502*2831bc3aSCaesar Wang 		/* rank 1 memory clock disable (dfi_dram_clk_disable = 1) */
503*2831bc3aSCaesar Wang 		if (sdram_params->ch[i].rank == 1)
504*2831bc3aSCaesar Wang 			mmio_setbits_32(CTL_REG(i, 276), 1 << 17);
505*2831bc3aSCaesar Wang 	}
506*2831bc3aSCaesar Wang 
507*2831bc3aSCaesar Wang 	DDR_STRIDE(sdram_params->stride);
508*2831bc3aSCaesar Wang 
509*2831bc3aSCaesar Wang 	/* reboot hold register set */
510*2831bc3aSCaesar Wang 	mmio_write_32(PMUCRU_BASE + CRU_PMU_RSTHOLD_CON(1),
511*2831bc3aSCaesar Wang 		      CRU_PMU_SGRF_RST_RLS |
512*2831bc3aSCaesar Wang 		      PRESET_GPIO0_HOLD(1) |
513*2831bc3aSCaesar Wang 		      PRESET_GPIO1_HOLD(1));
514*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(CRU_BASE + CRU_GLB_RST_CON, 0x3, 0x3);
515*2831bc3aSCaesar Wang }
516*2831bc3aSCaesar Wang 
517*2831bc3aSCaesar Wang static __sramfunc void pctl_cfg(uint32_t ch,
518*2831bc3aSCaesar Wang 		struct rk3399_sdram_params *sdram_params)
519*2831bc3aSCaesar Wang {
520*2831bc3aSCaesar Wang 	const uint32_t *params_ctl = sdram_params->pctl_regs.denali_ctl;
521*2831bc3aSCaesar Wang 	const uint32_t *params_phy = sdram_params->phy_regs.denali_phy;
522*2831bc3aSCaesar Wang 	const uint32_t *params_pi = sdram_params->pi_regs.denali_pi;
523*2831bc3aSCaesar Wang 	uint32_t tmp, tmp1, tmp2;
524*2831bc3aSCaesar Wang 
525*2831bc3aSCaesar Wang 	/*
526*2831bc3aSCaesar Wang 	 * Workaround controller bug:
527*2831bc3aSCaesar Wang 	 * Do not program DRAM_CLASS until NO_PHY_IND_TRAIN_INT is programmed
528*2831bc3aSCaesar Wang 	 */
529*2831bc3aSCaesar Wang 	sram_regcpy(CTL_REG(ch, 1), (uintptr_t)&params_ctl[1],
530*2831bc3aSCaesar Wang 		    CTL_REG_NUM - 1);
531*2831bc3aSCaesar Wang 	mmio_write_32(CTL_REG(ch, 0), params_ctl[0]);
532*2831bc3aSCaesar Wang 	sram_regcpy(PI_REG(ch, 0), (uintptr_t)&params_pi[0],
533*2831bc3aSCaesar Wang 		    PI_REG_NUM);
534*2831bc3aSCaesar Wang 
535*2831bc3aSCaesar Wang 	mmio_write_32(PHY_REG(ch, 910), params_phy[910]);
536*2831bc3aSCaesar Wang 	mmio_write_32(PHY_REG(ch, 911), params_phy[911]);
537*2831bc3aSCaesar Wang 	mmio_write_32(PHY_REG(ch, 912), params_phy[912]);
538*2831bc3aSCaesar Wang 
539*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(CTL_REG(ch, 68), PWRUP_SREFRESH_EXIT,
540*2831bc3aSCaesar Wang 				PWRUP_SREFRESH_EXIT);
541*2831bc3aSCaesar Wang 
542*2831bc3aSCaesar Wang 	/* PHY_DLL_RST_EN */
543*2831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 957), 0x3 << 24, 1 << 24);
544*2831bc3aSCaesar Wang 	dmbst();
545*2831bc3aSCaesar Wang 
546*2831bc3aSCaesar Wang 	mmio_setbits_32(PI_REG(ch, 0), START);
547*2831bc3aSCaesar Wang 	mmio_setbits_32(CTL_REG(ch, 0), START);
548*2831bc3aSCaesar Wang 
549*2831bc3aSCaesar Wang 	/* wait lock */
550*2831bc3aSCaesar Wang 	while (1) {
551*2831bc3aSCaesar Wang 		tmp = mmio_read_32(PHY_REG(ch, 920));
552*2831bc3aSCaesar Wang 		tmp1 = mmio_read_32(PHY_REG(ch, 921));
553*2831bc3aSCaesar Wang 		tmp2 = mmio_read_32(PHY_REG(ch, 922));
554*2831bc3aSCaesar Wang 		if ((((tmp >> 16) & 0x1) == 0x1) &&
555*2831bc3aSCaesar Wang 		     (((tmp1 >> 16) & 0x1) == 0x1) &&
556*2831bc3aSCaesar Wang 		     (((tmp1 >> 0) & 0x1) == 0x1) &&
557*2831bc3aSCaesar Wang 		     (((tmp2 >> 0) & 0x1) == 0x1))
558*2831bc3aSCaesar Wang 			break;
559*2831bc3aSCaesar Wang 		/* if PLL bypass,don't need wait lock */
560*2831bc3aSCaesar Wang 		if (mmio_read_32(PHY_REG(ch, 911)) & 0x1)
561*2831bc3aSCaesar Wang 			break;
562*2831bc3aSCaesar Wang 	}
563*2831bc3aSCaesar Wang 
564*2831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 896), (uintptr_t)&params_phy[896], 63);
565*2831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 0), (uintptr_t)&params_phy[0], 91);
566*2831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 128), (uintptr_t)&params_phy[128], 91);
567*2831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 256), (uintptr_t)&params_phy[256], 91);
568*2831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 384), (uintptr_t)&params_phy[384], 91);
569*2831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 512), (uintptr_t)&params_phy[512], 38);
570*2831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 640), (uintptr_t)&params_phy[640], 38);
571*2831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 768), (uintptr_t)&params_phy[768], 38);
572*2831bc3aSCaesar Wang }
573*2831bc3aSCaesar Wang 
574*2831bc3aSCaesar Wang static __sramfunc int dram_switch_to_phy_index1(
575*2831bc3aSCaesar Wang 		struct rk3399_sdram_params *sdram_params)
576*2831bc3aSCaesar Wang {
577*2831bc3aSCaesar Wang 	uint32_t ch, ch_count;
578*2831bc3aSCaesar Wang 
579*2831bc3aSCaesar Wang 	mmio_write_32(CIC_BASE + CIC_CTRL0,
580*2831bc3aSCaesar Wang 		      (((0x3 << 4) | (1 << 2) | 1) << 16) |
581*2831bc3aSCaesar Wang 		      (1 << 4) | (1 << 2) | 1);
582*2831bc3aSCaesar Wang 	while (!(mmio_read_32(CIC_BASE + CIC_STATUS0) & (1 << 2)))
583*2831bc3aSCaesar Wang 		;
584*2831bc3aSCaesar Wang 
585*2831bc3aSCaesar Wang 	mmio_write_32(CIC_BASE + CIC_CTRL0, 0x20002);
586*2831bc3aSCaesar Wang 	while (!(mmio_read_32(CIC_BASE + CIC_STATUS0) & (1 << 0)))
587*2831bc3aSCaesar Wang 		;
588*2831bc3aSCaesar Wang 
589*2831bc3aSCaesar Wang 	ch_count = sdram_params->num_channels;
590*2831bc3aSCaesar Wang 
591*2831bc3aSCaesar Wang 	/* LPDDR4 f2 cann't do training, all training will fail */
592*2831bc3aSCaesar Wang 	for (ch = 0; ch < ch_count; ch++) {
593*2831bc3aSCaesar Wang 		mmio_clrsetbits_32(PHY_REG(ch, 896), (0x3 << 8) | 1,
594*2831bc3aSCaesar Wang 				   1 << 8);
595*2831bc3aSCaesar Wang 
596*2831bc3aSCaesar Wang 		/* data_training failed */
597*2831bc3aSCaesar Wang 		if (data_training(ch, sdram_params, PI_FULL_TRAINING))
598*2831bc3aSCaesar Wang 			return -1;
599*2831bc3aSCaesar Wang 	}
600*2831bc3aSCaesar Wang 
601*2831bc3aSCaesar Wang 	return 0;
602*2831bc3aSCaesar Wang }
603*2831bc3aSCaesar Wang 
604*2831bc3aSCaesar Wang /*
605*2831bc3aSCaesar Wang  * Needs to be done for both channels at once in case of a shared reset signal
606*2831bc3aSCaesar Wang  * between channels.
607*2831bc3aSCaesar Wang  */
608*2831bc3aSCaesar Wang static __sramfunc int pctl_start(uint32_t channel_mask,
609*2831bc3aSCaesar Wang 		struct rk3399_sdram_params *sdram_params)
610*2831bc3aSCaesar Wang {
611*2831bc3aSCaesar Wang 	uint32_t count;
612*2831bc3aSCaesar Wang 
613*2831bc3aSCaesar Wang 	mmio_setbits_32(CTL_REG(0, 68), PWRUP_SREFRESH_EXIT);
614*2831bc3aSCaesar Wang 	mmio_setbits_32(CTL_REG(1, 68), PWRUP_SREFRESH_EXIT);
615*2831bc3aSCaesar Wang 
616*2831bc3aSCaesar Wang 	/* need de-access IO retention before controller START */
617*2831bc3aSCaesar Wang 	if (channel_mask & (1 << 0))
618*2831bc3aSCaesar Wang 		mmio_setbits_32(PMU_BASE + PMU_PWRMODE_CON, (1 << 19));
619*2831bc3aSCaesar Wang 	if (channel_mask & (1 << 1))
620*2831bc3aSCaesar Wang 		mmio_setbits_32(PMU_BASE + PMU_PWRMODE_CON, (1 << 23));
621*2831bc3aSCaesar Wang 
622*2831bc3aSCaesar Wang 	/* PHY_DLL_RST_EN */
623*2831bc3aSCaesar Wang 	if (channel_mask & (1 << 0))
624*2831bc3aSCaesar Wang 		mmio_clrsetbits_32(PHY_REG(0, 957), 0x3 << 24,
625*2831bc3aSCaesar Wang 				   0x2 << 24);
626*2831bc3aSCaesar Wang 	if (channel_mask & (1 << 1))
627*2831bc3aSCaesar Wang 		mmio_clrsetbits_32(PHY_REG(1, 957), 0x3 << 24,
628*2831bc3aSCaesar Wang 				   0x2 << 24);
629*2831bc3aSCaesar Wang 
630*2831bc3aSCaesar Wang 	/* check ERROR bit */
631*2831bc3aSCaesar Wang 	if (channel_mask & (1 << 0)) {
632*2831bc3aSCaesar Wang 		count = 0;
633*2831bc3aSCaesar Wang 		while (!(mmio_read_32(CTL_REG(0, 203)) & (1 << 3))) {
634*2831bc3aSCaesar Wang 			/* CKE is low, loop 10ms */
635*2831bc3aSCaesar Wang 			if (count > 100)
636*2831bc3aSCaesar Wang 				return -1;
637*2831bc3aSCaesar Wang 
638*2831bc3aSCaesar Wang 			sram_udelay(100);
639*2831bc3aSCaesar Wang 			count++;
640*2831bc3aSCaesar Wang 		}
641*2831bc3aSCaesar Wang 
642*2831bc3aSCaesar Wang 		mmio_clrbits_32(CTL_REG(0, 68), PWRUP_SREFRESH_EXIT);
643*2831bc3aSCaesar Wang 	}
644*2831bc3aSCaesar Wang 	if (channel_mask & (1 << 1)) {
645*2831bc3aSCaesar Wang 		count = 0;
646*2831bc3aSCaesar Wang 		while (!(mmio_read_32(CTL_REG(1, 203)) & (1 << 3))) {
647*2831bc3aSCaesar Wang 			/* CKE is low, loop 10ms */
648*2831bc3aSCaesar Wang 			if (count > 100)
649*2831bc3aSCaesar Wang 				return -1;
650*2831bc3aSCaesar Wang 
651*2831bc3aSCaesar Wang 			sram_udelay(100);
652*2831bc3aSCaesar Wang 			count++;
653*2831bc3aSCaesar Wang 		}
654*2831bc3aSCaesar Wang 
655*2831bc3aSCaesar Wang 		mmio_clrbits_32(CTL_REG(1, 68), PWRUP_SREFRESH_EXIT);
656*2831bc3aSCaesar Wang 	}
657*2831bc3aSCaesar Wang 
658*2831bc3aSCaesar Wang 	return 0;
659*2831bc3aSCaesar Wang }
660*2831bc3aSCaesar Wang 
661*2831bc3aSCaesar Wang void dmc_save(void)
662*2831bc3aSCaesar Wang {
663*2831bc3aSCaesar Wang 	struct rk3399_sdram_params *sdram_params = &sdram_config;
664*2831bc3aSCaesar Wang 	uint32_t *params_ctl;
665*2831bc3aSCaesar Wang 	uint32_t *params_pi;
666*2831bc3aSCaesar Wang 	uint32_t *params_phy;
667*2831bc3aSCaesar Wang 	uint32_t refdiv, postdiv2, postdiv1, fbdiv;
668*2831bc3aSCaesar Wang 	uint32_t tmp;
669*2831bc3aSCaesar Wang 
670*2831bc3aSCaesar Wang 	params_ctl = sdram_params->pctl_regs.denali_ctl;
671*2831bc3aSCaesar Wang 	params_pi = sdram_params->pi_regs.denali_pi;
672*2831bc3aSCaesar Wang 	params_phy = sdram_params->phy_regs.denali_phy;
673*2831bc3aSCaesar Wang 
674*2831bc3aSCaesar Wang 	fbdiv = mmio_read_32(CRU_BASE + CRU_PLL_CON(DPLL_ID, 0)) & 0xfff;
675*2831bc3aSCaesar Wang 	tmp = mmio_read_32(CRU_BASE + CRU_PLL_CON(DPLL_ID, 1));
676*2831bc3aSCaesar Wang 	postdiv2 = POSTDIV2_DEC(tmp);
677*2831bc3aSCaesar Wang 	postdiv1 = POSTDIV1_DEC(tmp);
678*2831bc3aSCaesar Wang 	refdiv = REFDIV_DEC(tmp);
679*2831bc3aSCaesar Wang 
680*2831bc3aSCaesar Wang 	sdram_params->ddr_freq = ((fbdiv * 24) /
681*2831bc3aSCaesar Wang 				(refdiv * postdiv1 * postdiv2)) * MHz;
682*2831bc3aSCaesar Wang 
683*2831bc3aSCaesar Wang 	INFO("sdram_params->ddr_freq = %d\n", sdram_params->ddr_freq);
684*2831bc3aSCaesar Wang 	sdram_params->odt = (((mmio_read_32(PHY_REG(0, 5)) >> 16) &
685*2831bc3aSCaesar Wang 			       0x7) != 0) ? 1 : 0;
686*2831bc3aSCaesar Wang 
687*2831bc3aSCaesar Wang 	/* copy the registers CTL PI and PHY */
688*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_ctl[0], CTL_REG(0, 0), CTL_REG_NUM);
689*2831bc3aSCaesar Wang 
690*2831bc3aSCaesar Wang 	/* mask DENALI_CTL_00_DATA.START, only copy here, will trigger later */
691*2831bc3aSCaesar Wang 	params_ctl[0] &= ~(0x1 << 0);
692*2831bc3aSCaesar Wang 
693*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_pi[0], PI_REG(0, 0),
694*2831bc3aSCaesar Wang 		    PI_REG_NUM);
695*2831bc3aSCaesar Wang 
696*2831bc3aSCaesar Wang 	/* mask DENALI_PI_00_DATA.START, only copy here, will trigger later*/
697*2831bc3aSCaesar Wang 	params_pi[0] &= ~(0x1 << 0);
698*2831bc3aSCaesar Wang 
699*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[0], PHY_REG(0, 0), 91);
700*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[128], PHY_REG(0, 128), 91);
701*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[256], PHY_REG(0, 256), 91);
702*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[384], PHY_REG(0, 384), 91);
703*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[512], PHY_REG(0, 512), 38);
704*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[640], PHY_REG(0, 640), 38);
705*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[768], PHY_REG(0, 768), 38);
706*2831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[896], PHY_REG(0, 896), 63);
707*2831bc3aSCaesar Wang 
708*2831bc3aSCaesar Wang 	/* set DENALI_PHY_957_DATA.PHY_DLL_RST_EN = 0x1 */
709*2831bc3aSCaesar Wang 	params_phy[957] &= ~(0x3 << 24);
710*2831bc3aSCaesar Wang 	params_phy[957] |= 1 << 24;
711*2831bc3aSCaesar Wang 	params_phy[896] |= 1;
712*2831bc3aSCaesar Wang 	params_phy[896] &= ~(0x3 << 8);
713*2831bc3aSCaesar Wang }
714*2831bc3aSCaesar Wang 
715*2831bc3aSCaesar Wang __sramfunc void dmc_restore(void)
716*2831bc3aSCaesar Wang {
717*2831bc3aSCaesar Wang 	struct rk3399_sdram_params *sdram_params = &sdram_config;
718*2831bc3aSCaesar Wang 	uint32_t channel_mask = 0;
719*2831bc3aSCaesar Wang 	uint32_t channel;
720*2831bc3aSCaesar Wang 
721*2831bc3aSCaesar Wang 	configure_sgrf();
722*2831bc3aSCaesar Wang 
723*2831bc3aSCaesar Wang retry:
724*2831bc3aSCaesar Wang 	for (channel = 0; channel < sdram_params->num_channels; channel++) {
725*2831bc3aSCaesar Wang 		phy_pctrl_reset(channel);
726*2831bc3aSCaesar Wang 		phy_dll_bypass_set(channel, sdram_params->ddr_freq);
727*2831bc3aSCaesar Wang 		if (channel >= sdram_params->num_channels)
728*2831bc3aSCaesar Wang 			continue;
729*2831bc3aSCaesar Wang 
730*2831bc3aSCaesar Wang 		pctl_cfg(channel, sdram_params);
731*2831bc3aSCaesar Wang 	}
732*2831bc3aSCaesar Wang 
733*2831bc3aSCaesar Wang 	for (channel = 0; channel < 2; channel++) {
734*2831bc3aSCaesar Wang 		if (sdram_params->ch[channel].col)
735*2831bc3aSCaesar Wang 			channel_mask |= 1 << channel;
736*2831bc3aSCaesar Wang 	}
737*2831bc3aSCaesar Wang 
738*2831bc3aSCaesar Wang 	if (pctl_start(channel_mask, sdram_params) < 0)
739*2831bc3aSCaesar Wang 		goto retry;
740*2831bc3aSCaesar Wang 
741*2831bc3aSCaesar Wang 	for (channel = 0; channel < sdram_params->num_channels; channel++) {
742*2831bc3aSCaesar Wang 		/* LPDDR2/LPDDR3 need to wait DAI complete, max 10us */
743*2831bc3aSCaesar Wang 		if (sdram_params->dramtype == LPDDR3)
744*2831bc3aSCaesar Wang 			sram_udelay(10);
745*2831bc3aSCaesar Wang 
746*2831bc3aSCaesar Wang 		/* If traning fail, retry to do it again. */
747*2831bc3aSCaesar Wang 		if (data_training(channel, sdram_params, PI_FULL_TRAINING))
748*2831bc3aSCaesar Wang 			goto retry;
749*2831bc3aSCaesar Wang 
750*2831bc3aSCaesar Wang 		set_ddrconfig(sdram_params, channel,
751*2831bc3aSCaesar Wang 			      sdram_params->ch[channel].ddrconfig);
752*2831bc3aSCaesar Wang 	}
753*2831bc3aSCaesar Wang 
754*2831bc3aSCaesar Wang 	dram_all_config(sdram_params);
755*2831bc3aSCaesar Wang 
756*2831bc3aSCaesar Wang 	/* Switch to index 1 and prepare for DDR frequency switch. */
757*2831bc3aSCaesar Wang 	dram_switch_to_phy_index1(sdram_params);
758*2831bc3aSCaesar Wang }
759