xref: /rk3399_ARM-atf/plat/rockchip/rk3399/drivers/dram/suspend.c (revision 82cb2c1ad9897473743f08437d0a3995bed561b9)
12831bc3aSCaesar Wang /*
22831bc3aSCaesar Wang  * Copyright (c) 2016, ARM Limited and Contributors. All rights reserved.
32831bc3aSCaesar Wang  *
4*82cb2c1aSdp-arm  * SPDX-License-Identifier: BSD-3-Clause
52831bc3aSCaesar Wang  */
62831bc3aSCaesar Wang #include <debug.h>
72831bc3aSCaesar Wang #include <arch_helpers.h>
82831bc3aSCaesar Wang #include <platform_def.h>
92831bc3aSCaesar Wang #include <plat_private.h>
102831bc3aSCaesar Wang #include <dram.h>
112831bc3aSCaesar Wang #include <pmu_regs.h>
122831bc3aSCaesar Wang #include <rk3399_def.h>
13e3525114SXing Zheng #include <secure.h>
142831bc3aSCaesar Wang #include <soc.h>
152831bc3aSCaesar Wang #include <suspend.h>
162831bc3aSCaesar Wang 
/* PMUGRF OS_REG0..3 register offsets */
#define PMUGRF_OS_REG0			0x300
#define PMUGRF_OS_REG1			0x304
#define PMUGRF_OS_REG2			0x308
#define PMUGRF_OS_REG3			0x30c

/*
 * Values for the DDR soft-reset write to CRU_SOFTRST_CON(4).
 * @n is placed in the controller reset bit (8 + 4 * ch) or the PHY reset
 * bit (9 + 4 * ch) of channel @ch, and the bit 16 positions above it is
 * set as well (presumably the write-enable mask for that bit - confirm
 * against the CRU register description).
 */
#define CRU_SFTRST_DDR_CTRL(ch, n)	\
	((0x1 << (8 + 16 + (ch) * 4)) | ((n) << (8 + (ch) * 4)))
#define CRU_SFTRST_DDR_PHY(ch, n)	\
	((0x1 << (9 + 16 + (ch) * 4)) | ((n) << (9 + (ch) * 4)))

/*
 * Pack (_ENC) / unpack (_DEC) the divider fields of a PLL setting:
 *   fbdiv    : 12 bits at bit 16
 *   postdiv2 :  3 bits at bit 12
 *   postdiv1 :  3 bits at bit 8
 *   refdiv   :  6 bits at bit 0
 */
#define FBDIV_ENC(n)			((n) << 16)
#define FBDIV_DEC(n)			(((n) >> 16) & 0xfff)
#define POSTDIV2_ENC(n)			((n) << 12)
#define POSTDIV2_DEC(n)			(((n) >> 12) & 0x7)
#define POSTDIV1_ENC(n)			((n) << 8)
#define POSTDIV1_DEC(n)			(((n) >> 8) & 0x7)
#define REFDIV_ENC(n)			(n)
#define REFDIV_DEC(n)			((n) & 0x3f)

/* PMU CRU reset-hold register offsets */
#define PMUCRU_RSTNHOLD_CON0		0x120
#define PMUCRU_RSTNHOLD_CON1		0x124

/* GPIO0/GPIO1 preset hold: value @n at bit 7/8 plus the matching WMSK_BIT */
#define PRESET_GPIO0_HOLD(n)		(((n) << 7) | WMSK_BIT(7))
#define PRESET_GPIO1_HOLD(n)		(((n) << 8) | WMSK_BIT(8))

/* System counter ticks per microsecond */
#define SYS_COUNTER_FREQ_IN_MHZ		(SYS_COUNTER_FREQ_IN_TICKS / 1000000)
442831bc3aSCaesar Wang 
452831bc3aSCaesar Wang /*
462831bc3aSCaesar Wang  * Copy @num registers from @src to @dst
472831bc3aSCaesar Wang  */
482831bc3aSCaesar Wang __sramfunc void sram_regcpy(uintptr_t dst, uintptr_t src, uint32_t num)
492831bc3aSCaesar Wang {
502831bc3aSCaesar Wang 	while (num--) {
512831bc3aSCaesar Wang 		mmio_write_32(dst, mmio_read_32(src));
522831bc3aSCaesar Wang 		dst += sizeof(uint32_t);
532831bc3aSCaesar Wang 		src += sizeof(uint32_t);
542831bc3aSCaesar Wang 	}
552831bc3aSCaesar Wang }
562831bc3aSCaesar Wang 
572831bc3aSCaesar Wang static __sramfunc uint32_t sram_get_timer_value(void)
582831bc3aSCaesar Wang {
592831bc3aSCaesar Wang 	/*
602831bc3aSCaesar Wang 	 * Generic delay timer implementation expects the timer to be a down
612831bc3aSCaesar Wang 	 * counter. We apply bitwise NOT operator to the tick values returned
622831bc3aSCaesar Wang 	 * by read_cntpct_el0() to simulate the down counter.
632831bc3aSCaesar Wang 	 */
642831bc3aSCaesar Wang 	return (uint32_t)(~read_cntpct_el0());
652831bc3aSCaesar Wang }
662831bc3aSCaesar Wang 
672831bc3aSCaesar Wang static __sramfunc void sram_udelay(uint32_t usec)
682831bc3aSCaesar Wang {
692831bc3aSCaesar Wang 	uint32_t start, cnt, delta, delta_us;
702831bc3aSCaesar Wang 
712831bc3aSCaesar Wang 	/* counter is decreasing */
722831bc3aSCaesar Wang 	start = sram_get_timer_value();
732831bc3aSCaesar Wang 	do {
742831bc3aSCaesar Wang 		cnt = sram_get_timer_value();
752831bc3aSCaesar Wang 		if (cnt > start) {
762831bc3aSCaesar Wang 			delta = UINT32_MAX - cnt;
772831bc3aSCaesar Wang 			delta += start;
782831bc3aSCaesar Wang 		} else
792831bc3aSCaesar Wang 			delta = start - cnt;
802831bc3aSCaesar Wang 		delta_us = (delta * SYS_COUNTER_FREQ_IN_MHZ);
812831bc3aSCaesar Wang 	} while (delta_us < usec);
822831bc3aSCaesar Wang }
832831bc3aSCaesar Wang 
842831bc3aSCaesar Wang static __sramfunc void configure_sgrf(void)
852831bc3aSCaesar Wang {
862831bc3aSCaesar Wang 	/*
872831bc3aSCaesar Wang 	 * SGRF_DDR_RGN_DPLL_CLK and SGRF_DDR_RGN_RTC_CLK:
882831bc3aSCaesar Wang 	 * IC ECO bug, need to set this register.
892831bc3aSCaesar Wang 	 *
902831bc3aSCaesar Wang 	 * SGRF_DDR_RGN_BYPS:
912831bc3aSCaesar Wang 	 * After the PD_CENTER suspend/resume, the DDR region
922831bc3aSCaesar Wang 	 * related registers in the SGRF will be reset, we
932831bc3aSCaesar Wang 	 * need to re-initialize them.
942831bc3aSCaesar Wang 	 */
952831bc3aSCaesar Wang 	mmio_write_32(SGRF_BASE + SGRF_DDRRGN_CON0_16(16),
962831bc3aSCaesar Wang 		      SGRF_DDR_RGN_DPLL_CLK |
972831bc3aSCaesar Wang 		      SGRF_DDR_RGN_RTC_CLK |
982831bc3aSCaesar Wang 		      SGRF_DDR_RGN_BYPS);
992831bc3aSCaesar Wang }
1002831bc3aSCaesar Wang 
1012831bc3aSCaesar Wang static __sramfunc void rkclk_ddr_reset(uint32_t channel, uint32_t ctl,
1022831bc3aSCaesar Wang 		uint32_t phy)
1032831bc3aSCaesar Wang {
1042831bc3aSCaesar Wang 	channel &= 0x1;
1052831bc3aSCaesar Wang 	ctl &= 0x1;
1062831bc3aSCaesar Wang 	phy &= 0x1;
1072831bc3aSCaesar Wang 	mmio_write_32(CRU_BASE + CRU_SOFTRST_CON(4),
1082831bc3aSCaesar Wang 		      CRU_SFTRST_DDR_CTRL(channel, ctl) |
1092831bc3aSCaesar Wang 		      CRU_SFTRST_DDR_PHY(channel, phy));
1102831bc3aSCaesar Wang }
1112831bc3aSCaesar Wang 
1122831bc3aSCaesar Wang static __sramfunc void phy_pctrl_reset(uint32_t ch)
1132831bc3aSCaesar Wang {
1142831bc3aSCaesar Wang 	rkclk_ddr_reset(ch, 1, 1);
1152831bc3aSCaesar Wang 	sram_udelay(10);
1162831bc3aSCaesar Wang 	rkclk_ddr_reset(ch, 1, 0);
1172831bc3aSCaesar Wang 	sram_udelay(10);
1182831bc3aSCaesar Wang 	rkclk_ddr_reset(ch, 0, 0);
1192831bc3aSCaesar Wang 	sram_udelay(10);
1202831bc3aSCaesar Wang }
1212831bc3aSCaesar Wang 
1222831bc3aSCaesar Wang static __sramfunc void phy_dll_bypass_set(uint32_t ch, uint32_t hz)
1232831bc3aSCaesar Wang {
1242831bc3aSCaesar Wang 	if (hz <= 125 * MHz) {
1252831bc3aSCaesar Wang 		/* phy_sw_master_mode_X PHY_86/214/342/470 4bits offset_8 */
1262831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 86), (0x3 << 2) << 8);
1272831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 214), (0x3 << 2) << 8);
1282831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 342), (0x3 << 2) << 8);
1292831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 470), (0x3 << 2) << 8);
1302831bc3aSCaesar Wang 		/* phy_adrctl_sw_master_mode PHY_547/675/803 4bits offset_16 */
1312831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 547), (0x3 << 2) << 16);
1322831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 675), (0x3 << 2) << 16);
1332831bc3aSCaesar Wang 		mmio_setbits_32(PHY_REG(ch, 803), (0x3 << 2) << 16);
1342831bc3aSCaesar Wang 	} else {
1352831bc3aSCaesar Wang 		/* phy_sw_master_mode_X PHY_86/214/342/470 4bits offset_8 */
1362831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 86), (0x3 << 2) << 8);
1372831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 214), (0x3 << 2) << 8);
1382831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 342), (0x3 << 2) << 8);
1392831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 470), (0x3 << 2) << 8);
1402831bc3aSCaesar Wang 		/* phy_adrctl_sw_master_mode PHY_547/675/803 4bits offset_16 */
1412831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 547), (0x3 << 2) << 16);
1422831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 675), (0x3 << 2) << 16);
1432831bc3aSCaesar Wang 		mmio_clrbits_32(PHY_REG(ch, 803), (0x3 << 2) << 16);
1442831bc3aSCaesar Wang 	}
1452831bc3aSCaesar Wang }
1462831bc3aSCaesar Wang 
1472831bc3aSCaesar Wang static __sramfunc void set_cs_training_index(uint32_t ch, uint32_t rank)
1482831bc3aSCaesar Wang {
1492831bc3aSCaesar Wang 	/* PHY_8/136/264/392 phy_per_cs_training_index_X 1bit offset_24 */
1502831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 8), 0x1 << 24, rank << 24);
1512831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 136), 0x1 << 24, rank << 24);
1522831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 264), 0x1 << 24, rank << 24);
1532831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 392), 0x1 << 24, rank << 24);
1542831bc3aSCaesar Wang }
1552831bc3aSCaesar Wang 
1562831bc3aSCaesar Wang static __sramfunc void select_per_cs_training_index(uint32_t ch, uint32_t rank)
1572831bc3aSCaesar Wang {
1582831bc3aSCaesar Wang 	/* PHY_84 PHY_PER_CS_TRAINING_EN_0 1bit offset_16 */
1592831bc3aSCaesar Wang 	if ((mmio_read_32(PHY_REG(ch, 84)) >> 16) & 1)
1602831bc3aSCaesar Wang 		set_cs_training_index(ch, rank);
1612831bc3aSCaesar Wang }
1622831bc3aSCaesar Wang 
1632831bc3aSCaesar Wang static void override_write_leveling_value(uint32_t ch)
1642831bc3aSCaesar Wang {
1652831bc3aSCaesar Wang 	uint32_t byte;
1662831bc3aSCaesar Wang 
1672831bc3aSCaesar Wang 	/* PHY_896 PHY_FREQ_SEL_MULTICAST_EN 1bit offset_0 */
1682831bc3aSCaesar Wang 	mmio_setbits_32(PHY_REG(ch, 896), 1);
1692831bc3aSCaesar Wang 
1702831bc3aSCaesar Wang 	/*
1712831bc3aSCaesar Wang 	 * PHY_8/136/264/392
1722831bc3aSCaesar Wang 	 * phy_per_cs_training_multicast_en_X 1bit offset_16
1732831bc3aSCaesar Wang 	 */
1742831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 8), 0x1 << 16, 1 << 16);
1752831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 136), 0x1 << 16, 1 << 16);
1762831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 264), 0x1 << 16, 1 << 16);
1772831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 392), 0x1 << 16, 1 << 16);
1782831bc3aSCaesar Wang 
1792831bc3aSCaesar Wang 	for (byte = 0; byte < 4; byte++)
1802831bc3aSCaesar Wang 		mmio_clrsetbits_32(PHY_REG(ch, 63 + (128 * byte)),
1812831bc3aSCaesar Wang 				   0xffff << 16,
1822831bc3aSCaesar Wang 				   0x200 << 16);
1832831bc3aSCaesar Wang 
1842831bc3aSCaesar Wang 	/* PHY_896 PHY_FREQ_SEL_MULTICAST_EN 1bit offset_0 */
1852831bc3aSCaesar Wang 	mmio_clrbits_32(PHY_REG(ch, 896), 1);
1862831bc3aSCaesar Wang 
1872831bc3aSCaesar Wang 	/* CTL_200 ctrlupd_req 1bit offset_8 */
1882831bc3aSCaesar Wang 	mmio_clrsetbits_32(CTL_REG(ch, 200), 0x1 << 8, 0x1 << 8);
1892831bc3aSCaesar Wang }
1902831bc3aSCaesar Wang 
1912831bc3aSCaesar Wang static __sramfunc int data_training(uint32_t ch,
1922831bc3aSCaesar Wang 		struct rk3399_sdram_params *sdram_params,
1932831bc3aSCaesar Wang 		uint32_t training_flag)
1942831bc3aSCaesar Wang {
1952831bc3aSCaesar Wang 	uint32_t obs_0, obs_1, obs_2, obs_3, obs_err = 0;
1962831bc3aSCaesar Wang 	uint32_t rank = sdram_params->ch[ch].rank;
1972831bc3aSCaesar Wang 	uint32_t rank_mask;
1982831bc3aSCaesar Wang 	uint32_t i, tmp;
1992831bc3aSCaesar Wang 
2002831bc3aSCaesar Wang 	if (sdram_params->dramtype == LPDDR4)
2012831bc3aSCaesar Wang 		rank_mask = (rank == 1) ? 0x5 : 0xf;
2022831bc3aSCaesar Wang 	else
2032831bc3aSCaesar Wang 		rank_mask = (rank == 1) ? 0x1 : 0x3;
2042831bc3aSCaesar Wang 
2052831bc3aSCaesar Wang 	/* PHY_927 PHY_PAD_DQS_DRIVE  RPULL offset_22 */
2062831bc3aSCaesar Wang 	mmio_setbits_32(PHY_REG(ch, 927), (1 << 22));
2072831bc3aSCaesar Wang 
2082831bc3aSCaesar Wang 	if (training_flag == PI_FULL_TRAINING) {
2092831bc3aSCaesar Wang 		if (sdram_params->dramtype == LPDDR4) {
2102831bc3aSCaesar Wang 			training_flag = PI_WRITE_LEVELING |
2112831bc3aSCaesar Wang 					PI_READ_GATE_TRAINING |
2122831bc3aSCaesar Wang 					PI_READ_LEVELING |
2132831bc3aSCaesar Wang 					PI_WDQ_LEVELING;
2142831bc3aSCaesar Wang 		} else if (sdram_params->dramtype == LPDDR3) {
2152831bc3aSCaesar Wang 			training_flag = PI_CA_TRAINING | PI_WRITE_LEVELING |
2162831bc3aSCaesar Wang 					PI_READ_GATE_TRAINING;
2172831bc3aSCaesar Wang 		} else if (sdram_params->dramtype == DDR3) {
2182831bc3aSCaesar Wang 			training_flag = PI_WRITE_LEVELING |
2192831bc3aSCaesar Wang 					PI_READ_GATE_TRAINING |
2202831bc3aSCaesar Wang 					PI_READ_LEVELING;
2212831bc3aSCaesar Wang 		}
2222831bc3aSCaesar Wang 	}
2232831bc3aSCaesar Wang 
2242831bc3aSCaesar Wang 	/* ca training(LPDDR4,LPDDR3 support) */
2252831bc3aSCaesar Wang 	if ((training_flag & PI_CA_TRAINING) == PI_CA_TRAINING) {
2262831bc3aSCaesar Wang 		for (i = 0; i < 4; i++) {
2272831bc3aSCaesar Wang 			if (!(rank_mask & (1 << i)))
2282831bc3aSCaesar Wang 				continue;
2292831bc3aSCaesar Wang 
2302831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
2312831bc3aSCaesar Wang 			/* PI_100 PI_CALVL_EN:RW:8:2 */
2322831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 100), 0x3 << 8, 0x2 << 8);
2332831bc3aSCaesar Wang 
2342831bc3aSCaesar Wang 			/* PI_92 PI_CALVL_REQ:WR:16:1,PI_CALVL_CS:RW:24:2 */
2352831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 92),
2362831bc3aSCaesar Wang 					   (0x1 << 16) | (0x3 << 24),
2372831bc3aSCaesar Wang 					   (0x1 << 16) | (i << 24));
2382831bc3aSCaesar Wang 			while (1) {
2392831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
2402831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
2412831bc3aSCaesar Wang 
2422831bc3aSCaesar Wang 				/*
2432831bc3aSCaesar Wang 				 * check status obs
2442831bc3aSCaesar Wang 				 * PHY_532/660/788 phy_adr_calvl_obs1_:0:32
2452831bc3aSCaesar Wang 				 */
2462831bc3aSCaesar Wang 				obs_0 = mmio_read_32(PHY_REG(ch, 532));
2472831bc3aSCaesar Wang 				obs_1 = mmio_read_32(PHY_REG(ch, 660));
2482831bc3aSCaesar Wang 				obs_2 = mmio_read_32(PHY_REG(ch, 788));
2492831bc3aSCaesar Wang 				if (((obs_0 >> 30) & 0x3) ||
2502831bc3aSCaesar Wang 				    ((obs_1 >> 30) & 0x3) ||
2512831bc3aSCaesar Wang 				    ((obs_2 >> 30) & 0x3))
2522831bc3aSCaesar Wang 					obs_err = 1;
2532831bc3aSCaesar Wang 				if ((((tmp >> 11) & 0x1) == 0x1) &&
2542831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
2552831bc3aSCaesar Wang 				    (((tmp >> 5) & 0x1) == 0x0) &&
2562831bc3aSCaesar Wang 				    (obs_err == 0))
2572831bc3aSCaesar Wang 					break;
2582831bc3aSCaesar Wang 				else if ((((tmp >> 5) & 0x1) == 0x1) ||
2592831bc3aSCaesar Wang 					 (obs_err == 1))
2602831bc3aSCaesar Wang 					return -1;
2612831bc3aSCaesar Wang 			}
2622831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
2632831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
2642831bc3aSCaesar Wang 		}
2652831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 100), 0x3 << 8);
2662831bc3aSCaesar Wang 	}
2672831bc3aSCaesar Wang 
2682831bc3aSCaesar Wang 	/* write leveling(LPDDR4,LPDDR3,DDR3 support) */
2692831bc3aSCaesar Wang 	if ((training_flag & PI_WRITE_LEVELING) == PI_WRITE_LEVELING) {
2702831bc3aSCaesar Wang 		for (i = 0; i < rank; i++) {
2712831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
2722831bc3aSCaesar Wang 			/* PI_60 PI_WRLVL_EN:RW:8:2 */
2732831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 60), 0x3 << 8, 0x2 << 8);
2742831bc3aSCaesar Wang 			/* PI_59 PI_WRLVL_REQ:WR:8:1,PI_WRLVL_CS:RW:16:2 */
2752831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 59),
2762831bc3aSCaesar Wang 					   (0x1 << 8) | (0x3 << 16),
2772831bc3aSCaesar Wang 					   (0x1 << 8) | (i << 16));
2782831bc3aSCaesar Wang 
2792831bc3aSCaesar Wang 			while (1) {
2802831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
2812831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
2822831bc3aSCaesar Wang 
2832831bc3aSCaesar Wang 				/*
2842831bc3aSCaesar Wang 				 * check status obs, if error maybe can not
2852831bc3aSCaesar Wang 				 * get leveling done PHY_40/168/296/424
2862831bc3aSCaesar Wang 				 * phy_wrlvl_status_obs_X:0:13
2872831bc3aSCaesar Wang 				 */
2882831bc3aSCaesar Wang 				obs_0 = mmio_read_32(PHY_REG(ch, 40));
2892831bc3aSCaesar Wang 				obs_1 = mmio_read_32(PHY_REG(ch, 168));
2902831bc3aSCaesar Wang 				obs_2 = mmio_read_32(PHY_REG(ch, 296));
2912831bc3aSCaesar Wang 				obs_3 = mmio_read_32(PHY_REG(ch, 424));
2922831bc3aSCaesar Wang 				if (((obs_0 >> 12) & 0x1) ||
2932831bc3aSCaesar Wang 				    ((obs_1 >> 12) & 0x1) ||
2942831bc3aSCaesar Wang 				    ((obs_2 >> 12) & 0x1) ||
2952831bc3aSCaesar Wang 				    ((obs_3 >> 12) & 0x1))
2962831bc3aSCaesar Wang 					obs_err = 1;
2972831bc3aSCaesar Wang 				if ((((tmp >> 10) & 0x1) == 0x1) &&
2982831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
2992831bc3aSCaesar Wang 				    (((tmp >> 4) & 0x1) == 0x0) &&
3002831bc3aSCaesar Wang 				    (obs_err == 0))
3012831bc3aSCaesar Wang 					break;
3022831bc3aSCaesar Wang 				else if ((((tmp >> 4) & 0x1) == 0x1) ||
3032831bc3aSCaesar Wang 					 (obs_err == 1))
3042831bc3aSCaesar Wang 					return -1;
3052831bc3aSCaesar Wang 			}
3062831bc3aSCaesar Wang 
3072831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
3082831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
3092831bc3aSCaesar Wang 		}
3102831bc3aSCaesar Wang 		override_write_leveling_value(ch);
3112831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 60), 0x3 << 8);
3122831bc3aSCaesar Wang 	}
3132831bc3aSCaesar Wang 
3142831bc3aSCaesar Wang 	/* read gate training(LPDDR4,LPDDR3,DDR3 support) */
3152831bc3aSCaesar Wang 	if ((training_flag & PI_READ_GATE_TRAINING) == PI_READ_GATE_TRAINING) {
3162831bc3aSCaesar Wang 		for (i = 0; i < rank; i++) {
3172831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
3182831bc3aSCaesar Wang 			/* PI_80 PI_RDLVL_GATE_EN:RW:24:2 */
3192831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 80), 0x3 << 24,
3202831bc3aSCaesar Wang 					   0x2 << 24);
3212831bc3aSCaesar Wang 			/*
3222831bc3aSCaesar Wang 			 * PI_74 PI_RDLVL_GATE_REQ:WR:16:1
3232831bc3aSCaesar Wang 			 * PI_RDLVL_CS:RW:24:2
3242831bc3aSCaesar Wang 			 */
3252831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 74),
3262831bc3aSCaesar Wang 					   (0x1 << 16) | (0x3 << 24),
3272831bc3aSCaesar Wang 					   (0x1 << 16) | (i << 24));
3282831bc3aSCaesar Wang 
3292831bc3aSCaesar Wang 			while (1) {
3302831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
3312831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
3322831bc3aSCaesar Wang 
3332831bc3aSCaesar Wang 				/*
3342831bc3aSCaesar Wang 				 * check status obs
3352831bc3aSCaesar Wang 				 * PHY_43/171/299/427
3362831bc3aSCaesar Wang 				 *     PHY_GTLVL_STATUS_OBS_x:16:8
3372831bc3aSCaesar Wang 				 */
3382831bc3aSCaesar Wang 				obs_0 = mmio_read_32(PHY_REG(ch, 43));
3392831bc3aSCaesar Wang 				obs_1 = mmio_read_32(PHY_REG(ch, 171));
3402831bc3aSCaesar Wang 				obs_2 = mmio_read_32(PHY_REG(ch, 299));
3412831bc3aSCaesar Wang 				obs_3 = mmio_read_32(PHY_REG(ch, 427));
3422831bc3aSCaesar Wang 				if (((obs_0 >> (16 + 6)) & 0x3) ||
3432831bc3aSCaesar Wang 				    ((obs_1 >> (16 + 6)) & 0x3) ||
3442831bc3aSCaesar Wang 				    ((obs_2 >> (16 + 6)) & 0x3) ||
3452831bc3aSCaesar Wang 				    ((obs_3 >> (16 + 6)) & 0x3))
3462831bc3aSCaesar Wang 					obs_err = 1;
3472831bc3aSCaesar Wang 				if ((((tmp >> 9) & 0x1) == 0x1) &&
3482831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
3492831bc3aSCaesar Wang 				    (((tmp >> 3) & 0x1) == 0x0) &&
3502831bc3aSCaesar Wang 				    (obs_err == 0))
3512831bc3aSCaesar Wang 					break;
3522831bc3aSCaesar Wang 				else if ((((tmp >> 3) & 0x1) == 0x1) ||
3532831bc3aSCaesar Wang 					 (obs_err == 1))
3542831bc3aSCaesar Wang 					return -1;
3552831bc3aSCaesar Wang 			}
3562831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
3572831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
3582831bc3aSCaesar Wang 		}
3592831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 80), 0x3 << 24);
3602831bc3aSCaesar Wang 	}
3612831bc3aSCaesar Wang 
3622831bc3aSCaesar Wang 	/* read leveling(LPDDR4,LPDDR3,DDR3 support) */
3632831bc3aSCaesar Wang 	if ((training_flag & PI_READ_LEVELING) == PI_READ_LEVELING) {
3642831bc3aSCaesar Wang 		for (i = 0; i < rank; i++) {
3652831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
3662831bc3aSCaesar Wang 			/* PI_80 PI_RDLVL_EN:RW:16:2 */
3672831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 80), 0x3 << 16,
3682831bc3aSCaesar Wang 					   0x2 << 16);
3692831bc3aSCaesar Wang 			/* PI_74 PI_RDLVL_REQ:WR:8:1,PI_RDLVL_CS:RW:24:2 */
3702831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 74),
3712831bc3aSCaesar Wang 					   (0x1 << 8) | (0x3 << 24),
3722831bc3aSCaesar Wang 					   (0x1 << 8) | (i << 24));
3732831bc3aSCaesar Wang 			while (1) {
3742831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
3752831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
3762831bc3aSCaesar Wang 
3772831bc3aSCaesar Wang 				/*
3782831bc3aSCaesar Wang 				 * make sure status obs not report error bit
3792831bc3aSCaesar Wang 				 * PHY_46/174/302/430
3802831bc3aSCaesar Wang 				 *     phy_rdlvl_status_obs_X:16:8
3812831bc3aSCaesar Wang 				 */
3822831bc3aSCaesar Wang 				if ((((tmp >> 8) & 0x1) == 0x1) &&
3832831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
3842831bc3aSCaesar Wang 				    (((tmp >> 2) & 0x1) == 0x0))
3852831bc3aSCaesar Wang 					break;
3862831bc3aSCaesar Wang 				else if (((tmp >> 2) & 0x1) == 0x1)
3872831bc3aSCaesar Wang 					return -1;
3882831bc3aSCaesar Wang 			}
3892831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
3902831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
3912831bc3aSCaesar Wang 		}
3922831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 80), 0x3 << 16);
3932831bc3aSCaesar Wang 	}
3942831bc3aSCaesar Wang 
3952831bc3aSCaesar Wang 	/* wdq leveling(LPDDR4 support) */
3962831bc3aSCaesar Wang 	if ((training_flag & PI_WDQ_LEVELING) == PI_WDQ_LEVELING) {
3972831bc3aSCaesar Wang 		for (i = 0; i < 4; i++) {
3982831bc3aSCaesar Wang 			if (!(rank_mask & (1 << i)))
3992831bc3aSCaesar Wang 				continue;
4002831bc3aSCaesar Wang 
4012831bc3aSCaesar Wang 			select_per_cs_training_index(ch, i);
4022831bc3aSCaesar Wang 			/*
4032831bc3aSCaesar Wang 			 * disable PI_WDQLVL_VREF_EN before wdq leveling?
4042831bc3aSCaesar Wang 			 * PI_181 PI_WDQLVL_VREF_EN:RW:8:1
4052831bc3aSCaesar Wang 			 */
4062831bc3aSCaesar Wang 			mmio_clrbits_32(PI_REG(ch, 181), 0x1 << 8);
4072831bc3aSCaesar Wang 			/* PI_124 PI_WDQLVL_EN:RW:16:2 */
4082831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 124), 0x3 << 16,
4092831bc3aSCaesar Wang 					   0x2 << 16);
4102831bc3aSCaesar Wang 			/* PI_121 PI_WDQLVL_REQ:WR:8:1,PI_WDQLVL_CS:RW:16:2 */
4112831bc3aSCaesar Wang 			mmio_clrsetbits_32(PI_REG(ch, 121),
4122831bc3aSCaesar Wang 					   (0x1 << 8) | (0x3 << 16),
4132831bc3aSCaesar Wang 					   (0x1 << 8) | (i << 16));
4142831bc3aSCaesar Wang 			while (1) {
4152831bc3aSCaesar Wang 				/* PI_174 PI_INT_STATUS:RD:8:18 */
4162831bc3aSCaesar Wang 				tmp = mmio_read_32(PI_REG(ch, 174)) >> 8;
4172831bc3aSCaesar Wang 				if ((((tmp >> 12) & 0x1) == 0x1) &&
4182831bc3aSCaesar Wang 				    (((tmp >> 13) & 0x1) == 0x1) &&
4192831bc3aSCaesar Wang 				    (((tmp >> 6) & 0x1) == 0x0))
4202831bc3aSCaesar Wang 					break;
4212831bc3aSCaesar Wang 				else if (((tmp >> 6) & 0x1) == 0x1)
4222831bc3aSCaesar Wang 					return -1;
4232831bc3aSCaesar Wang 			}
4242831bc3aSCaesar Wang 			/* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
4252831bc3aSCaesar Wang 			mmio_write_32(PI_REG(ch, 175), 0x00003f7c);
4262831bc3aSCaesar Wang 		}
4272831bc3aSCaesar Wang 		mmio_clrbits_32(PI_REG(ch, 124), 0x3 << 16);
4282831bc3aSCaesar Wang 	}
4292831bc3aSCaesar Wang 
4302831bc3aSCaesar Wang 	/* PHY_927 PHY_PAD_DQS_DRIVE  RPULL offset_22 */
4312831bc3aSCaesar Wang 	mmio_clrbits_32(PHY_REG(ch, 927), (1 << 22));
4322831bc3aSCaesar Wang 
4332831bc3aSCaesar Wang 	return 0;
4342831bc3aSCaesar Wang }
4352831bc3aSCaesar Wang 
4362831bc3aSCaesar Wang static __sramfunc void set_ddrconfig(struct rk3399_sdram_params *sdram_params,
4372831bc3aSCaesar Wang 		unsigned char channel, uint32_t ddrconfig)
4382831bc3aSCaesar Wang {
4392831bc3aSCaesar Wang 	/* only need to set ddrconfig */
4402831bc3aSCaesar Wang 	struct rk3399_sdram_channel *ch = &sdram_params->ch[channel];
4412831bc3aSCaesar Wang 	unsigned int cs0_cap = 0;
4422831bc3aSCaesar Wang 	unsigned int cs1_cap = 0;
4432831bc3aSCaesar Wang 
4442831bc3aSCaesar Wang 	cs0_cap = (1 << (ch->cs0_row + ch->col + ch->bk + ch->bw - 20));
4452831bc3aSCaesar Wang 	if (ch->rank > 1)
4462831bc3aSCaesar Wang 		cs1_cap = cs0_cap >> (ch->cs0_row - ch->cs1_row);
4472831bc3aSCaesar Wang 	if (ch->row_3_4) {
4482831bc3aSCaesar Wang 		cs0_cap = cs0_cap * 3 / 4;
4492831bc3aSCaesar Wang 		cs1_cap = cs1_cap * 3 / 4;
4502831bc3aSCaesar Wang 	}
4512831bc3aSCaesar Wang 
4522831bc3aSCaesar Wang 	mmio_write_32(MSCH_BASE(channel) + MSCH_DEVICECONF,
4532831bc3aSCaesar Wang 		      ddrconfig | (ddrconfig << 6));
4542831bc3aSCaesar Wang 	mmio_write_32(MSCH_BASE(channel) + MSCH_DEVICESIZE,
4552831bc3aSCaesar Wang 		      ((cs0_cap / 32) & 0xff) | (((cs1_cap / 32) & 0xff) << 8));
4562831bc3aSCaesar Wang }
4572831bc3aSCaesar Wang 
4582831bc3aSCaesar Wang static __sramfunc void dram_all_config(struct rk3399_sdram_params *sdram_params)
4592831bc3aSCaesar Wang {
4602831bc3aSCaesar Wang 	unsigned int i;
4612831bc3aSCaesar Wang 
4622831bc3aSCaesar Wang 	for (i = 0; i < 2; i++) {
4632831bc3aSCaesar Wang 		struct rk3399_sdram_channel *info = &sdram_params->ch[i];
4642831bc3aSCaesar Wang 		struct rk3399_msch_timings *noc = &info->noc_timings;
4652831bc3aSCaesar Wang 
4662831bc3aSCaesar Wang 		if (sdram_params->ch[i].col == 0)
4672831bc3aSCaesar Wang 			continue;
4682831bc3aSCaesar Wang 
4692831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DDRTIMINGA0,
4702831bc3aSCaesar Wang 			      noc->ddrtiminga0.d32);
4712831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DDRTIMINGB0,
4722831bc3aSCaesar Wang 			      noc->ddrtimingb0.d32);
4732831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DDRTIMINGC0,
4742831bc3aSCaesar Wang 			      noc->ddrtimingc0.d32);
4752831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DEVTODEV0,
4762831bc3aSCaesar Wang 			      noc->devtodev0.d32);
4772831bc3aSCaesar Wang 		mmio_write_32(MSCH_BASE(i) + MSCH_DDRMODE, noc->ddrmode.d32);
4782831bc3aSCaesar Wang 
4792831bc3aSCaesar Wang 		/* rank 1 memory clock disable (dfi_dram_clk_disable = 1) */
4802831bc3aSCaesar Wang 		if (sdram_params->ch[i].rank == 1)
4812831bc3aSCaesar Wang 			mmio_setbits_32(CTL_REG(i, 276), 1 << 17);
4822831bc3aSCaesar Wang 	}
4832831bc3aSCaesar Wang 
4842831bc3aSCaesar Wang 	DDR_STRIDE(sdram_params->stride);
4852831bc3aSCaesar Wang 
4862831bc3aSCaesar Wang 	/* reboot hold register set */
4872831bc3aSCaesar Wang 	mmio_write_32(PMUCRU_BASE + CRU_PMU_RSTHOLD_CON(1),
4882831bc3aSCaesar Wang 		      CRU_PMU_SGRF_RST_RLS |
4892831bc3aSCaesar Wang 		      PRESET_GPIO0_HOLD(1) |
4902831bc3aSCaesar Wang 		      PRESET_GPIO1_HOLD(1));
4912831bc3aSCaesar Wang 	mmio_clrsetbits_32(CRU_BASE + CRU_GLB_RST_CON, 0x3, 0x3);
4922831bc3aSCaesar Wang }
4932831bc3aSCaesar Wang 
4942831bc3aSCaesar Wang static __sramfunc void pctl_cfg(uint32_t ch,
4952831bc3aSCaesar Wang 		struct rk3399_sdram_params *sdram_params)
4962831bc3aSCaesar Wang {
4972831bc3aSCaesar Wang 	const uint32_t *params_ctl = sdram_params->pctl_regs.denali_ctl;
4982831bc3aSCaesar Wang 	const uint32_t *params_phy = sdram_params->phy_regs.denali_phy;
4992831bc3aSCaesar Wang 	const uint32_t *params_pi = sdram_params->pi_regs.denali_pi;
5002831bc3aSCaesar Wang 	uint32_t tmp, tmp1, tmp2;
5012831bc3aSCaesar Wang 
5022831bc3aSCaesar Wang 	/*
5032831bc3aSCaesar Wang 	 * Workaround controller bug:
5042831bc3aSCaesar Wang 	 * Do not program DRAM_CLASS until NO_PHY_IND_TRAIN_INT is programmed
5052831bc3aSCaesar Wang 	 */
5062831bc3aSCaesar Wang 	sram_regcpy(CTL_REG(ch, 1), (uintptr_t)&params_ctl[1],
5072831bc3aSCaesar Wang 		    CTL_REG_NUM - 1);
5082831bc3aSCaesar Wang 	mmio_write_32(CTL_REG(ch, 0), params_ctl[0]);
5092831bc3aSCaesar Wang 	sram_regcpy(PI_REG(ch, 0), (uintptr_t)&params_pi[0],
5102831bc3aSCaesar Wang 		    PI_REG_NUM);
5112831bc3aSCaesar Wang 
5122831bc3aSCaesar Wang 	mmio_write_32(PHY_REG(ch, 910), params_phy[910]);
5132831bc3aSCaesar Wang 	mmio_write_32(PHY_REG(ch, 911), params_phy[911]);
5142831bc3aSCaesar Wang 	mmio_write_32(PHY_REG(ch, 912), params_phy[912]);
5152831bc3aSCaesar Wang 
5162831bc3aSCaesar Wang 	mmio_clrsetbits_32(CTL_REG(ch, 68), PWRUP_SREFRESH_EXIT,
5172831bc3aSCaesar Wang 				PWRUP_SREFRESH_EXIT);
5182831bc3aSCaesar Wang 
5192831bc3aSCaesar Wang 	/* PHY_DLL_RST_EN */
5202831bc3aSCaesar Wang 	mmio_clrsetbits_32(PHY_REG(ch, 957), 0x3 << 24, 1 << 24);
5212831bc3aSCaesar Wang 	dmbst();
5222831bc3aSCaesar Wang 
5232831bc3aSCaesar Wang 	mmio_setbits_32(PI_REG(ch, 0), START);
5242831bc3aSCaesar Wang 	mmio_setbits_32(CTL_REG(ch, 0), START);
5252831bc3aSCaesar Wang 
5262831bc3aSCaesar Wang 	/* wait lock */
5272831bc3aSCaesar Wang 	while (1) {
5282831bc3aSCaesar Wang 		tmp = mmio_read_32(PHY_REG(ch, 920));
5292831bc3aSCaesar Wang 		tmp1 = mmio_read_32(PHY_REG(ch, 921));
5302831bc3aSCaesar Wang 		tmp2 = mmio_read_32(PHY_REG(ch, 922));
5312831bc3aSCaesar Wang 		if ((((tmp >> 16) & 0x1) == 0x1) &&
5322831bc3aSCaesar Wang 		     (((tmp1 >> 16) & 0x1) == 0x1) &&
5332831bc3aSCaesar Wang 		     (((tmp1 >> 0) & 0x1) == 0x1) &&
5342831bc3aSCaesar Wang 		     (((tmp2 >> 0) & 0x1) == 0x1))
5352831bc3aSCaesar Wang 			break;
5362831bc3aSCaesar Wang 		/* if PLL bypass,don't need wait lock */
5372831bc3aSCaesar Wang 		if (mmio_read_32(PHY_REG(ch, 911)) & 0x1)
5382831bc3aSCaesar Wang 			break;
5392831bc3aSCaesar Wang 	}
5402831bc3aSCaesar Wang 
5412831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 896), (uintptr_t)&params_phy[896], 63);
5422831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 0), (uintptr_t)&params_phy[0], 91);
5432831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 128), (uintptr_t)&params_phy[128], 91);
5442831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 256), (uintptr_t)&params_phy[256], 91);
5452831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 384), (uintptr_t)&params_phy[384], 91);
5462831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 512), (uintptr_t)&params_phy[512], 38);
5472831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 640), (uintptr_t)&params_phy[640], 38);
5482831bc3aSCaesar Wang 	sram_regcpy(PHY_REG(ch, 768), (uintptr_t)&params_phy[768], 38);
5492831bc3aSCaesar Wang }
5502831bc3aSCaesar Wang 
5514bd1d3faSDerek Basehore static __sramfunc int dram_switch_to_next_index(
5522831bc3aSCaesar Wang 		struct rk3399_sdram_params *sdram_params)
5532831bc3aSCaesar Wang {
5542831bc3aSCaesar Wang 	uint32_t ch, ch_count;
5554bd1d3faSDerek Basehore 	uint32_t fn = ((mmio_read_32(CTL_REG(0, 111)) >> 16) + 1) & 0x1;
5562831bc3aSCaesar Wang 
5572831bc3aSCaesar Wang 	mmio_write_32(CIC_BASE + CIC_CTRL0,
5582831bc3aSCaesar Wang 		      (((0x3 << 4) | (1 << 2) | 1) << 16) |
5594bd1d3faSDerek Basehore 		      (fn << 4) | (1 << 2) | 1);
5602831bc3aSCaesar Wang 	while (!(mmio_read_32(CIC_BASE + CIC_STATUS0) & (1 << 2)))
5612831bc3aSCaesar Wang 		;
5622831bc3aSCaesar Wang 
5632831bc3aSCaesar Wang 	mmio_write_32(CIC_BASE + CIC_CTRL0, 0x20002);
5642831bc3aSCaesar Wang 	while (!(mmio_read_32(CIC_BASE + CIC_STATUS0) & (1 << 0)))
5652831bc3aSCaesar Wang 		;
5662831bc3aSCaesar Wang 
5672831bc3aSCaesar Wang 	ch_count = sdram_params->num_channels;
5682831bc3aSCaesar Wang 
5692831bc3aSCaesar Wang 	/* LPDDR4 f2 cann't do training, all training will fail */
5702831bc3aSCaesar Wang 	for (ch = 0; ch < ch_count; ch++) {
5712831bc3aSCaesar Wang 		mmio_clrsetbits_32(PHY_REG(ch, 896), (0x3 << 8) | 1,
5724bd1d3faSDerek Basehore 				   fn << 8);
5732831bc3aSCaesar Wang 
5742831bc3aSCaesar Wang 		/* data_training failed */
5752831bc3aSCaesar Wang 		if (data_training(ch, sdram_params, PI_FULL_TRAINING))
5762831bc3aSCaesar Wang 			return -1;
5772831bc3aSCaesar Wang 	}
5782831bc3aSCaesar Wang 
5792831bc3aSCaesar Wang 	return 0;
5802831bc3aSCaesar Wang }
5812831bc3aSCaesar Wang 
5822831bc3aSCaesar Wang /*
5832831bc3aSCaesar Wang  * Needs to be done for both channels at once in case of a shared reset signal
5842831bc3aSCaesar Wang  * between channels.
5852831bc3aSCaesar Wang  */
5862831bc3aSCaesar Wang static __sramfunc int pctl_start(uint32_t channel_mask,
5872831bc3aSCaesar Wang 		struct rk3399_sdram_params *sdram_params)
5882831bc3aSCaesar Wang {
5892831bc3aSCaesar Wang 	uint32_t count;
590951752ddSDerek Basehore 	uint32_t byte;
5912831bc3aSCaesar Wang 
5922831bc3aSCaesar Wang 	mmio_setbits_32(CTL_REG(0, 68), PWRUP_SREFRESH_EXIT);
5932831bc3aSCaesar Wang 	mmio_setbits_32(CTL_REG(1, 68), PWRUP_SREFRESH_EXIT);
5942831bc3aSCaesar Wang 
5952831bc3aSCaesar Wang 	/* need de-access IO retention before controller START */
5962831bc3aSCaesar Wang 	if (channel_mask & (1 << 0))
5972831bc3aSCaesar Wang 		mmio_setbits_32(PMU_BASE + PMU_PWRMODE_CON, (1 << 19));
5982831bc3aSCaesar Wang 	if (channel_mask & (1 << 1))
5992831bc3aSCaesar Wang 		mmio_setbits_32(PMU_BASE + PMU_PWRMODE_CON, (1 << 23));
6002831bc3aSCaesar Wang 
6012831bc3aSCaesar Wang 	/* PHY_DLL_RST_EN */
6022831bc3aSCaesar Wang 	if (channel_mask & (1 << 0))
6032831bc3aSCaesar Wang 		mmio_clrsetbits_32(PHY_REG(0, 957), 0x3 << 24,
6042831bc3aSCaesar Wang 				   0x2 << 24);
6052831bc3aSCaesar Wang 	if (channel_mask & (1 << 1))
6062831bc3aSCaesar Wang 		mmio_clrsetbits_32(PHY_REG(1, 957), 0x3 << 24,
6072831bc3aSCaesar Wang 				   0x2 << 24);
6082831bc3aSCaesar Wang 
6092831bc3aSCaesar Wang 	/* check ERROR bit */
6102831bc3aSCaesar Wang 	if (channel_mask & (1 << 0)) {
6112831bc3aSCaesar Wang 		count = 0;
6122831bc3aSCaesar Wang 		while (!(mmio_read_32(CTL_REG(0, 203)) & (1 << 3))) {
6132831bc3aSCaesar Wang 			/* CKE is low, loop 10ms */
6142831bc3aSCaesar Wang 			if (count > 100)
6152831bc3aSCaesar Wang 				return -1;
6162831bc3aSCaesar Wang 
6172831bc3aSCaesar Wang 			sram_udelay(100);
6182831bc3aSCaesar Wang 			count++;
6192831bc3aSCaesar Wang 		}
6202831bc3aSCaesar Wang 
6212831bc3aSCaesar Wang 		mmio_clrbits_32(CTL_REG(0, 68), PWRUP_SREFRESH_EXIT);
622951752ddSDerek Basehore 
623951752ddSDerek Basehore 		/* Restore the PHY_RX_CAL_DQS value */
624951752ddSDerek Basehore 		for (byte = 0; byte < 4; byte++)
625951752ddSDerek Basehore 			mmio_clrsetbits_32(PHY_REG(0, 57 + 128 * byte),
626951752ddSDerek Basehore 					   0xfff << 16,
627951752ddSDerek Basehore 					   sdram_params->rx_cal_dqs[0][byte]);
6282831bc3aSCaesar Wang 	}
6292831bc3aSCaesar Wang 	if (channel_mask & (1 << 1)) {
6302831bc3aSCaesar Wang 		count = 0;
6312831bc3aSCaesar Wang 		while (!(mmio_read_32(CTL_REG(1, 203)) & (1 << 3))) {
6322831bc3aSCaesar Wang 			/* CKE is low, loop 10ms */
6332831bc3aSCaesar Wang 			if (count > 100)
6342831bc3aSCaesar Wang 				return -1;
6352831bc3aSCaesar Wang 
6362831bc3aSCaesar Wang 			sram_udelay(100);
6372831bc3aSCaesar Wang 			count++;
6382831bc3aSCaesar Wang 		}
6392831bc3aSCaesar Wang 
6402831bc3aSCaesar Wang 		mmio_clrbits_32(CTL_REG(1, 68), PWRUP_SREFRESH_EXIT);
641951752ddSDerek Basehore 
642951752ddSDerek Basehore 		/* Restore the PHY_RX_CAL_DQS value */
643951752ddSDerek Basehore 		for (byte = 0; byte < 4; byte++)
644951752ddSDerek Basehore 			mmio_clrsetbits_32(PHY_REG(1, 57 + 128 * byte),
645951752ddSDerek Basehore 					   0xfff << 16,
646951752ddSDerek Basehore 					   sdram_params->rx_cal_dqs[1][byte]);
6472831bc3aSCaesar Wang 	}
6482831bc3aSCaesar Wang 
6492831bc3aSCaesar Wang 	return 0;
6502831bc3aSCaesar Wang }
6512831bc3aSCaesar Wang 
6522831bc3aSCaesar Wang void dmc_save(void)
6532831bc3aSCaesar Wang {
6542831bc3aSCaesar Wang 	struct rk3399_sdram_params *sdram_params = &sdram_config;
6552831bc3aSCaesar Wang 	uint32_t *params_ctl;
6562831bc3aSCaesar Wang 	uint32_t *params_pi;
6572831bc3aSCaesar Wang 	uint32_t *params_phy;
6582831bc3aSCaesar Wang 	uint32_t refdiv, postdiv2, postdiv1, fbdiv;
659951752ddSDerek Basehore 	uint32_t tmp, ch, byte;
6602831bc3aSCaesar Wang 
6612831bc3aSCaesar Wang 	params_ctl = sdram_params->pctl_regs.denali_ctl;
6622831bc3aSCaesar Wang 	params_pi = sdram_params->pi_regs.denali_pi;
6632831bc3aSCaesar Wang 	params_phy = sdram_params->phy_regs.denali_phy;
6642831bc3aSCaesar Wang 
6652831bc3aSCaesar Wang 	fbdiv = mmio_read_32(CRU_BASE + CRU_PLL_CON(DPLL_ID, 0)) & 0xfff;
6662831bc3aSCaesar Wang 	tmp = mmio_read_32(CRU_BASE + CRU_PLL_CON(DPLL_ID, 1));
6672831bc3aSCaesar Wang 	postdiv2 = POSTDIV2_DEC(tmp);
6682831bc3aSCaesar Wang 	postdiv1 = POSTDIV1_DEC(tmp);
6692831bc3aSCaesar Wang 	refdiv = REFDIV_DEC(tmp);
6702831bc3aSCaesar Wang 
6712831bc3aSCaesar Wang 	sdram_params->ddr_freq = ((fbdiv * 24) /
6722831bc3aSCaesar Wang 				(refdiv * postdiv1 * postdiv2)) * MHz;
6732831bc3aSCaesar Wang 
6742831bc3aSCaesar Wang 	INFO("sdram_params->ddr_freq = %d\n", sdram_params->ddr_freq);
6752831bc3aSCaesar Wang 	sdram_params->odt = (((mmio_read_32(PHY_REG(0, 5)) >> 16) &
6762831bc3aSCaesar Wang 			       0x7) != 0) ? 1 : 0;
6772831bc3aSCaesar Wang 
6782831bc3aSCaesar Wang 	/* copy the registers CTL PI and PHY */
6792831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_ctl[0], CTL_REG(0, 0), CTL_REG_NUM);
6802831bc3aSCaesar Wang 
6812831bc3aSCaesar Wang 	/* mask DENALI_CTL_00_DATA.START, only copy here, will trigger later */
6822831bc3aSCaesar Wang 	params_ctl[0] &= ~(0x1 << 0);
6832831bc3aSCaesar Wang 
6842831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_pi[0], PI_REG(0, 0),
6852831bc3aSCaesar Wang 		    PI_REG_NUM);
6862831bc3aSCaesar Wang 
6872831bc3aSCaesar Wang 	/* mask DENALI_PI_00_DATA.START, only copy here, will trigger later*/
6882831bc3aSCaesar Wang 	params_pi[0] &= ~(0x1 << 0);
6892831bc3aSCaesar Wang 
6902831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[0], PHY_REG(0, 0), 91);
6912831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[128], PHY_REG(0, 128), 91);
6922831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[256], PHY_REG(0, 256), 91);
6932831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[384], PHY_REG(0, 384), 91);
6942831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[512], PHY_REG(0, 512), 38);
6952831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[640], PHY_REG(0, 640), 38);
6962831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[768], PHY_REG(0, 768), 38);
6972831bc3aSCaesar Wang 	sram_regcpy((uintptr_t)&params_phy[896], PHY_REG(0, 896), 63);
6982831bc3aSCaesar Wang 
699951752ddSDerek Basehore 	for (ch = 0; ch < sdram_params->num_channels; ch++) {
700951752ddSDerek Basehore 		for (byte = 0; byte < 4; byte++)
701951752ddSDerek Basehore 			sdram_params->rx_cal_dqs[ch][byte] = (0xfff << 16) &
702951752ddSDerek Basehore 				mmio_read_32(PHY_REG(ch, 57 + byte * 128));
703951752ddSDerek Basehore 	}
704951752ddSDerek Basehore 
7052831bc3aSCaesar Wang 	/* set DENALI_PHY_957_DATA.PHY_DLL_RST_EN = 0x1 */
7062831bc3aSCaesar Wang 	params_phy[957] &= ~(0x3 << 24);
7072831bc3aSCaesar Wang 	params_phy[957] |= 1 << 24;
7082831bc3aSCaesar Wang 	params_phy[896] |= 1;
7092831bc3aSCaesar Wang 	params_phy[896] &= ~(0x3 << 8);
7102831bc3aSCaesar Wang }
7112831bc3aSCaesar Wang 
7122831bc3aSCaesar Wang __sramfunc void dmc_restore(void)
7132831bc3aSCaesar Wang {
7142831bc3aSCaesar Wang 	struct rk3399_sdram_params *sdram_params = &sdram_config;
7152831bc3aSCaesar Wang 	uint32_t channel_mask = 0;
7162831bc3aSCaesar Wang 	uint32_t channel;
7172831bc3aSCaesar Wang 
7182831bc3aSCaesar Wang 	configure_sgrf();
7192831bc3aSCaesar Wang 
7202831bc3aSCaesar Wang retry:
7212831bc3aSCaesar Wang 	for (channel = 0; channel < sdram_params->num_channels; channel++) {
7222831bc3aSCaesar Wang 		phy_pctrl_reset(channel);
7232831bc3aSCaesar Wang 		phy_dll_bypass_set(channel, sdram_params->ddr_freq);
7242831bc3aSCaesar Wang 		if (channel >= sdram_params->num_channels)
7252831bc3aSCaesar Wang 			continue;
7262831bc3aSCaesar Wang 
7272831bc3aSCaesar Wang 		pctl_cfg(channel, sdram_params);
7282831bc3aSCaesar Wang 	}
7292831bc3aSCaesar Wang 
7302831bc3aSCaesar Wang 	for (channel = 0; channel < 2; channel++) {
7312831bc3aSCaesar Wang 		if (sdram_params->ch[channel].col)
7322831bc3aSCaesar Wang 			channel_mask |= 1 << channel;
7332831bc3aSCaesar Wang 	}
7342831bc3aSCaesar Wang 
7352831bc3aSCaesar Wang 	if (pctl_start(channel_mask, sdram_params) < 0)
7362831bc3aSCaesar Wang 		goto retry;
7372831bc3aSCaesar Wang 
7382831bc3aSCaesar Wang 	for (channel = 0; channel < sdram_params->num_channels; channel++) {
7392831bc3aSCaesar Wang 		/* LPDDR2/LPDDR3 need to wait DAI complete, max 10us */
7402831bc3aSCaesar Wang 		if (sdram_params->dramtype == LPDDR3)
7412831bc3aSCaesar Wang 			sram_udelay(10);
7422831bc3aSCaesar Wang 
7432831bc3aSCaesar Wang 		/* If traning fail, retry to do it again. */
7442831bc3aSCaesar Wang 		if (data_training(channel, sdram_params, PI_FULL_TRAINING))
7452831bc3aSCaesar Wang 			goto retry;
7462831bc3aSCaesar Wang 
7472831bc3aSCaesar Wang 		set_ddrconfig(sdram_params, channel,
7482831bc3aSCaesar Wang 			      sdram_params->ch[channel].ddrconfig);
7492831bc3aSCaesar Wang 	}
7502831bc3aSCaesar Wang 
7512831bc3aSCaesar Wang 	dram_all_config(sdram_params);
7522831bc3aSCaesar Wang 
7532831bc3aSCaesar Wang 	/* Switch to index 1 and prepare for DDR frequency switch. */
7544bd1d3faSDerek Basehore 	dram_switch_to_next_index(sdram_params);
7552831bc3aSCaesar Wang }
756