xref: /rk3399_rockchip-uboot/drivers/ddr/altera/sequencer.c (revision 162d60ef733a1878eee85cf1f3ed5e56f2a26903)
13da42859SDinh Nguyen /*
23da42859SDinh Nguyen  * Copyright Altera Corporation (C) 2012-2015
33da42859SDinh Nguyen  *
43da42859SDinh Nguyen  * SPDX-License-Identifier:    BSD-3-Clause
53da42859SDinh Nguyen  */
63da42859SDinh Nguyen 
73da42859SDinh Nguyen #include <common.h>
83da42859SDinh Nguyen #include <asm/io.h>
93da42859SDinh Nguyen #include <asm/arch/sdram.h>
103da42859SDinh Nguyen #include "sequencer.h"
113da42859SDinh Nguyen #include "sequencer_auto.h"
123da42859SDinh Nguyen #include "sequencer_auto_ac_init.h"
133da42859SDinh Nguyen #include "sequencer_auto_inst_init.h"
143da42859SDinh Nguyen #include "sequencer_defines.h"
153da42859SDinh Nguyen 
163da42859SDinh Nguyen static void scc_mgr_load_dqs_for_write_group(uint32_t write_group);
173da42859SDinh Nguyen 
183da42859SDinh Nguyen static struct socfpga_sdr_rw_load_manager *sdr_rw_load_mgr_regs =
196afb4fe2SMarek Vasut 	(struct socfpga_sdr_rw_load_manager *)(SDR_PHYGRP_RWMGRGRP_ADDRESS | 0x800);
203da42859SDinh Nguyen 
213da42859SDinh Nguyen static struct socfpga_sdr_rw_load_jump_manager *sdr_rw_load_jump_mgr_regs =
226afb4fe2SMarek Vasut 	(struct socfpga_sdr_rw_load_jump_manager *)(SDR_PHYGRP_RWMGRGRP_ADDRESS | 0xC00);
233da42859SDinh Nguyen 
243da42859SDinh Nguyen static struct socfpga_sdr_reg_file *sdr_reg_file =
25a1c654a8SMarek Vasut 	(struct socfpga_sdr_reg_file *)SDR_PHYGRP_REGFILEGRP_ADDRESS;
263da42859SDinh Nguyen 
273da42859SDinh Nguyen static struct socfpga_sdr_scc_mgr *sdr_scc_mgr =
28e79025a7SMarek Vasut 	(struct socfpga_sdr_scc_mgr *)(SDR_PHYGRP_SCCGRP_ADDRESS | 0xe00);
293da42859SDinh Nguyen 
303da42859SDinh Nguyen static struct socfpga_phy_mgr_cmd *phy_mgr_cmd =
311bc6f14aSMarek Vasut 	(struct socfpga_phy_mgr_cmd *)SDR_PHYGRP_PHYMGRGRP_ADDRESS;
323da42859SDinh Nguyen 
333da42859SDinh Nguyen static struct socfpga_phy_mgr_cfg *phy_mgr_cfg =
341bc6f14aSMarek Vasut 	(struct socfpga_phy_mgr_cfg *)(SDR_PHYGRP_PHYMGRGRP_ADDRESS | 0x40);
353da42859SDinh Nguyen 
363da42859SDinh Nguyen static struct socfpga_data_mgr *data_mgr =
37c4815f76SMarek Vasut 	(struct socfpga_data_mgr *)SDR_PHYGRP_DATAMGRGRP_ADDRESS;
383da42859SDinh Nguyen 
396cb9f167SMarek Vasut static struct socfpga_sdr_ctrl *sdr_ctrl =
406cb9f167SMarek Vasut 	(struct socfpga_sdr_ctrl *)SDR_CTRLGRP_ADDRESS;
416cb9f167SMarek Vasut 
423da42859SDinh Nguyen #define DELTA_D		1
433da42859SDinh Nguyen 
443da42859SDinh Nguyen /*
453da42859SDinh Nguyen  * In order to reduce ROM size, most of the selectable calibration steps are
463da42859SDinh Nguyen  * decided at compile time based on the user's calibration mode selection,
473da42859SDinh Nguyen  * as captured by the STATIC_CALIB_STEPS selection below.
483da42859SDinh Nguyen  *
493da42859SDinh Nguyen  * However, to support simulation-time selection of fast simulation mode, where
503da42859SDinh Nguyen  * we skip everything except the bare minimum, we need a few of the steps to
513da42859SDinh Nguyen  * be dynamic.  In those cases, we either use the DYNAMIC_CALIB_STEPS for the
523da42859SDinh Nguyen  * check, which is based on the rtl-supplied value, or we dynamically compute
533da42859SDinh Nguyen  * the value to use based on the dynamically-chosen calibration mode
543da42859SDinh Nguyen  */
553da42859SDinh Nguyen 
563da42859SDinh Nguyen #define DLEVEL 0
573da42859SDinh Nguyen #define STATIC_IN_RTL_SIM 0
583da42859SDinh Nguyen #define STATIC_SKIP_DELAY_LOOPS 0
593da42859SDinh Nguyen 
603da42859SDinh Nguyen #define STATIC_CALIB_STEPS (STATIC_IN_RTL_SIM | CALIB_SKIP_FULL_TEST | \
613da42859SDinh Nguyen 	STATIC_SKIP_DELAY_LOOPS)
623da42859SDinh Nguyen 
633da42859SDinh Nguyen /* calibration steps requested by the rtl */
643da42859SDinh Nguyen uint16_t dyn_calib_steps;
653da42859SDinh Nguyen 
663da42859SDinh Nguyen /*
673da42859SDinh Nguyen  * To make CALIB_SKIP_DELAY_LOOPS a dynamic conditional option
683da42859SDinh Nguyen  * instead of static, we use boolean logic to select between
693da42859SDinh Nguyen  * non-skip and skip values
703da42859SDinh Nguyen  *
713da42859SDinh Nguyen  * The mask is set to include all bits when not-skipping, but is
723da42859SDinh Nguyen  * zero when skipping
733da42859SDinh Nguyen  */
743da42859SDinh Nguyen 
753da42859SDinh Nguyen uint16_t skip_delay_mask;	/* mask off bits when skipping/not-skipping */
763da42859SDinh Nguyen 
773da42859SDinh Nguyen #define SKIP_DELAY_LOOP_VALUE_OR_ZERO(non_skip_value) \
783da42859SDinh Nguyen 	((non_skip_value) & skip_delay_mask)
793da42859SDinh Nguyen 
803da42859SDinh Nguyen struct gbl_type *gbl;
813da42859SDinh Nguyen struct param_type *param;
823da42859SDinh Nguyen uint32_t curr_shadow_reg;
833da42859SDinh Nguyen 
843da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_write_test(uint32_t rank_bgn,
853da42859SDinh Nguyen 	uint32_t write_group, uint32_t use_dm,
863da42859SDinh Nguyen 	uint32_t all_correct, uint32_t *bit_chk, uint32_t all_ranks);
873da42859SDinh Nguyen 
883da42859SDinh Nguyen static void set_failing_group_stage(uint32_t group, uint32_t stage,
893da42859SDinh Nguyen 	uint32_t substage)
903da42859SDinh Nguyen {
913da42859SDinh Nguyen 	/*
923da42859SDinh Nguyen 	 * Only set the global stage if there was not been any other
933da42859SDinh Nguyen 	 * failing group
943da42859SDinh Nguyen 	 */
953da42859SDinh Nguyen 	if (gbl->error_stage == CAL_STAGE_NIL)	{
963da42859SDinh Nguyen 		gbl->error_substage = substage;
973da42859SDinh Nguyen 		gbl->error_stage = stage;
983da42859SDinh Nguyen 		gbl->error_group = group;
993da42859SDinh Nguyen 	}
1003da42859SDinh Nguyen }
1013da42859SDinh Nguyen 
1022c0d2d9cSMarek Vasut static void reg_file_set_group(u16 set_group)
1033da42859SDinh Nguyen {
1042c0d2d9cSMarek Vasut 	clrsetbits_le32(&sdr_reg_file->cur_stage, 0xffff0000, set_group << 16);
1053da42859SDinh Nguyen }
1063da42859SDinh Nguyen 
1072c0d2d9cSMarek Vasut static void reg_file_set_stage(u8 set_stage)
1083da42859SDinh Nguyen {
1092c0d2d9cSMarek Vasut 	clrsetbits_le32(&sdr_reg_file->cur_stage, 0xffff, set_stage & 0xff);
1103da42859SDinh Nguyen }
1113da42859SDinh Nguyen 
1122c0d2d9cSMarek Vasut static void reg_file_set_sub_stage(u8 set_sub_stage)
1133da42859SDinh Nguyen {
1142c0d2d9cSMarek Vasut 	set_sub_stage &= 0xff;
1152c0d2d9cSMarek Vasut 	clrsetbits_le32(&sdr_reg_file->cur_stage, 0xff00, set_sub_stage << 8);
1163da42859SDinh Nguyen }
1173da42859SDinh Nguyen 
1183da42859SDinh Nguyen static void initialize(void)
1193da42859SDinh Nguyen {
1203da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
1213da42859SDinh Nguyen 	/* USER calibration has control over path to memory */
1223da42859SDinh Nguyen 	/*
1233da42859SDinh Nguyen 	 * In Hard PHY this is a 2-bit control:
1243da42859SDinh Nguyen 	 * 0: AFI Mux Select
1253da42859SDinh Nguyen 	 * 1: DDIO Mux Select
1263da42859SDinh Nguyen 	 */
1271273dd9eSMarek Vasut 	writel(0x3, &phy_mgr_cfg->mux_sel);
1283da42859SDinh Nguyen 
1293da42859SDinh Nguyen 	/* USER memory clock is not stable we begin initialization  */
1301273dd9eSMarek Vasut 	writel(0, &phy_mgr_cfg->reset_mem_stbl);
1313da42859SDinh Nguyen 
1323da42859SDinh Nguyen 	/* USER calibration status all set to zero */
1331273dd9eSMarek Vasut 	writel(0, &phy_mgr_cfg->cal_status);
1343da42859SDinh Nguyen 
1351273dd9eSMarek Vasut 	writel(0, &phy_mgr_cfg->cal_debug_info);
1363da42859SDinh Nguyen 
1373da42859SDinh Nguyen 	if ((dyn_calib_steps & CALIB_SKIP_ALL) != CALIB_SKIP_ALL) {
1383da42859SDinh Nguyen 		param->read_correct_mask_vg  = ((uint32_t)1 <<
1393da42859SDinh Nguyen 			(RW_MGR_MEM_DQ_PER_READ_DQS /
1403da42859SDinh Nguyen 			RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS)) - 1;
1413da42859SDinh Nguyen 		param->write_correct_mask_vg = ((uint32_t)1 <<
1423da42859SDinh Nguyen 			(RW_MGR_MEM_DQ_PER_READ_DQS /
1433da42859SDinh Nguyen 			RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS)) - 1;
1443da42859SDinh Nguyen 		param->read_correct_mask     = ((uint32_t)1 <<
1453da42859SDinh Nguyen 			RW_MGR_MEM_DQ_PER_READ_DQS) - 1;
1463da42859SDinh Nguyen 		param->write_correct_mask    = ((uint32_t)1 <<
1473da42859SDinh Nguyen 			RW_MGR_MEM_DQ_PER_WRITE_DQS) - 1;
1483da42859SDinh Nguyen 		param->dm_correct_mask       = ((uint32_t)1 <<
1493da42859SDinh Nguyen 			(RW_MGR_MEM_DATA_WIDTH / RW_MGR_MEM_DATA_MASK_WIDTH))
1503da42859SDinh Nguyen 			- 1;
1513da42859SDinh Nguyen 	}
1523da42859SDinh Nguyen }
1533da42859SDinh Nguyen 
1543da42859SDinh Nguyen static void set_rank_and_odt_mask(uint32_t rank, uint32_t odt_mode)
1553da42859SDinh Nguyen {
1563da42859SDinh Nguyen 	uint32_t odt_mask_0 = 0;
1573da42859SDinh Nguyen 	uint32_t odt_mask_1 = 0;
1583da42859SDinh Nguyen 	uint32_t cs_and_odt_mask;
1593da42859SDinh Nguyen 
1603da42859SDinh Nguyen 	if (odt_mode == RW_MGR_ODT_MODE_READ_WRITE) {
1613da42859SDinh Nguyen 		if (RW_MGR_MEM_NUMBER_OF_RANKS == 1) {
1623da42859SDinh Nguyen 			/*
1633da42859SDinh Nguyen 			 * 1 Rank
1643da42859SDinh Nguyen 			 * Read: ODT = 0
1653da42859SDinh Nguyen 			 * Write: ODT = 1
1663da42859SDinh Nguyen 			 */
1673da42859SDinh Nguyen 			odt_mask_0 = 0x0;
1683da42859SDinh Nguyen 			odt_mask_1 = 0x1;
1693da42859SDinh Nguyen 		} else if (RW_MGR_MEM_NUMBER_OF_RANKS == 2) {
1703da42859SDinh Nguyen 			/* 2 Ranks */
1713da42859SDinh Nguyen 			if (RW_MGR_MEM_NUMBER_OF_CS_PER_DIMM == 1) {
1723da42859SDinh Nguyen 				/* - Dual-Slot , Single-Rank
1733da42859SDinh Nguyen 				 * (1 chip-select per DIMM)
1743da42859SDinh Nguyen 				 * OR
1753da42859SDinh Nguyen 				 * - RDIMM, 4 total CS (2 CS per DIMM)
1763da42859SDinh Nguyen 				 * means 2 DIMM
1773da42859SDinh Nguyen 				 * Since MEM_NUMBER_OF_RANKS is 2 they are
1783da42859SDinh Nguyen 				 * both single rank
1793da42859SDinh Nguyen 				 * with 2 CS each (special for RDIMM)
1803da42859SDinh Nguyen 				 * Read: Turn on ODT on the opposite rank
1813da42859SDinh Nguyen 				 * Write: Turn on ODT on all ranks
1823da42859SDinh Nguyen 				 */
1833da42859SDinh Nguyen 				odt_mask_0 = 0x3 & ~(1 << rank);
1843da42859SDinh Nguyen 				odt_mask_1 = 0x3;
1853da42859SDinh Nguyen 			} else {
1863da42859SDinh Nguyen 				/*
1873da42859SDinh Nguyen 				 * USER - Single-Slot , Dual-rank DIMMs
1883da42859SDinh Nguyen 				 * (2 chip-selects per DIMM)
1893da42859SDinh Nguyen 				 * USER Read: Turn on ODT off on all ranks
1903da42859SDinh Nguyen 				 * USER Write: Turn on ODT on active rank
1913da42859SDinh Nguyen 				 */
1923da42859SDinh Nguyen 				odt_mask_0 = 0x0;
1933da42859SDinh Nguyen 				odt_mask_1 = 0x3 & (1 << rank);
1943da42859SDinh Nguyen 			}
1953da42859SDinh Nguyen 		} else {
1963da42859SDinh Nguyen 			/* 4 Ranks
1973da42859SDinh Nguyen 			 * Read:
1983da42859SDinh Nguyen 			 * ----------+-----------------------+
1993da42859SDinh Nguyen 			 *           |                       |
2003da42859SDinh Nguyen 			 *           |         ODT           |
2013da42859SDinh Nguyen 			 * Read From +-----------------------+
2023da42859SDinh Nguyen 			 *   Rank    |  3  |  2  |  1  |  0  |
2033da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2043da42859SDinh Nguyen 			 *     0     |  0  |  1  |  0  |  0  |
2053da42859SDinh Nguyen 			 *     1     |  1  |  0  |  0  |  0  |
2063da42859SDinh Nguyen 			 *     2     |  0  |  0  |  0  |  1  |
2073da42859SDinh Nguyen 			 *     3     |  0  |  0  |  1  |  0  |
2083da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2093da42859SDinh Nguyen 			 *
2103da42859SDinh Nguyen 			 * Write:
2113da42859SDinh Nguyen 			 * ----------+-----------------------+
2123da42859SDinh Nguyen 			 *           |                       |
2133da42859SDinh Nguyen 			 *           |         ODT           |
2143da42859SDinh Nguyen 			 * Write To  +-----------------------+
2153da42859SDinh Nguyen 			 *   Rank    |  3  |  2  |  1  |  0  |
2163da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2173da42859SDinh Nguyen 			 *     0     |  0  |  1  |  0  |  1  |
2183da42859SDinh Nguyen 			 *     1     |  1  |  0  |  1  |  0  |
2193da42859SDinh Nguyen 			 *     2     |  0  |  1  |  0  |  1  |
2203da42859SDinh Nguyen 			 *     3     |  1  |  0  |  1  |  0  |
2213da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2223da42859SDinh Nguyen 			 */
2233da42859SDinh Nguyen 			switch (rank) {
2243da42859SDinh Nguyen 			case 0:
2253da42859SDinh Nguyen 				odt_mask_0 = 0x4;
2263da42859SDinh Nguyen 				odt_mask_1 = 0x5;
2273da42859SDinh Nguyen 				break;
2283da42859SDinh Nguyen 			case 1:
2293da42859SDinh Nguyen 				odt_mask_0 = 0x8;
2303da42859SDinh Nguyen 				odt_mask_1 = 0xA;
2313da42859SDinh Nguyen 				break;
2323da42859SDinh Nguyen 			case 2:
2333da42859SDinh Nguyen 				odt_mask_0 = 0x1;
2343da42859SDinh Nguyen 				odt_mask_1 = 0x5;
2353da42859SDinh Nguyen 				break;
2363da42859SDinh Nguyen 			case 3:
2373da42859SDinh Nguyen 				odt_mask_0 = 0x2;
2383da42859SDinh Nguyen 				odt_mask_1 = 0xA;
2393da42859SDinh Nguyen 				break;
2403da42859SDinh Nguyen 			}
2413da42859SDinh Nguyen 		}
2423da42859SDinh Nguyen 	} else {
2433da42859SDinh Nguyen 		odt_mask_0 = 0x0;
2443da42859SDinh Nguyen 		odt_mask_1 = 0x0;
2453da42859SDinh Nguyen 	}
2463da42859SDinh Nguyen 
2473da42859SDinh Nguyen 	cs_and_odt_mask =
2483da42859SDinh Nguyen 		(0xFF & ~(1 << rank)) |
2493da42859SDinh Nguyen 		((0xFF & odt_mask_0) << 8) |
2503da42859SDinh Nguyen 		((0xFF & odt_mask_1) << 16);
2511273dd9eSMarek Vasut 	writel(cs_and_odt_mask, SDR_PHYGRP_RWMGRGRP_ADDRESS |
2521273dd9eSMarek Vasut 				RW_MGR_SET_CS_AND_ODT_MASK_OFFSET);
2533da42859SDinh Nguyen }
2543da42859SDinh Nguyen 
255c76976d9SMarek Vasut /**
256c76976d9SMarek Vasut  * scc_mgr_set() - Set SCC Manager register
257c76976d9SMarek Vasut  * @off:	Base offset in SCC Manager space
258c76976d9SMarek Vasut  * @grp:	Read/Write group
259c76976d9SMarek Vasut  * @val:	Value to be set
260c76976d9SMarek Vasut  *
261c76976d9SMarek Vasut  * This function sets the SCC Manager (Scan Chain Control Manager) register.
262c76976d9SMarek Vasut  */
263c76976d9SMarek Vasut static void scc_mgr_set(u32 off, u32 grp, u32 val)
264c76976d9SMarek Vasut {
265c76976d9SMarek Vasut 	writel(val, SDR_PHYGRP_SCCGRP_ADDRESS | off | (grp << 2));
266c76976d9SMarek Vasut }
267c76976d9SMarek Vasut 
268e893f4dcSMarek Vasut /**
269e893f4dcSMarek Vasut  * scc_mgr_initialize() - Initialize SCC Manager registers
270e893f4dcSMarek Vasut  *
271e893f4dcSMarek Vasut  * Initialize SCC Manager registers.
272e893f4dcSMarek Vasut  */
2733da42859SDinh Nguyen static void scc_mgr_initialize(void)
2743da42859SDinh Nguyen {
2753da42859SDinh Nguyen 	/*
276e893f4dcSMarek Vasut 	 * Clear register file for HPS. 16 (2^4) is the size of the
277e893f4dcSMarek Vasut 	 * full register file in the scc mgr:
278e893f4dcSMarek Vasut 	 *	RFILE_DEPTH = 1 + log2(MEM_DQ_PER_DQS + 1 + MEM_DM_PER_DQS +
279e893f4dcSMarek Vasut 	 *                             MEM_IF_READ_DQS_WIDTH - 1);
2803da42859SDinh Nguyen 	 */
281c76976d9SMarek Vasut 	int i;
282e893f4dcSMarek Vasut 
2833da42859SDinh Nguyen 	for (i = 0; i < 16; i++) {
2847ac40d25SMarek Vasut 		debug_cond(DLEVEL == 1, "%s:%d: Clearing SCC RFILE index %u\n",
2853da42859SDinh Nguyen 			   __func__, __LINE__, i);
286c76976d9SMarek Vasut 		scc_mgr_set(SCC_MGR_HHP_RFILE_OFFSET, 0, i);
2873da42859SDinh Nguyen 	}
2883da42859SDinh Nguyen }
2893da42859SDinh Nguyen 
2905ff825b8SMarek Vasut static void scc_mgr_set_dqdqs_output_phase(uint32_t write_group, uint32_t phase)
2915ff825b8SMarek Vasut {
292c76976d9SMarek Vasut 	scc_mgr_set(SCC_MGR_DQDQS_OUT_PHASE_OFFSET, write_group, phase);
2935ff825b8SMarek Vasut }
2945ff825b8SMarek Vasut 
2955ff825b8SMarek Vasut static void scc_mgr_set_dqs_bus_in_delay(uint32_t read_group, uint32_t delay)
2963da42859SDinh Nguyen {
297c76976d9SMarek Vasut 	scc_mgr_set(SCC_MGR_DQS_IN_DELAY_OFFSET, read_group, delay);
2983da42859SDinh Nguyen }
2993da42859SDinh Nguyen 
3003da42859SDinh Nguyen static void scc_mgr_set_dqs_en_phase(uint32_t read_group, uint32_t phase)
3013da42859SDinh Nguyen {
302c76976d9SMarek Vasut 	scc_mgr_set(SCC_MGR_DQS_EN_PHASE_OFFSET, read_group, phase);
3033da42859SDinh Nguyen }
3043da42859SDinh Nguyen 
3055ff825b8SMarek Vasut static void scc_mgr_set_dqs_en_delay(uint32_t read_group, uint32_t delay)
3065ff825b8SMarek Vasut {
307c76976d9SMarek Vasut 	scc_mgr_set(SCC_MGR_DQS_EN_DELAY_OFFSET, read_group, delay);
3085ff825b8SMarek Vasut }
3095ff825b8SMarek Vasut 
3105ff825b8SMarek Vasut static void scc_mgr_set_dqs_io_in_delay(uint32_t write_group, uint32_t delay)
3115ff825b8SMarek Vasut {
312c76976d9SMarek Vasut 	scc_mgr_set(SCC_MGR_IO_IN_DELAY_OFFSET, RW_MGR_MEM_DQ_PER_WRITE_DQS,
313c76976d9SMarek Vasut 		    delay);
3145ff825b8SMarek Vasut }
3155ff825b8SMarek Vasut 
3165ff825b8SMarek Vasut static void scc_mgr_set_dq_in_delay(uint32_t dq_in_group, uint32_t delay)
3175ff825b8SMarek Vasut {
318c76976d9SMarek Vasut 	scc_mgr_set(SCC_MGR_IO_IN_DELAY_OFFSET, dq_in_group, delay);
3195ff825b8SMarek Vasut }
3205ff825b8SMarek Vasut 
3215ff825b8SMarek Vasut static void scc_mgr_set_dq_out1_delay(uint32_t dq_in_group, uint32_t delay)
3225ff825b8SMarek Vasut {
323c76976d9SMarek Vasut 	scc_mgr_set(SCC_MGR_IO_OUT1_DELAY_OFFSET, dq_in_group, delay);
3245ff825b8SMarek Vasut }
3255ff825b8SMarek Vasut 
3265ff825b8SMarek Vasut static void scc_mgr_set_dqs_out1_delay(uint32_t write_group,
3275ff825b8SMarek Vasut 					      uint32_t delay)
3285ff825b8SMarek Vasut {
329c76976d9SMarek Vasut 	scc_mgr_set(SCC_MGR_IO_OUT1_DELAY_OFFSET, RW_MGR_MEM_DQ_PER_WRITE_DQS,
330c76976d9SMarek Vasut 		    delay);
3315ff825b8SMarek Vasut }
3325ff825b8SMarek Vasut 
3335ff825b8SMarek Vasut static void scc_mgr_set_dm_out1_delay(uint32_t dm, uint32_t delay)
3345ff825b8SMarek Vasut {
335c76976d9SMarek Vasut 	scc_mgr_set(SCC_MGR_IO_OUT1_DELAY_OFFSET,
336c76976d9SMarek Vasut 		    RW_MGR_MEM_DQ_PER_WRITE_DQS + 1 + dm,
337c76976d9SMarek Vasut 		    delay);
3385ff825b8SMarek Vasut }
3395ff825b8SMarek Vasut 
3405ff825b8SMarek Vasut /* load up dqs config settings */
3415ff825b8SMarek Vasut static void scc_mgr_load_dqs(uint32_t dqs)
3425ff825b8SMarek Vasut {
3435ff825b8SMarek Vasut 	writel(dqs, &sdr_scc_mgr->dqs_ena);
3445ff825b8SMarek Vasut }
3455ff825b8SMarek Vasut 
3465ff825b8SMarek Vasut /* load up dqs io config settings */
3475ff825b8SMarek Vasut static void scc_mgr_load_dqs_io(void)
3485ff825b8SMarek Vasut {
3495ff825b8SMarek Vasut 	writel(0, &sdr_scc_mgr->dqs_io_ena);
3505ff825b8SMarek Vasut }
3515ff825b8SMarek Vasut 
3525ff825b8SMarek Vasut /* load up dq config settings */
3535ff825b8SMarek Vasut static void scc_mgr_load_dq(uint32_t dq_in_group)
3545ff825b8SMarek Vasut {
3555ff825b8SMarek Vasut 	writel(dq_in_group, &sdr_scc_mgr->dq_ena);
3565ff825b8SMarek Vasut }
3575ff825b8SMarek Vasut 
3585ff825b8SMarek Vasut /* load up dm config settings */
3595ff825b8SMarek Vasut static void scc_mgr_load_dm(uint32_t dm)
3605ff825b8SMarek Vasut {
3615ff825b8SMarek Vasut 	writel(dm, &sdr_scc_mgr->dm_ena);
3625ff825b8SMarek Vasut }
3635ff825b8SMarek Vasut 
3643da42859SDinh Nguyen static void scc_mgr_set_dqs_en_phase_all_ranks(uint32_t read_group,
3653da42859SDinh Nguyen 					       uint32_t phase)
3663da42859SDinh Nguyen {
3673da42859SDinh Nguyen 	uint32_t r;
3683da42859SDinh Nguyen 
3693da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
3703da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
371*162d60efSMarek Vasut 		scc_mgr_set_dqs_en_phase(read_group, phase);
372*162d60efSMarek Vasut 
3733da42859SDinh Nguyen 		/*
3743da42859SDinh Nguyen 		 * USER although the h/w doesn't support different phases per
3753da42859SDinh Nguyen 		 * shadow register, for simplicity our scc manager modeling
3763da42859SDinh Nguyen 		 * keeps different phase settings per shadow reg, and it's
3773da42859SDinh Nguyen 		 * important for us to keep them in sync to match h/w.
3783da42859SDinh Nguyen 		 * for efficiency, the scan chain update should occur only
3793da42859SDinh Nguyen 		 * once to sr0.
3803da42859SDinh Nguyen 		 */
3813da42859SDinh Nguyen 
382*162d60efSMarek Vasut 		if (r == 0) {
3831273dd9eSMarek Vasut 			writel(read_group, &sdr_scc_mgr->dqs_ena);
3841273dd9eSMarek Vasut 			writel(0, &sdr_scc_mgr->update);
3853da42859SDinh Nguyen 		}
3863da42859SDinh Nguyen 	}
3873da42859SDinh Nguyen }
3883da42859SDinh Nguyen 
3893da42859SDinh Nguyen static void scc_mgr_set_dqdqs_output_phase_all_ranks(uint32_t write_group,
3903da42859SDinh Nguyen 						     uint32_t phase)
3913da42859SDinh Nguyen {
3923da42859SDinh Nguyen 	uint32_t r;
3933da42859SDinh Nguyen 
3943da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
3953da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
396*162d60efSMarek Vasut 		scc_mgr_set_dqdqs_output_phase(write_group, phase);
397*162d60efSMarek Vasut 
3983da42859SDinh Nguyen 		/*
3993da42859SDinh Nguyen 		 * USER although the h/w doesn't support different phases per
4003da42859SDinh Nguyen 		 * shadow register, for simplicity our scc manager modeling
4013da42859SDinh Nguyen 		 * keeps different phase settings per shadow reg, and it's
4023da42859SDinh Nguyen 		 * important for us to keep them in sync to match h/w.
4033da42859SDinh Nguyen 		 * for efficiency, the scan chain update should occur only
4043da42859SDinh Nguyen 		 * once to sr0.
4053da42859SDinh Nguyen 		 */
4063da42859SDinh Nguyen 
407*162d60efSMarek Vasut 		if (r == 0) {
4081273dd9eSMarek Vasut 			writel(write_group, &sdr_scc_mgr->dqs_ena);
4091273dd9eSMarek Vasut 			writel(0, &sdr_scc_mgr->update);
4103da42859SDinh Nguyen 		}
4113da42859SDinh Nguyen 	}
4123da42859SDinh Nguyen }
4133da42859SDinh Nguyen 
4143da42859SDinh Nguyen static void scc_mgr_set_dqs_en_delay_all_ranks(uint32_t read_group,
4153da42859SDinh Nguyen 					       uint32_t delay)
4163da42859SDinh Nguyen {
4173da42859SDinh Nguyen 	uint32_t r;
4183da42859SDinh Nguyen 
4193da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
4203da42859SDinh Nguyen 		r += NUM_RANKS_PER_SHADOW_REG) {
4213da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay(read_group, delay);
4223da42859SDinh Nguyen 
4233da42859SDinh Nguyen 		/*
4243da42859SDinh Nguyen 		 * In shadow register mode, the T11 settings are stored in
4253da42859SDinh Nguyen 		 * registers in the core, which are updated by the DQS_ENA
4263da42859SDinh Nguyen 		 * signals. Not issuing the SCC_MGR_UPD command allows us to
4273da42859SDinh Nguyen 		 * save lots of rank switching overhead, by calling
4283da42859SDinh Nguyen 		 * select_shadow_regs_for_update with update_scan_chains
4293da42859SDinh Nguyen 		 * set to 0.
4303da42859SDinh Nguyen 		 */
431*162d60efSMarek Vasut 
432*162d60efSMarek Vasut 		writel(read_group, &sdr_scc_mgr->dqs_ena);
4331273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
4343da42859SDinh Nguyen 	}
4353da42859SDinh Nguyen 	/*
4363da42859SDinh Nguyen 	 * In shadow register mode, the T11 settings are stored in
4373da42859SDinh Nguyen 	 * registers in the core, which are updated by the DQS_ENA
4383da42859SDinh Nguyen 	 * signals. Not issuing the SCC_MGR_UPD command allows us to
4393da42859SDinh Nguyen 	 * save lots of rank switching overhead, by calling
4403da42859SDinh Nguyen 	 * select_shadow_regs_for_update with update_scan_chains
4413da42859SDinh Nguyen 	 * set to 0.
4423da42859SDinh Nguyen 	 */
4431273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
4443da42859SDinh Nguyen }
4453da42859SDinh Nguyen 
4463da42859SDinh Nguyen static void scc_mgr_set_oct_out1_delay(uint32_t write_group, uint32_t delay)
4473da42859SDinh Nguyen {
4483da42859SDinh Nguyen 	uint32_t read_group;
449c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_OCT_OUT1_DELAY_OFFSET;
4503da42859SDinh Nguyen 
4513da42859SDinh Nguyen 	/*
4523da42859SDinh Nguyen 	 * Load the setting in the SCC manager
4533da42859SDinh Nguyen 	 * Although OCT affects only write data, the OCT delay is controlled
4543da42859SDinh Nguyen 	 * by the DQS logic block which is instantiated once per read group.
4553da42859SDinh Nguyen 	 * For protocols where a write group consists of multiple read groups,
4563da42859SDinh Nguyen 	 * the setting must be set multiple times.
4573da42859SDinh Nguyen 	 */
4583da42859SDinh Nguyen 	for (read_group = write_group * RW_MGR_MEM_IF_READ_DQS_WIDTH /
4593da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH;
4603da42859SDinh Nguyen 	     read_group < (write_group + 1) * RW_MGR_MEM_IF_READ_DQS_WIDTH /
4613da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH; ++read_group)
46217fdc916SMarek Vasut 		writel(delay, addr + (read_group << 2));
4633da42859SDinh Nguyen }
4643da42859SDinh Nguyen 
4653da42859SDinh Nguyen static void scc_mgr_set_hhp_extras(void)
4663da42859SDinh Nguyen {
4673da42859SDinh Nguyen 	/*
4683da42859SDinh Nguyen 	 * Load the fixed setting in the SCC manager
4693da42859SDinh Nguyen 	 * bits: 0:0 = 1'b1   - dqs bypass
4703da42859SDinh Nguyen 	 * bits: 1:1 = 1'b1   - dq bypass
4713da42859SDinh Nguyen 	 * bits: 4:2 = 3'b001   - rfifo_mode
4723da42859SDinh Nguyen 	 * bits: 6:5 = 2'b01  - rfifo clock_select
4733da42859SDinh Nguyen 	 * bits: 7:7 = 1'b0  - separate gating from ungating setting
4743da42859SDinh Nguyen 	 * bits: 8:8 = 1'b0  - separate OE from Output delay setting
4753da42859SDinh Nguyen 	 */
4763da42859SDinh Nguyen 	uint32_t value = (0<<8) | (0<<7) | (1<<5) | (1<<2) | (1<<1) | (1<<0);
477c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_HHP_GLOBALS_OFFSET;
4783da42859SDinh Nguyen 
47917fdc916SMarek Vasut 	writel(value, addr + SCC_MGR_HHP_EXTRAS_OFFSET);
4803da42859SDinh Nguyen }
4813da42859SDinh Nguyen 
4823da42859SDinh Nguyen /*
4833da42859SDinh Nguyen  * USER Zero all DQS config
4843da42859SDinh Nguyen  * TODO: maybe rename to scc_mgr_zero_dqs_config (or something)
4853da42859SDinh Nguyen  */
4863da42859SDinh Nguyen static void scc_mgr_zero_all(void)
4873da42859SDinh Nguyen {
4883da42859SDinh Nguyen 	uint32_t i, r;
4893da42859SDinh Nguyen 
4903da42859SDinh Nguyen 	/*
4913da42859SDinh Nguyen 	 * USER Zero all DQS config settings, across all groups and all
4923da42859SDinh Nguyen 	 * shadow registers
4933da42859SDinh Nguyen 	 */
4943da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r +=
4953da42859SDinh Nguyen 	     NUM_RANKS_PER_SHADOW_REG) {
4963da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
4973da42859SDinh Nguyen 			/*
4983da42859SDinh Nguyen 			 * The phases actually don't exist on a per-rank basis,
4993da42859SDinh Nguyen 			 * but there's no harm updating them several times, so
5003da42859SDinh Nguyen 			 * let's keep the code simple.
5013da42859SDinh Nguyen 			 */
5023da42859SDinh Nguyen 			scc_mgr_set_dqs_bus_in_delay(i, IO_DQS_IN_RESERVE);
5033da42859SDinh Nguyen 			scc_mgr_set_dqs_en_phase(i, 0);
5043da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay(i, 0);
5053da42859SDinh Nguyen 		}
5063da42859SDinh Nguyen 
5073da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_WRITE_DQS_WIDTH; i++) {
5083da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, 0);
5093da42859SDinh Nguyen 			/* av/cv don't have out2 */
5103da42859SDinh Nguyen 			scc_mgr_set_oct_out1_delay(i, IO_DQS_OUT_RESERVE);
5113da42859SDinh Nguyen 		}
5123da42859SDinh Nguyen 	}
5133da42859SDinh Nguyen 
5143da42859SDinh Nguyen 	/* multicast to all DQS group enables */
5151273dd9eSMarek Vasut 	writel(0xff, &sdr_scc_mgr->dqs_ena);
5161273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
5173da42859SDinh Nguyen }
5183da42859SDinh Nguyen 
5193da42859SDinh Nguyen static void scc_set_bypass_mode(uint32_t write_group, uint32_t mode)
5203da42859SDinh Nguyen {
5213da42859SDinh Nguyen 	/* mode = 0 : Do NOT bypass - Half Rate Mode */
5223da42859SDinh Nguyen 	/* mode = 1 : Bypass - Full Rate Mode */
5233da42859SDinh Nguyen 
5243da42859SDinh Nguyen 	/* only need to set once for all groups, pins, dq, dqs, dm */
5253da42859SDinh Nguyen 	if (write_group == 0) {
5263da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d Setting HHP Extras\n", __func__,
5273da42859SDinh Nguyen 			   __LINE__);
5283da42859SDinh Nguyen 		scc_mgr_set_hhp_extras();
5293da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d Done Setting HHP Extras\n",
5303da42859SDinh Nguyen 			  __func__, __LINE__);
5313da42859SDinh Nguyen 	}
5323da42859SDinh Nguyen 	/* multicast to all DQ enables */
5331273dd9eSMarek Vasut 	writel(0xff, &sdr_scc_mgr->dq_ena);
5341273dd9eSMarek Vasut 	writel(0xff, &sdr_scc_mgr->dm_ena);
5353da42859SDinh Nguyen 
5363da42859SDinh Nguyen 	/* update current DQS IO enable */
5371273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->dqs_io_ena);
5383da42859SDinh Nguyen 
5393da42859SDinh Nguyen 	/* update the DQS logic */
5401273dd9eSMarek Vasut 	writel(write_group, &sdr_scc_mgr->dqs_ena);
5413da42859SDinh Nguyen 
5423da42859SDinh Nguyen 	/* hit update */
5431273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
5443da42859SDinh Nguyen }
5453da42859SDinh Nguyen 
5465ff825b8SMarek Vasut static void scc_mgr_load_dqs_for_write_group(uint32_t write_group)
5475ff825b8SMarek Vasut {
5485ff825b8SMarek Vasut 	uint32_t read_group;
5495ff825b8SMarek Vasut 	uint32_t addr = (u32)&sdr_scc_mgr->dqs_ena;
5505ff825b8SMarek Vasut 	/*
5515ff825b8SMarek Vasut 	 * Although OCT affects only write data, the OCT delay is controlled
5525ff825b8SMarek Vasut 	 * by the DQS logic block which is instantiated once per read group.
5535ff825b8SMarek Vasut 	 * For protocols where a write group consists of multiple read groups,
5545ff825b8SMarek Vasut 	 * the setting must be scanned multiple times.
5555ff825b8SMarek Vasut 	 */
5565ff825b8SMarek Vasut 	for (read_group = write_group * RW_MGR_MEM_IF_READ_DQS_WIDTH /
5575ff825b8SMarek Vasut 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH;
5585ff825b8SMarek Vasut 	     read_group < (write_group + 1) * RW_MGR_MEM_IF_READ_DQS_WIDTH /
5595ff825b8SMarek Vasut 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH; ++read_group)
5605ff825b8SMarek Vasut 		writel(read_group, addr);
5615ff825b8SMarek Vasut }
5625ff825b8SMarek Vasut 
5633da42859SDinh Nguyen static void scc_mgr_zero_group(uint32_t write_group, uint32_t test_begin,
5643da42859SDinh Nguyen 			       int32_t out_only)
5653da42859SDinh Nguyen {
5663da42859SDinh Nguyen 	uint32_t i, r;
5673da42859SDinh Nguyen 
5683da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r +=
5693da42859SDinh Nguyen 		NUM_RANKS_PER_SHADOW_REG) {
5703da42859SDinh Nguyen 		/* Zero all DQ config settings */
5713da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
57207aee5bdSMarek Vasut 			scc_mgr_set_dq_out1_delay(i, 0);
5733da42859SDinh Nguyen 			if (!out_only)
57407aee5bdSMarek Vasut 				scc_mgr_set_dq_in_delay(i, 0);
5753da42859SDinh Nguyen 		}
5763da42859SDinh Nguyen 
5773da42859SDinh Nguyen 		/* multicast to all DQ enables */
5781273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dq_ena);
5793da42859SDinh Nguyen 
5803da42859SDinh Nguyen 		/* Zero all DM config settings */
5813da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_NUM_DM_PER_WRITE_GROUP; i++) {
58207aee5bdSMarek Vasut 			scc_mgr_set_dm_out1_delay(i, 0);
5833da42859SDinh Nguyen 		}
5843da42859SDinh Nguyen 
5853da42859SDinh Nguyen 		/* multicast to all DM enables */
5861273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dm_ena);
5873da42859SDinh Nguyen 
5883da42859SDinh Nguyen 		/* zero all DQS io settings */
5893da42859SDinh Nguyen 		if (!out_only)
5903da42859SDinh Nguyen 			scc_mgr_set_dqs_io_in_delay(write_group, 0);
5913da42859SDinh Nguyen 		/* av/cv don't have out2 */
5923da42859SDinh Nguyen 		scc_mgr_set_dqs_out1_delay(write_group, IO_DQS_OUT_RESERVE);
5933da42859SDinh Nguyen 		scc_mgr_set_oct_out1_delay(write_group, IO_DQS_OUT_RESERVE);
5943da42859SDinh Nguyen 		scc_mgr_load_dqs_for_write_group(write_group);
5953da42859SDinh Nguyen 
5963da42859SDinh Nguyen 		/* multicast to all DQS IO enables (only 1) */
5971273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->dqs_io_ena);
5983da42859SDinh Nguyen 
5993da42859SDinh Nguyen 		/* hit update to zero everything */
6001273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
6013da42859SDinh Nguyen 	}
6023da42859SDinh Nguyen }
6033da42859SDinh Nguyen 
6043da42859SDinh Nguyen /*
6053da42859SDinh Nguyen  * apply and load a particular input delay for the DQ pins in a group
6063da42859SDinh Nguyen  * group_bgn is the index of the first dq pin (in the write group)
6073da42859SDinh Nguyen  */
6083da42859SDinh Nguyen static void scc_mgr_apply_group_dq_in_delay(uint32_t write_group,
6093da42859SDinh Nguyen 					    uint32_t group_bgn, uint32_t delay)
6103da42859SDinh Nguyen {
6113da42859SDinh Nguyen 	uint32_t i, p;
6123da42859SDinh Nguyen 
6133da42859SDinh Nguyen 	for (i = 0, p = group_bgn; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++, p++) {
61407aee5bdSMarek Vasut 		scc_mgr_set_dq_in_delay(p, delay);
6153da42859SDinh Nguyen 		scc_mgr_load_dq(p);
6163da42859SDinh Nguyen 	}
6173da42859SDinh Nguyen }
6183da42859SDinh Nguyen 
6193da42859SDinh Nguyen /* apply and load a particular output delay for the DQ pins in a group */
6203da42859SDinh Nguyen static void scc_mgr_apply_group_dq_out1_delay(uint32_t write_group,
6213da42859SDinh Nguyen 					      uint32_t group_bgn,
6223da42859SDinh Nguyen 					      uint32_t delay1)
6233da42859SDinh Nguyen {
6243da42859SDinh Nguyen 	uint32_t i, p;
6253da42859SDinh Nguyen 
6263da42859SDinh Nguyen 	for (i = 0, p = group_bgn; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++, p++) {
62707aee5bdSMarek Vasut 		scc_mgr_set_dq_out1_delay(i, delay1);
6283da42859SDinh Nguyen 		scc_mgr_load_dq(i);
6293da42859SDinh Nguyen 	}
6303da42859SDinh Nguyen }
6313da42859SDinh Nguyen 
6323da42859SDinh Nguyen /* apply and load a particular output delay for the DM pins in a group */
6333da42859SDinh Nguyen static void scc_mgr_apply_group_dm_out1_delay(uint32_t write_group,
6343da42859SDinh Nguyen 					      uint32_t delay1)
6353da42859SDinh Nguyen {
6363da42859SDinh Nguyen 	uint32_t i;
6373da42859SDinh Nguyen 
6383da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_NUM_DM_PER_WRITE_GROUP; i++) {
63907aee5bdSMarek Vasut 		scc_mgr_set_dm_out1_delay(i, delay1);
6403da42859SDinh Nguyen 		scc_mgr_load_dm(i);
6413da42859SDinh Nguyen 	}
6423da42859SDinh Nguyen }
6433da42859SDinh Nguyen 
6443da42859SDinh Nguyen 
6453da42859SDinh Nguyen /* apply and load delay on both DQS and OCT out1 */
6463da42859SDinh Nguyen static void scc_mgr_apply_group_dqs_io_and_oct_out1(uint32_t write_group,
6473da42859SDinh Nguyen 						    uint32_t delay)
6483da42859SDinh Nguyen {
6493da42859SDinh Nguyen 	scc_mgr_set_dqs_out1_delay(write_group, delay);
6503da42859SDinh Nguyen 	scc_mgr_load_dqs_io();
6513da42859SDinh Nguyen 
6523da42859SDinh Nguyen 	scc_mgr_set_oct_out1_delay(write_group, delay);
6533da42859SDinh Nguyen 	scc_mgr_load_dqs_for_write_group(write_group);
6543da42859SDinh Nguyen }
6553da42859SDinh Nguyen 
6563da42859SDinh Nguyen /* apply a delay to the entire output side: DQ, DM, DQS, OCT */
6573da42859SDinh Nguyen static void scc_mgr_apply_group_all_out_delay_add(uint32_t write_group,
6583da42859SDinh Nguyen 						  uint32_t group_bgn,
6593da42859SDinh Nguyen 						  uint32_t delay)
6603da42859SDinh Nguyen {
6613da42859SDinh Nguyen 	uint32_t i, p, new_delay;
6623da42859SDinh Nguyen 
6633da42859SDinh Nguyen 	/* dq shift */
6643da42859SDinh Nguyen 	for (i = 0, p = group_bgn; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++, p++) {
6653da42859SDinh Nguyen 		new_delay = READ_SCC_DQ_OUT2_DELAY;
6663da42859SDinh Nguyen 		new_delay += delay;
6673da42859SDinh Nguyen 
6683da42859SDinh Nguyen 		if (new_delay > IO_IO_OUT2_DELAY_MAX) {
6693da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DQ[%u,%u]:\
6703da42859SDinh Nguyen 				   %u > %lu => %lu", __func__, __LINE__,
6713da42859SDinh Nguyen 				   write_group, group_bgn, delay, i, p, new_delay,
6723da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX,
6733da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX);
6743da42859SDinh Nguyen 			new_delay = IO_IO_OUT2_DELAY_MAX;
6753da42859SDinh Nguyen 		}
6763da42859SDinh Nguyen 
6773da42859SDinh Nguyen 		scc_mgr_load_dq(i);
6783da42859SDinh Nguyen 	}
6793da42859SDinh Nguyen 
6803da42859SDinh Nguyen 	/* dm shift */
6813da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_NUM_DM_PER_WRITE_GROUP; i++) {
6823da42859SDinh Nguyen 		new_delay = READ_SCC_DM_IO_OUT2_DELAY;
6833da42859SDinh Nguyen 		new_delay += delay;
6843da42859SDinh Nguyen 
6853da42859SDinh Nguyen 		if (new_delay > IO_IO_OUT2_DELAY_MAX) {
6863da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DM[%u]:\
6873da42859SDinh Nguyen 				   %u > %lu => %lu\n",  __func__, __LINE__,
6883da42859SDinh Nguyen 				   write_group, group_bgn, delay, i, new_delay,
6893da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX,
6903da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX);
6913da42859SDinh Nguyen 			new_delay = IO_IO_OUT2_DELAY_MAX;
6923da42859SDinh Nguyen 		}
6933da42859SDinh Nguyen 
6943da42859SDinh Nguyen 		scc_mgr_load_dm(i);
6953da42859SDinh Nguyen 	}
6963da42859SDinh Nguyen 
6973da42859SDinh Nguyen 	/* dqs shift */
6983da42859SDinh Nguyen 	new_delay = READ_SCC_DQS_IO_OUT2_DELAY;
6993da42859SDinh Nguyen 	new_delay += delay;
7003da42859SDinh Nguyen 
7013da42859SDinh Nguyen 	if (new_delay > IO_IO_OUT2_DELAY_MAX) {
7023da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DQS: %u > %d => %d;"
7033da42859SDinh Nguyen 			   " adding %u to OUT1\n", __func__, __LINE__,
7043da42859SDinh Nguyen 			   write_group, group_bgn, delay, new_delay,
7053da42859SDinh Nguyen 			   IO_IO_OUT2_DELAY_MAX, IO_IO_OUT2_DELAY_MAX,
7063da42859SDinh Nguyen 			   new_delay - IO_IO_OUT2_DELAY_MAX);
7073da42859SDinh Nguyen 		scc_mgr_set_dqs_out1_delay(write_group, new_delay -
7083da42859SDinh Nguyen 					   IO_IO_OUT2_DELAY_MAX);
7093da42859SDinh Nguyen 		new_delay = IO_IO_OUT2_DELAY_MAX;
7103da42859SDinh Nguyen 	}
7113da42859SDinh Nguyen 
7123da42859SDinh Nguyen 	scc_mgr_load_dqs_io();
7133da42859SDinh Nguyen 
7143da42859SDinh Nguyen 	/* oct shift */
7153da42859SDinh Nguyen 	new_delay = READ_SCC_OCT_OUT2_DELAY;
7163da42859SDinh Nguyen 	new_delay += delay;
7173da42859SDinh Nguyen 
7183da42859SDinh Nguyen 	if (new_delay > IO_IO_OUT2_DELAY_MAX) {
7193da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DQS: %u > %d => %d;"
7203da42859SDinh Nguyen 			   " adding %u to OUT1\n", __func__, __LINE__,
7213da42859SDinh Nguyen 			   write_group, group_bgn, delay, new_delay,
7223da42859SDinh Nguyen 			   IO_IO_OUT2_DELAY_MAX, IO_IO_OUT2_DELAY_MAX,
7233da42859SDinh Nguyen 			   new_delay - IO_IO_OUT2_DELAY_MAX);
7243da42859SDinh Nguyen 		scc_mgr_set_oct_out1_delay(write_group, new_delay -
7253da42859SDinh Nguyen 					   IO_IO_OUT2_DELAY_MAX);
7263da42859SDinh Nguyen 		new_delay = IO_IO_OUT2_DELAY_MAX;
7273da42859SDinh Nguyen 	}
7283da42859SDinh Nguyen 
7293da42859SDinh Nguyen 	scc_mgr_load_dqs_for_write_group(write_group);
7303da42859SDinh Nguyen }
7313da42859SDinh Nguyen 
7323da42859SDinh Nguyen /*
7333da42859SDinh Nguyen  * USER apply a delay to the entire output side (DQ, DM, DQS, OCT)
7343da42859SDinh Nguyen  * and to all ranks
7353da42859SDinh Nguyen  */
7363da42859SDinh Nguyen static void scc_mgr_apply_group_all_out_delay_add_all_ranks(
7373da42859SDinh Nguyen 	uint32_t write_group, uint32_t group_bgn, uint32_t delay)
7383da42859SDinh Nguyen {
7393da42859SDinh Nguyen 	uint32_t r;
7403da42859SDinh Nguyen 
7413da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
7423da42859SDinh Nguyen 		r += NUM_RANKS_PER_SHADOW_REG) {
7433da42859SDinh Nguyen 		scc_mgr_apply_group_all_out_delay_add(write_group,
7443da42859SDinh Nguyen 						      group_bgn, delay);
7451273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
7463da42859SDinh Nguyen 	}
7473da42859SDinh Nguyen }
7483da42859SDinh Nguyen 
7493da42859SDinh Nguyen /* optimization used to recover some slots in ddr3 inst_rom */
7503da42859SDinh Nguyen /* could be applied to other protocols if we wanted to */
7513da42859SDinh Nguyen static void set_jump_as_return(void)
7523da42859SDinh Nguyen {
7533da42859SDinh Nguyen 	/*
7543da42859SDinh Nguyen 	 * to save space, we replace return with jump to special shared
7553da42859SDinh Nguyen 	 * RETURN instruction so we set the counter to large value so that
7563da42859SDinh Nguyen 	 * we always jump
7573da42859SDinh Nguyen 	 */
7581273dd9eSMarek Vasut 	writel(0xff, &sdr_rw_load_mgr_regs->load_cntr0);
7591273dd9eSMarek Vasut 	writel(RW_MGR_RETURN, &sdr_rw_load_jump_mgr_regs->load_jump_add0);
7603da42859SDinh Nguyen }
7613da42859SDinh Nguyen 
7623da42859SDinh Nguyen /*
7633da42859SDinh Nguyen  * should always use constants as argument to ensure all computations are
7643da42859SDinh Nguyen  * performed at compile time
7653da42859SDinh Nguyen  */
7663da42859SDinh Nguyen static void delay_for_n_mem_clocks(const uint32_t clocks)
7673da42859SDinh Nguyen {
7683da42859SDinh Nguyen 	uint32_t afi_clocks;
7693da42859SDinh Nguyen 	uint8_t inner = 0;
7703da42859SDinh Nguyen 	uint8_t outer = 0;
7713da42859SDinh Nguyen 	uint16_t c_loop = 0;
7723da42859SDinh Nguyen 
7733da42859SDinh Nguyen 	debug("%s:%d: clocks=%u ... start\n", __func__, __LINE__, clocks);
7743da42859SDinh Nguyen 
7753da42859SDinh Nguyen 
7763da42859SDinh Nguyen 	afi_clocks = (clocks + AFI_RATE_RATIO-1) / AFI_RATE_RATIO;
7773da42859SDinh Nguyen 	/* scale (rounding up) to get afi clocks */
7783da42859SDinh Nguyen 
7793da42859SDinh Nguyen 	/*
7803da42859SDinh Nguyen 	 * Note, we don't bother accounting for being off a little bit
7813da42859SDinh Nguyen 	 * because of a few extra instructions in outer loops
7823da42859SDinh Nguyen 	 * Note, the loops have a test at the end, and do the test before
7833da42859SDinh Nguyen 	 * the decrement, and so always perform the loop
7843da42859SDinh Nguyen 	 * 1 time more than the counter value
7853da42859SDinh Nguyen 	 */
7863da42859SDinh Nguyen 	if (afi_clocks == 0) {
7873da42859SDinh Nguyen 		;
7883da42859SDinh Nguyen 	} else if (afi_clocks <= 0x100) {
7893da42859SDinh Nguyen 		inner = afi_clocks-1;
7903da42859SDinh Nguyen 		outer = 0;
7913da42859SDinh Nguyen 		c_loop = 0;
7923da42859SDinh Nguyen 	} else if (afi_clocks <= 0x10000) {
7933da42859SDinh Nguyen 		inner = 0xff;
7943da42859SDinh Nguyen 		outer = (afi_clocks-1) >> 8;
7953da42859SDinh Nguyen 		c_loop = 0;
7963da42859SDinh Nguyen 	} else {
7973da42859SDinh Nguyen 		inner = 0xff;
7983da42859SDinh Nguyen 		outer = 0xff;
7993da42859SDinh Nguyen 		c_loop = (afi_clocks-1) >> 16;
8003da42859SDinh Nguyen 	}
8013da42859SDinh Nguyen 
8023da42859SDinh Nguyen 	/*
8033da42859SDinh Nguyen 	 * rom instructions are structured as follows:
8043da42859SDinh Nguyen 	 *
8053da42859SDinh Nguyen 	 *    IDLE_LOOP2: jnz cntr0, TARGET_A
8063da42859SDinh Nguyen 	 *    IDLE_LOOP1: jnz cntr1, TARGET_B
8073da42859SDinh Nguyen 	 *                return
8083da42859SDinh Nguyen 	 *
8093da42859SDinh Nguyen 	 * so, when doing nested loops, TARGET_A is set to IDLE_LOOP2, and
8103da42859SDinh Nguyen 	 * TARGET_B is set to IDLE_LOOP2 as well
8113da42859SDinh Nguyen 	 *
8123da42859SDinh Nguyen 	 * if we have no outer loop, though, then we can use IDLE_LOOP1 only,
8133da42859SDinh Nguyen 	 * and set TARGET_B to IDLE_LOOP1 and we skip IDLE_LOOP2 entirely
8143da42859SDinh Nguyen 	 *
8153da42859SDinh Nguyen 	 * a little confusing, but it helps save precious space in the inst_rom
8163da42859SDinh Nguyen 	 * and sequencer rom and keeps the delays more accurate and reduces
8173da42859SDinh Nguyen 	 * overhead
8183da42859SDinh Nguyen 	 */
8193da42859SDinh Nguyen 	if (afi_clocks <= 0x100) {
8201273dd9eSMarek Vasut 		writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(inner),
8211273dd9eSMarek Vasut 			&sdr_rw_load_mgr_regs->load_cntr1);
8223da42859SDinh Nguyen 
8231273dd9eSMarek Vasut 		writel(RW_MGR_IDLE_LOOP1,
8241273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
8253da42859SDinh Nguyen 
8261273dd9eSMarek Vasut 		writel(RW_MGR_IDLE_LOOP1, SDR_PHYGRP_RWMGRGRP_ADDRESS |
8271273dd9eSMarek Vasut 					  RW_MGR_RUN_SINGLE_GROUP_OFFSET);
8283da42859SDinh Nguyen 	} else {
8291273dd9eSMarek Vasut 		writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(inner),
8301273dd9eSMarek Vasut 			&sdr_rw_load_mgr_regs->load_cntr0);
8313da42859SDinh Nguyen 
8321273dd9eSMarek Vasut 		writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(outer),
8331273dd9eSMarek Vasut 			&sdr_rw_load_mgr_regs->load_cntr1);
8343da42859SDinh Nguyen 
8351273dd9eSMarek Vasut 		writel(RW_MGR_IDLE_LOOP2,
8361273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
8373da42859SDinh Nguyen 
8381273dd9eSMarek Vasut 		writel(RW_MGR_IDLE_LOOP2,
8391273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
8403da42859SDinh Nguyen 
8413da42859SDinh Nguyen 		/* hack to get around compiler not being smart enough */
8423da42859SDinh Nguyen 		if (afi_clocks <= 0x10000) {
8433da42859SDinh Nguyen 			/* only need to run once */
8441273dd9eSMarek Vasut 			writel(RW_MGR_IDLE_LOOP2, SDR_PHYGRP_RWMGRGRP_ADDRESS |
8451273dd9eSMarek Vasut 						  RW_MGR_RUN_SINGLE_GROUP_OFFSET);
8463da42859SDinh Nguyen 		} else {
8473da42859SDinh Nguyen 			do {
8481273dd9eSMarek Vasut 				writel(RW_MGR_IDLE_LOOP2,
8491273dd9eSMarek Vasut 					SDR_PHYGRP_RWMGRGRP_ADDRESS |
8501273dd9eSMarek Vasut 					RW_MGR_RUN_SINGLE_GROUP_OFFSET);
8513da42859SDinh Nguyen 			} while (c_loop-- != 0);
8523da42859SDinh Nguyen 		}
8533da42859SDinh Nguyen 	}
8543da42859SDinh Nguyen 	debug("%s:%d clocks=%u ... end\n", __func__, __LINE__, clocks);
8553da42859SDinh Nguyen }
8563da42859SDinh Nguyen 
8573da42859SDinh Nguyen static void rw_mgr_mem_initialize(void)
8583da42859SDinh Nguyen {
8593da42859SDinh Nguyen 	uint32_t r;
8601273dd9eSMarek Vasut 	uint32_t grpaddr = SDR_PHYGRP_RWMGRGRP_ADDRESS |
8611273dd9eSMarek Vasut 			   RW_MGR_RUN_SINGLE_GROUP_OFFSET;
8623da42859SDinh Nguyen 
8633da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
8643da42859SDinh Nguyen 
8653da42859SDinh Nguyen 	/* The reset / cke part of initialization is broadcasted to all ranks */
8661273dd9eSMarek Vasut 	writel(RW_MGR_RANK_ALL, SDR_PHYGRP_RWMGRGRP_ADDRESS |
8671273dd9eSMarek Vasut 				RW_MGR_SET_CS_AND_ODT_MASK_OFFSET);
8683da42859SDinh Nguyen 
8693da42859SDinh Nguyen 	/*
8703da42859SDinh Nguyen 	 * Here's how you load register for a loop
8713da42859SDinh Nguyen 	 * Counters are located @ 0x800
8723da42859SDinh Nguyen 	 * Jump address are located @ 0xC00
8733da42859SDinh Nguyen 	 * For both, registers 0 to 3 are selected using bits 3 and 2, like
8743da42859SDinh Nguyen 	 * in 0x800, 0x804, 0x808, 0x80C and 0xC00, 0xC04, 0xC08, 0xC0C
8753da42859SDinh Nguyen 	 * I know this ain't pretty, but Avalon bus throws away the 2 least
8763da42859SDinh Nguyen 	 * significant bits
8773da42859SDinh Nguyen 	 */
8783da42859SDinh Nguyen 
8793da42859SDinh Nguyen 	/* start with memory RESET activated */
8803da42859SDinh Nguyen 
8813da42859SDinh Nguyen 	/* tINIT = 200us */
8823da42859SDinh Nguyen 
8833da42859SDinh Nguyen 	/*
8843da42859SDinh Nguyen 	 * 200us @ 266MHz (3.75 ns) ~ 54000 clock cycles
8853da42859SDinh Nguyen 	 * If a and b are the number of iteration in 2 nested loops
8863da42859SDinh Nguyen 	 * it takes the following number of cycles to complete the operation:
8873da42859SDinh Nguyen 	 * number_of_cycles = ((2 + n) * a + 2) * b
8883da42859SDinh Nguyen 	 * where n is the number of instruction in the inner loop
8893da42859SDinh Nguyen 	 * One possible solution is n = 0 , a = 256 , b = 106 => a = FF,
8903da42859SDinh Nguyen 	 * b = 6A
8913da42859SDinh Nguyen 	 */
8923da42859SDinh Nguyen 
8933da42859SDinh Nguyen 	/* Load counters */
8943da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TINIT_CNTR0_VAL),
8951273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr0);
8963da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TINIT_CNTR1_VAL),
8971273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr1);
8983da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TINIT_CNTR2_VAL),
8991273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr2);
9003da42859SDinh Nguyen 
9013da42859SDinh Nguyen 	/* Load jump address */
9021273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_0_CKE_0,
9031273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add0);
9041273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_0_CKE_0,
9051273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add1);
9061273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_0_CKE_0,
9071273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add2);
9083da42859SDinh Nguyen 
9093da42859SDinh Nguyen 	/* Execute count instruction */
9101273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_0_CKE_0, grpaddr);
9113da42859SDinh Nguyen 
9123da42859SDinh Nguyen 	/* indicate that memory is stable */
9131273dd9eSMarek Vasut 	writel(1, &phy_mgr_cfg->reset_mem_stbl);
9143da42859SDinh Nguyen 
9153da42859SDinh Nguyen 	/*
9163da42859SDinh Nguyen 	 * transition the RESET to high
9173da42859SDinh Nguyen 	 * Wait for 500us
9183da42859SDinh Nguyen 	 */
9193da42859SDinh Nguyen 
9203da42859SDinh Nguyen 	/*
9213da42859SDinh Nguyen 	 * 500us @ 266MHz (3.75 ns) ~ 134000 clock cycles
9223da42859SDinh Nguyen 	 * If a and b are the number of iteration in 2 nested loops
9233da42859SDinh Nguyen 	 * it takes the following number of cycles to complete the operation
9243da42859SDinh Nguyen 	 * number_of_cycles = ((2 + n) * a + 2) * b
9253da42859SDinh Nguyen 	 * where n is the number of instruction in the inner loop
9263da42859SDinh Nguyen 	 * One possible solution is n = 2 , a = 131 , b = 256 => a = 83,
9273da42859SDinh Nguyen 	 * b = FF
9283da42859SDinh Nguyen 	 */
9293da42859SDinh Nguyen 
9303da42859SDinh Nguyen 	/* Load counters */
9313da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TRESET_CNTR0_VAL),
9321273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr0);
9333da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TRESET_CNTR1_VAL),
9341273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr1);
9353da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TRESET_CNTR2_VAL),
9361273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr2);
9373da42859SDinh Nguyen 
9383da42859SDinh Nguyen 	/* Load jump address */
9391273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_1_CKE_0,
9401273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add0);
9411273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_1_CKE_0,
9421273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add1);
9431273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_1_CKE_0,
9441273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add2);
9453da42859SDinh Nguyen 
9461273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_1_CKE_0, grpaddr);
9473da42859SDinh Nguyen 
9483da42859SDinh Nguyen 	/* bring up clock enable */
9493da42859SDinh Nguyen 
9503da42859SDinh Nguyen 	/* tXRP < 250 ck cycles */
9513da42859SDinh Nguyen 	delay_for_n_mem_clocks(250);
9523da42859SDinh Nguyen 
9533da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r++) {
9543da42859SDinh Nguyen 		if (param->skip_ranks[r]) {
9553da42859SDinh Nguyen 			/* request to skip the rank */
9563da42859SDinh Nguyen 			continue;
9573da42859SDinh Nguyen 		}
9583da42859SDinh Nguyen 
9593da42859SDinh Nguyen 		/* set rank */
9603da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_OFF);
9613da42859SDinh Nguyen 
9623da42859SDinh Nguyen 		/*
9633da42859SDinh Nguyen 		 * USER Use Mirror-ed commands for odd ranks if address
9643da42859SDinh Nguyen 		 * mirrorring is on
9653da42859SDinh Nguyen 		 */
9663da42859SDinh Nguyen 		if ((RW_MGR_MEM_ADDRESS_MIRRORING >> r) & 0x1) {
9673da42859SDinh Nguyen 			set_jump_as_return();
9681273dd9eSMarek Vasut 			writel(RW_MGR_MRS2_MIRR, grpaddr);
9693da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
9703da42859SDinh Nguyen 			set_jump_as_return();
9711273dd9eSMarek Vasut 			writel(RW_MGR_MRS3_MIRR, grpaddr);
9723da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
9733da42859SDinh Nguyen 			set_jump_as_return();
9741273dd9eSMarek Vasut 			writel(RW_MGR_MRS1_MIRR, grpaddr);
9753da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
9763da42859SDinh Nguyen 			set_jump_as_return();
9771273dd9eSMarek Vasut 			writel(RW_MGR_MRS0_DLL_RESET_MIRR, grpaddr);
9783da42859SDinh Nguyen 		} else {
9793da42859SDinh Nguyen 			set_jump_as_return();
9801273dd9eSMarek Vasut 			writel(RW_MGR_MRS2, grpaddr);
9813da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
9823da42859SDinh Nguyen 			set_jump_as_return();
9831273dd9eSMarek Vasut 			writel(RW_MGR_MRS3, grpaddr);
9843da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
9853da42859SDinh Nguyen 			set_jump_as_return();
9861273dd9eSMarek Vasut 			writel(RW_MGR_MRS1, grpaddr);
9873da42859SDinh Nguyen 			set_jump_as_return();
9881273dd9eSMarek Vasut 			writel(RW_MGR_MRS0_DLL_RESET, grpaddr);
9893da42859SDinh Nguyen 		}
9903da42859SDinh Nguyen 		set_jump_as_return();
9911273dd9eSMarek Vasut 		writel(RW_MGR_ZQCL, grpaddr);
9923da42859SDinh Nguyen 
9933da42859SDinh Nguyen 		/* tZQinit = tDLLK = 512 ck cycles */
9943da42859SDinh Nguyen 		delay_for_n_mem_clocks(512);
9953da42859SDinh Nguyen 	}
9963da42859SDinh Nguyen }
9973da42859SDinh Nguyen 
9983da42859SDinh Nguyen /*
9993da42859SDinh Nguyen  * At the end of calibration we have to program the user settings in, and
10003da42859SDinh Nguyen  * USER  hand off the memory to the user.
10013da42859SDinh Nguyen  */
10023da42859SDinh Nguyen static void rw_mgr_mem_handoff(void)
10033da42859SDinh Nguyen {
10043da42859SDinh Nguyen 	uint32_t r;
10051273dd9eSMarek Vasut 	uint32_t grpaddr = SDR_PHYGRP_RWMGRGRP_ADDRESS |
10061273dd9eSMarek Vasut 			   RW_MGR_RUN_SINGLE_GROUP_OFFSET;
10073da42859SDinh Nguyen 
10083da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
10093da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r++) {
10103da42859SDinh Nguyen 		if (param->skip_ranks[r])
10113da42859SDinh Nguyen 			/* request to skip the rank */
10123da42859SDinh Nguyen 			continue;
10133da42859SDinh Nguyen 		/* set rank */
10143da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_OFF);
10153da42859SDinh Nguyen 
10163da42859SDinh Nguyen 		/* precharge all banks ... */
10171273dd9eSMarek Vasut 		writel(RW_MGR_PRECHARGE_ALL, grpaddr);
10183da42859SDinh Nguyen 
10193da42859SDinh Nguyen 		/* load up MR settings specified by user */
10203da42859SDinh Nguyen 
10213da42859SDinh Nguyen 		/*
10223da42859SDinh Nguyen 		 * Use Mirror-ed commands for odd ranks if address
10233da42859SDinh Nguyen 		 * mirrorring is on
10243da42859SDinh Nguyen 		 */
10253da42859SDinh Nguyen 		if ((RW_MGR_MEM_ADDRESS_MIRRORING >> r) & 0x1) {
10263da42859SDinh Nguyen 			set_jump_as_return();
10271273dd9eSMarek Vasut 			writel(RW_MGR_MRS2_MIRR, grpaddr);
10283da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10293da42859SDinh Nguyen 			set_jump_as_return();
10301273dd9eSMarek Vasut 			writel(RW_MGR_MRS3_MIRR, grpaddr);
10313da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10323da42859SDinh Nguyen 			set_jump_as_return();
10331273dd9eSMarek Vasut 			writel(RW_MGR_MRS1_MIRR, grpaddr);
10343da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10353da42859SDinh Nguyen 			set_jump_as_return();
10361273dd9eSMarek Vasut 			writel(RW_MGR_MRS0_USER_MIRR, grpaddr);
10373da42859SDinh Nguyen 		} else {
10383da42859SDinh Nguyen 			set_jump_as_return();
10391273dd9eSMarek Vasut 			writel(RW_MGR_MRS2, grpaddr);
10403da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10413da42859SDinh Nguyen 			set_jump_as_return();
10421273dd9eSMarek Vasut 			writel(RW_MGR_MRS3, grpaddr);
10433da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10443da42859SDinh Nguyen 			set_jump_as_return();
10451273dd9eSMarek Vasut 			writel(RW_MGR_MRS1, grpaddr);
10463da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10473da42859SDinh Nguyen 			set_jump_as_return();
10481273dd9eSMarek Vasut 			writel(RW_MGR_MRS0_USER, grpaddr);
10493da42859SDinh Nguyen 		}
10503da42859SDinh Nguyen 		/*
10513da42859SDinh Nguyen 		 * USER  need to wait tMOD (12CK or 15ns) time before issuing
10523da42859SDinh Nguyen 		 * other commands, but we will have plenty of NIOS cycles before
10533da42859SDinh Nguyen 		 * actual handoff so its okay.
10543da42859SDinh Nguyen 		 */
10553da42859SDinh Nguyen 	}
10563da42859SDinh Nguyen }
10573da42859SDinh Nguyen 
10583da42859SDinh Nguyen /*
10593da42859SDinh Nguyen  * performs a guaranteed read on the patterns we are going to use during a
10603da42859SDinh Nguyen  * read test to ensure memory works
10613da42859SDinh Nguyen  */
10623da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test_patterns(uint32_t rank_bgn,
10633da42859SDinh Nguyen 	uint32_t group, uint32_t num_tries, uint32_t *bit_chk,
10643da42859SDinh Nguyen 	uint32_t all_ranks)
10653da42859SDinh Nguyen {
10663da42859SDinh Nguyen 	uint32_t r, vg;
10673da42859SDinh Nguyen 	uint32_t correct_mask_vg;
10683da42859SDinh Nguyen 	uint32_t tmp_bit_chk;
10693da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
10703da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
10713da42859SDinh Nguyen 	uint32_t addr;
10723da42859SDinh Nguyen 	uint32_t base_rw_mgr;
10733da42859SDinh Nguyen 
10743da42859SDinh Nguyen 	*bit_chk = param->read_correct_mask;
10753da42859SDinh Nguyen 	correct_mask_vg = param->read_correct_mask_vg;
10763da42859SDinh Nguyen 
10773da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
10783da42859SDinh Nguyen 		if (param->skip_ranks[r])
10793da42859SDinh Nguyen 			/* request to skip the rank */
10803da42859SDinh Nguyen 			continue;
10813da42859SDinh Nguyen 
10823da42859SDinh Nguyen 		/* set rank */
10833da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
10843da42859SDinh Nguyen 
10853da42859SDinh Nguyen 		/* Load up a constant bursts of read commands */
10861273dd9eSMarek Vasut 		writel(0x20, &sdr_rw_load_mgr_regs->load_cntr0);
10871273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_READ,
10881273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
10893da42859SDinh Nguyen 
10901273dd9eSMarek Vasut 		writel(0x20, &sdr_rw_load_mgr_regs->load_cntr1);
10911273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_READ_CONT,
10921273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
10933da42859SDinh Nguyen 
10943da42859SDinh Nguyen 		tmp_bit_chk = 0;
10953da42859SDinh Nguyen 		for (vg = RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS-1; ; vg--) {
10963da42859SDinh Nguyen 			/* reset the fifos to get pointers to known state */
10973da42859SDinh Nguyen 
10981273dd9eSMarek Vasut 			writel(0, &phy_mgr_cmd->fifo_reset);
10991273dd9eSMarek Vasut 			writel(0, SDR_PHYGRP_RWMGRGRP_ADDRESS |
11001273dd9eSMarek Vasut 				  RW_MGR_RESET_READ_DATAPATH_OFFSET);
11013da42859SDinh Nguyen 
11023da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk << (RW_MGR_MEM_DQ_PER_READ_DQS
11033da42859SDinh Nguyen 				/ RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS);
11043da42859SDinh Nguyen 
1105c4815f76SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
110617fdc916SMarek Vasut 			writel(RW_MGR_GUARANTEED_READ, addr +
11073da42859SDinh Nguyen 			       ((group * RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS +
11083da42859SDinh Nguyen 				vg) << 2));
11093da42859SDinh Nguyen 
11101273dd9eSMarek Vasut 			base_rw_mgr = readl(SDR_PHYGRP_RWMGRGRP_ADDRESS);
11113da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk | (correct_mask_vg & (~base_rw_mgr));
11123da42859SDinh Nguyen 
11133da42859SDinh Nguyen 			if (vg == 0)
11143da42859SDinh Nguyen 				break;
11153da42859SDinh Nguyen 		}
11163da42859SDinh Nguyen 		*bit_chk &= tmp_bit_chk;
11173da42859SDinh Nguyen 	}
11183da42859SDinh Nguyen 
1119c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
112017fdc916SMarek Vasut 	writel(RW_MGR_CLEAR_DQS_ENABLE, addr + (group << 2));
11213da42859SDinh Nguyen 
11223da42859SDinh Nguyen 	set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
11233da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d test_load_patterns(%u,ALL) => (%u == %u) =>\
11243da42859SDinh Nguyen 		   %lu\n", __func__, __LINE__, group, *bit_chk, param->read_correct_mask,
11253da42859SDinh Nguyen 		   (long unsigned int)(*bit_chk == param->read_correct_mask));
11263da42859SDinh Nguyen 	return *bit_chk == param->read_correct_mask;
11273da42859SDinh Nguyen }
11283da42859SDinh Nguyen 
11293da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test_patterns_all_ranks
11303da42859SDinh Nguyen 	(uint32_t group, uint32_t num_tries, uint32_t *bit_chk)
11313da42859SDinh Nguyen {
11323da42859SDinh Nguyen 	return rw_mgr_mem_calibrate_read_test_patterns(0, group,
11333da42859SDinh Nguyen 		num_tries, bit_chk, 1);
11343da42859SDinh Nguyen }
11353da42859SDinh Nguyen 
11363da42859SDinh Nguyen /* load up the patterns we are going to use during a read test */
11373da42859SDinh Nguyen static void rw_mgr_mem_calibrate_read_load_patterns(uint32_t rank_bgn,
11383da42859SDinh Nguyen 	uint32_t all_ranks)
11393da42859SDinh Nguyen {
11403da42859SDinh Nguyen 	uint32_t r;
11413da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
11423da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
11433da42859SDinh Nguyen 
11443da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
11453da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
11463da42859SDinh Nguyen 		if (param->skip_ranks[r])
11473da42859SDinh Nguyen 			/* request to skip the rank */
11483da42859SDinh Nguyen 			continue;
11493da42859SDinh Nguyen 
11503da42859SDinh Nguyen 		/* set rank */
11513da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
11523da42859SDinh Nguyen 
11533da42859SDinh Nguyen 		/* Load up a constant bursts */
11541273dd9eSMarek Vasut 		writel(0x20, &sdr_rw_load_mgr_regs->load_cntr0);
11553da42859SDinh Nguyen 
11561273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE_WAIT0,
11571273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
11583da42859SDinh Nguyen 
11591273dd9eSMarek Vasut 		writel(0x20, &sdr_rw_load_mgr_regs->load_cntr1);
11603da42859SDinh Nguyen 
11611273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE_WAIT1,
11621273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
11633da42859SDinh Nguyen 
11641273dd9eSMarek Vasut 		writel(0x04, &sdr_rw_load_mgr_regs->load_cntr2);
11653da42859SDinh Nguyen 
11661273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE_WAIT2,
11671273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add2);
11683da42859SDinh Nguyen 
11691273dd9eSMarek Vasut 		writel(0x04, &sdr_rw_load_mgr_regs->load_cntr3);
11703da42859SDinh Nguyen 
11711273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE_WAIT3,
11721273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add3);
11733da42859SDinh Nguyen 
11741273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE, SDR_PHYGRP_RWMGRGRP_ADDRESS |
11751273dd9eSMarek Vasut 						RW_MGR_RUN_SINGLE_GROUP_OFFSET);
11763da42859SDinh Nguyen 	}
11773da42859SDinh Nguyen 
11783da42859SDinh Nguyen 	set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
11793da42859SDinh Nguyen }
11803da42859SDinh Nguyen 
11813da42859SDinh Nguyen /*
11823da42859SDinh Nguyen  * try a read and see if it returns correct data back. has dummy reads
11833da42859SDinh Nguyen  * inserted into the mix used to align dqs enable. has more thorough checks
11843da42859SDinh Nguyen  * than the regular read test.
11853da42859SDinh Nguyen  */
11863da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test(uint32_t rank_bgn, uint32_t group,
11873da42859SDinh Nguyen 	uint32_t num_tries, uint32_t all_correct, uint32_t *bit_chk,
11883da42859SDinh Nguyen 	uint32_t all_groups, uint32_t all_ranks)
11893da42859SDinh Nguyen {
11903da42859SDinh Nguyen 	uint32_t r, vg;
11913da42859SDinh Nguyen 	uint32_t correct_mask_vg;
11923da42859SDinh Nguyen 	uint32_t tmp_bit_chk;
11933da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
11943da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
11953da42859SDinh Nguyen 	uint32_t addr;
11963da42859SDinh Nguyen 	uint32_t base_rw_mgr;
11973da42859SDinh Nguyen 
11983da42859SDinh Nguyen 	*bit_chk = param->read_correct_mask;
11993da42859SDinh Nguyen 	correct_mask_vg = param->read_correct_mask_vg;
12003da42859SDinh Nguyen 
12013da42859SDinh Nguyen 	uint32_t quick_read_mode = (((STATIC_CALIB_STEPS) &
12023da42859SDinh Nguyen 		CALIB_SKIP_DELAY_SWEEPS) && ENABLE_SUPER_QUICK_CALIBRATION);
12033da42859SDinh Nguyen 
12043da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
12053da42859SDinh Nguyen 		if (param->skip_ranks[r])
12063da42859SDinh Nguyen 			/* request to skip the rank */
12073da42859SDinh Nguyen 			continue;
12083da42859SDinh Nguyen 
12093da42859SDinh Nguyen 		/* set rank */
12103da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
12113da42859SDinh Nguyen 
12121273dd9eSMarek Vasut 		writel(0x10, &sdr_rw_load_mgr_regs->load_cntr1);
12133da42859SDinh Nguyen 
12141273dd9eSMarek Vasut 		writel(RW_MGR_READ_B2B_WAIT1,
12151273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
12163da42859SDinh Nguyen 
12171273dd9eSMarek Vasut 		writel(0x10, &sdr_rw_load_mgr_regs->load_cntr2);
12181273dd9eSMarek Vasut 		writel(RW_MGR_READ_B2B_WAIT2,
12191273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add2);
12203da42859SDinh Nguyen 
12213da42859SDinh Nguyen 		if (quick_read_mode)
12221273dd9eSMarek Vasut 			writel(0x1, &sdr_rw_load_mgr_regs->load_cntr0);
12233da42859SDinh Nguyen 			/* need at least two (1+1) reads to capture failures */
12243da42859SDinh Nguyen 		else if (all_groups)
12251273dd9eSMarek Vasut 			writel(0x06, &sdr_rw_load_mgr_regs->load_cntr0);
12263da42859SDinh Nguyen 		else
12271273dd9eSMarek Vasut 			writel(0x32, &sdr_rw_load_mgr_regs->load_cntr0);
12283da42859SDinh Nguyen 
12291273dd9eSMarek Vasut 		writel(RW_MGR_READ_B2B,
12301273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
12313da42859SDinh Nguyen 		if (all_groups)
12323da42859SDinh Nguyen 			writel(RW_MGR_MEM_IF_READ_DQS_WIDTH *
12333da42859SDinh Nguyen 			       RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS - 1,
12341273dd9eSMarek Vasut 			       &sdr_rw_load_mgr_regs->load_cntr3);
12353da42859SDinh Nguyen 		else
12361273dd9eSMarek Vasut 			writel(0x0, &sdr_rw_load_mgr_regs->load_cntr3);
12373da42859SDinh Nguyen 
12381273dd9eSMarek Vasut 		writel(RW_MGR_READ_B2B,
12391273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add3);
12403da42859SDinh Nguyen 
12413da42859SDinh Nguyen 		tmp_bit_chk = 0;
12423da42859SDinh Nguyen 		for (vg = RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS-1; ; vg--) {
12433da42859SDinh Nguyen 			/* reset the fifos to get pointers to known state */
12441273dd9eSMarek Vasut 			writel(0, &phy_mgr_cmd->fifo_reset);
12451273dd9eSMarek Vasut 			writel(0, SDR_PHYGRP_RWMGRGRP_ADDRESS |
12461273dd9eSMarek Vasut 				  RW_MGR_RESET_READ_DATAPATH_OFFSET);
12473da42859SDinh Nguyen 
12483da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk << (RW_MGR_MEM_DQ_PER_READ_DQS
12493da42859SDinh Nguyen 				/ RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS);
12503da42859SDinh Nguyen 
1251c4815f76SMarek Vasut 			if (all_groups)
1252c4815f76SMarek Vasut 				addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_ALL_GROUPS_OFFSET;
1253c4815f76SMarek Vasut 			else
1254c4815f76SMarek Vasut 				addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
1255c4815f76SMarek Vasut 
125617fdc916SMarek Vasut 			writel(RW_MGR_READ_B2B, addr +
12573da42859SDinh Nguyen 			       ((group * RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS +
12583da42859SDinh Nguyen 			       vg) << 2));
12593da42859SDinh Nguyen 
12601273dd9eSMarek Vasut 			base_rw_mgr = readl(SDR_PHYGRP_RWMGRGRP_ADDRESS);
12613da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk | (correct_mask_vg & ~(base_rw_mgr));
12623da42859SDinh Nguyen 
12633da42859SDinh Nguyen 			if (vg == 0)
12643da42859SDinh Nguyen 				break;
12653da42859SDinh Nguyen 		}
12663da42859SDinh Nguyen 		*bit_chk &= tmp_bit_chk;
12673da42859SDinh Nguyen 	}
12683da42859SDinh Nguyen 
1269c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
127017fdc916SMarek Vasut 	writel(RW_MGR_CLEAR_DQS_ENABLE, addr + (group << 2));
12713da42859SDinh Nguyen 
12723da42859SDinh Nguyen 	if (all_correct) {
12733da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
12743da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d read_test(%u,ALL,%u) =>\
12753da42859SDinh Nguyen 			   (%u == %u) => %lu", __func__, __LINE__, group,
12763da42859SDinh Nguyen 			   all_groups, *bit_chk, param->read_correct_mask,
12773da42859SDinh Nguyen 			   (long unsigned int)(*bit_chk ==
12783da42859SDinh Nguyen 			   param->read_correct_mask));
12793da42859SDinh Nguyen 		return *bit_chk == param->read_correct_mask;
12803da42859SDinh Nguyen 	} else	{
12813da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
12823da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d read_test(%u,ONE,%u) =>\
12833da42859SDinh Nguyen 			   (%u != %lu) => %lu\n", __func__, __LINE__,
12843da42859SDinh Nguyen 			   group, all_groups, *bit_chk, (long unsigned int)0,
12853da42859SDinh Nguyen 			   (long unsigned int)(*bit_chk != 0x00));
12863da42859SDinh Nguyen 		return *bit_chk != 0x00;
12873da42859SDinh Nguyen 	}
12883da42859SDinh Nguyen }
12893da42859SDinh Nguyen 
12903da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test_all_ranks(uint32_t group,
12913da42859SDinh Nguyen 	uint32_t num_tries, uint32_t all_correct, uint32_t *bit_chk,
12923da42859SDinh Nguyen 	uint32_t all_groups)
12933da42859SDinh Nguyen {
12943da42859SDinh Nguyen 	return rw_mgr_mem_calibrate_read_test(0, group, num_tries, all_correct,
12953da42859SDinh Nguyen 					      bit_chk, all_groups, 1);
12963da42859SDinh Nguyen }
12973da42859SDinh Nguyen 
12983da42859SDinh Nguyen static void rw_mgr_incr_vfifo(uint32_t grp, uint32_t *v)
12993da42859SDinh Nguyen {
13001273dd9eSMarek Vasut 	writel(grp, &phy_mgr_cmd->inc_vfifo_hard_phy);
13013da42859SDinh Nguyen 	(*v)++;
13023da42859SDinh Nguyen }
13033da42859SDinh Nguyen 
13043da42859SDinh Nguyen static void rw_mgr_decr_vfifo(uint32_t grp, uint32_t *v)
13053da42859SDinh Nguyen {
13063da42859SDinh Nguyen 	uint32_t i;
13073da42859SDinh Nguyen 
13083da42859SDinh Nguyen 	for (i = 0; i < VFIFO_SIZE-1; i++)
13093da42859SDinh Nguyen 		rw_mgr_incr_vfifo(grp, v);
13103da42859SDinh Nguyen }
13113da42859SDinh Nguyen 
13123da42859SDinh Nguyen static int find_vfifo_read(uint32_t grp, uint32_t *bit_chk)
13133da42859SDinh Nguyen {
13143da42859SDinh Nguyen 	uint32_t  v;
13153da42859SDinh Nguyen 	uint32_t fail_cnt = 0;
13163da42859SDinh Nguyen 	uint32_t test_status;
13173da42859SDinh Nguyen 
13183da42859SDinh Nguyen 	for (v = 0; v < VFIFO_SIZE; ) {
13193da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: vfifo %u\n",
13203da42859SDinh Nguyen 			   __func__, __LINE__, v);
13213da42859SDinh Nguyen 		test_status = rw_mgr_mem_calibrate_read_test_all_ranks
13223da42859SDinh Nguyen 			(grp, 1, PASS_ONE_BIT, bit_chk, 0);
13233da42859SDinh Nguyen 		if (!test_status) {
13243da42859SDinh Nguyen 			fail_cnt++;
13253da42859SDinh Nguyen 
13263da42859SDinh Nguyen 			if (fail_cnt == 2)
13273da42859SDinh Nguyen 				break;
13283da42859SDinh Nguyen 		}
13293da42859SDinh Nguyen 
13303da42859SDinh Nguyen 		/* fiddle with FIFO */
13313da42859SDinh Nguyen 		rw_mgr_incr_vfifo(grp, &v);
13323da42859SDinh Nguyen 	}
13333da42859SDinh Nguyen 
13343da42859SDinh Nguyen 	if (v >= VFIFO_SIZE) {
13353da42859SDinh Nguyen 		/* no failing read found!! Something must have gone wrong */
13363da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: vfifo failed\n",
13373da42859SDinh Nguyen 			   __func__, __LINE__);
13383da42859SDinh Nguyen 		return 0;
13393da42859SDinh Nguyen 	} else {
13403da42859SDinh Nguyen 		return v;
13413da42859SDinh Nguyen 	}
13423da42859SDinh Nguyen }
13433da42859SDinh Nguyen 
13443da42859SDinh Nguyen static int find_working_phase(uint32_t *grp, uint32_t *bit_chk,
13453da42859SDinh Nguyen 			      uint32_t dtaps_per_ptap, uint32_t *work_bgn,
13463da42859SDinh Nguyen 			      uint32_t *v, uint32_t *d, uint32_t *p,
13473da42859SDinh Nguyen 			      uint32_t *i, uint32_t *max_working_cnt)
13483da42859SDinh Nguyen {
13493da42859SDinh Nguyen 	uint32_t found_begin = 0;
13503da42859SDinh Nguyen 	uint32_t tmp_delay = 0;
13513da42859SDinh Nguyen 	uint32_t test_status;
13523da42859SDinh Nguyen 
13533da42859SDinh Nguyen 	for (*d = 0; *d <= dtaps_per_ptap; (*d)++, tmp_delay +=
13543da42859SDinh Nguyen 		IO_DELAY_PER_DQS_EN_DCHAIN_TAP) {
13553da42859SDinh Nguyen 		*work_bgn = tmp_delay;
13563da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay_all_ranks(*grp, *d);
13573da42859SDinh Nguyen 
13583da42859SDinh Nguyen 		for (*i = 0; *i < VFIFO_SIZE; (*i)++) {
13593da42859SDinh Nguyen 			for (*p = 0; *p <= IO_DQS_EN_PHASE_MAX; (*p)++, *work_bgn +=
13603da42859SDinh Nguyen 				IO_DELAY_PER_OPA_TAP) {
13613da42859SDinh Nguyen 				scc_mgr_set_dqs_en_phase_all_ranks(*grp, *p);
13623da42859SDinh Nguyen 
13633da42859SDinh Nguyen 				test_status =
13643da42859SDinh Nguyen 				rw_mgr_mem_calibrate_read_test_all_ranks
13653da42859SDinh Nguyen 				(*grp, 1, PASS_ONE_BIT, bit_chk, 0);
13663da42859SDinh Nguyen 
13673da42859SDinh Nguyen 				if (test_status) {
13683da42859SDinh Nguyen 					*max_working_cnt = 1;
13693da42859SDinh Nguyen 					found_begin = 1;
13703da42859SDinh Nguyen 					break;
13713da42859SDinh Nguyen 				}
13723da42859SDinh Nguyen 			}
13733da42859SDinh Nguyen 
13743da42859SDinh Nguyen 			if (found_begin)
13753da42859SDinh Nguyen 				break;
13763da42859SDinh Nguyen 
13773da42859SDinh Nguyen 			if (*p > IO_DQS_EN_PHASE_MAX)
13783da42859SDinh Nguyen 				/* fiddle with FIFO */
13793da42859SDinh Nguyen 				rw_mgr_incr_vfifo(*grp, v);
13803da42859SDinh Nguyen 		}
13813da42859SDinh Nguyen 
13823da42859SDinh Nguyen 		if (found_begin)
13833da42859SDinh Nguyen 			break;
13843da42859SDinh Nguyen 	}
13853da42859SDinh Nguyen 
13863da42859SDinh Nguyen 	if (*i >= VFIFO_SIZE) {
13873da42859SDinh Nguyen 		/* cannot find working solution */
13883da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: no vfifo/\
13893da42859SDinh Nguyen 			   ptap/dtap\n", __func__, __LINE__);
13903da42859SDinh Nguyen 		return 0;
13913da42859SDinh Nguyen 	} else {
13923da42859SDinh Nguyen 		return 1;
13933da42859SDinh Nguyen 	}
13943da42859SDinh Nguyen }
13953da42859SDinh Nguyen 
13963da42859SDinh Nguyen static void sdr_backup_phase(uint32_t *grp, uint32_t *bit_chk,
13973da42859SDinh Nguyen 			     uint32_t *work_bgn, uint32_t *v, uint32_t *d,
13983da42859SDinh Nguyen 			     uint32_t *p, uint32_t *max_working_cnt)
13993da42859SDinh Nguyen {
14003da42859SDinh Nguyen 	uint32_t found_begin = 0;
14013da42859SDinh Nguyen 	uint32_t tmp_delay;
14023da42859SDinh Nguyen 
14033da42859SDinh Nguyen 	/* Special case code for backing up a phase */
14043da42859SDinh Nguyen 	if (*p == 0) {
14053da42859SDinh Nguyen 		*p = IO_DQS_EN_PHASE_MAX;
14063da42859SDinh Nguyen 		rw_mgr_decr_vfifo(*grp, v);
14073da42859SDinh Nguyen 	} else {
14083da42859SDinh Nguyen 		(*p)--;
14093da42859SDinh Nguyen 	}
14103da42859SDinh Nguyen 	tmp_delay = *work_bgn - IO_DELAY_PER_OPA_TAP;
14113da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(*grp, *p);
14123da42859SDinh Nguyen 
14133da42859SDinh Nguyen 	for (*d = 0; *d <= IO_DQS_EN_DELAY_MAX && tmp_delay < *work_bgn;
14143da42859SDinh Nguyen 		(*d)++, tmp_delay += IO_DELAY_PER_DQS_EN_DCHAIN_TAP) {
14153da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay_all_ranks(*grp, *d);
14163da42859SDinh Nguyen 
14173da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_read_test_all_ranks(*grp, 1,
14183da42859SDinh Nguyen 							     PASS_ONE_BIT,
14193da42859SDinh Nguyen 							     bit_chk, 0)) {
14203da42859SDinh Nguyen 			found_begin = 1;
14213da42859SDinh Nguyen 			*work_bgn = tmp_delay;
14223da42859SDinh Nguyen 			break;
14233da42859SDinh Nguyen 		}
14243da42859SDinh Nguyen 	}
14253da42859SDinh Nguyen 
14263da42859SDinh Nguyen 	/* We have found a working dtap before the ptap found above */
14273da42859SDinh Nguyen 	if (found_begin == 1)
14283da42859SDinh Nguyen 		(*max_working_cnt)++;
14293da42859SDinh Nguyen 
14303da42859SDinh Nguyen 	/*
14313da42859SDinh Nguyen 	 * Restore VFIFO to old state before we decremented it
14323da42859SDinh Nguyen 	 * (if needed).
14333da42859SDinh Nguyen 	 */
14343da42859SDinh Nguyen 	(*p)++;
14353da42859SDinh Nguyen 	if (*p > IO_DQS_EN_PHASE_MAX) {
14363da42859SDinh Nguyen 		*p = 0;
14373da42859SDinh Nguyen 		rw_mgr_incr_vfifo(*grp, v);
14383da42859SDinh Nguyen 	}
14393da42859SDinh Nguyen 
14403da42859SDinh Nguyen 	scc_mgr_set_dqs_en_delay_all_ranks(*grp, 0);
14413da42859SDinh Nguyen }
14423da42859SDinh Nguyen 
14433da42859SDinh Nguyen static int sdr_nonworking_phase(uint32_t *grp, uint32_t *bit_chk,
14443da42859SDinh Nguyen 			     uint32_t *work_bgn, uint32_t *v, uint32_t *d,
14453da42859SDinh Nguyen 			     uint32_t *p, uint32_t *i, uint32_t *max_working_cnt,
14463da42859SDinh Nguyen 			     uint32_t *work_end)
14473da42859SDinh Nguyen {
14483da42859SDinh Nguyen 	uint32_t found_end = 0;
14493da42859SDinh Nguyen 
14503da42859SDinh Nguyen 	(*p)++;
14513da42859SDinh Nguyen 	*work_end += IO_DELAY_PER_OPA_TAP;
14523da42859SDinh Nguyen 	if (*p > IO_DQS_EN_PHASE_MAX) {
14533da42859SDinh Nguyen 		/* fiddle with FIFO */
14543da42859SDinh Nguyen 		*p = 0;
14553da42859SDinh Nguyen 		rw_mgr_incr_vfifo(*grp, v);
14563da42859SDinh Nguyen 	}
14573da42859SDinh Nguyen 
14583da42859SDinh Nguyen 	for (; *i < VFIFO_SIZE + 1; (*i)++) {
14593da42859SDinh Nguyen 		for (; *p <= IO_DQS_EN_PHASE_MAX; (*p)++, *work_end
14603da42859SDinh Nguyen 			+= IO_DELAY_PER_OPA_TAP) {
14613da42859SDinh Nguyen 			scc_mgr_set_dqs_en_phase_all_ranks(*grp, *p);
14623da42859SDinh Nguyen 
14633da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_read_test_all_ranks
14643da42859SDinh Nguyen 				(*grp, 1, PASS_ONE_BIT, bit_chk, 0)) {
14653da42859SDinh Nguyen 				found_end = 1;
14663da42859SDinh Nguyen 				break;
14673da42859SDinh Nguyen 			} else {
14683da42859SDinh Nguyen 				(*max_working_cnt)++;
14693da42859SDinh Nguyen 			}
14703da42859SDinh Nguyen 		}
14713da42859SDinh Nguyen 
14723da42859SDinh Nguyen 		if (found_end)
14733da42859SDinh Nguyen 			break;
14743da42859SDinh Nguyen 
14753da42859SDinh Nguyen 		if (*p > IO_DQS_EN_PHASE_MAX) {
14763da42859SDinh Nguyen 			/* fiddle with FIFO */
14773da42859SDinh Nguyen 			rw_mgr_incr_vfifo(*grp, v);
14783da42859SDinh Nguyen 			*p = 0;
14793da42859SDinh Nguyen 		}
14803da42859SDinh Nguyen 	}
14813da42859SDinh Nguyen 
14823da42859SDinh Nguyen 	if (*i >= VFIFO_SIZE + 1) {
14833da42859SDinh Nguyen 		/* cannot see edge of failing read */
14843da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d sdr_nonworking_phase: end:\
14853da42859SDinh Nguyen 			   failed\n", __func__, __LINE__);
14863da42859SDinh Nguyen 		return 0;
14873da42859SDinh Nguyen 	} else {
14883da42859SDinh Nguyen 		return 1;
14893da42859SDinh Nguyen 	}
14903da42859SDinh Nguyen }
14913da42859SDinh Nguyen 
14923da42859SDinh Nguyen static int sdr_find_window_centre(uint32_t *grp, uint32_t *bit_chk,
14933da42859SDinh Nguyen 				  uint32_t *work_bgn, uint32_t *v, uint32_t *d,
14943da42859SDinh Nguyen 				  uint32_t *p, uint32_t *work_mid,
14953da42859SDinh Nguyen 				  uint32_t *work_end)
14963da42859SDinh Nguyen {
14973da42859SDinh Nguyen 	int i;
14983da42859SDinh Nguyen 	int tmp_delay = 0;
14993da42859SDinh Nguyen 
15003da42859SDinh Nguyen 	*work_mid = (*work_bgn + *work_end) / 2;
15013da42859SDinh Nguyen 
15023da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "work_bgn=%d work_end=%d work_mid=%d\n",
15033da42859SDinh Nguyen 		   *work_bgn, *work_end, *work_mid);
15043da42859SDinh Nguyen 	/* Get the middle delay to be less than a VFIFO delay */
15053da42859SDinh Nguyen 	for (*p = 0; *p <= IO_DQS_EN_PHASE_MAX;
15063da42859SDinh Nguyen 		(*p)++, tmp_delay += IO_DELAY_PER_OPA_TAP)
15073da42859SDinh Nguyen 		;
15083da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "vfifo ptap delay %d\n", tmp_delay);
15093da42859SDinh Nguyen 	while (*work_mid > tmp_delay)
15103da42859SDinh Nguyen 		*work_mid -= tmp_delay;
15113da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "new work_mid %d\n", *work_mid);
15123da42859SDinh Nguyen 
15133da42859SDinh Nguyen 	tmp_delay = 0;
15143da42859SDinh Nguyen 	for (*p = 0; *p <= IO_DQS_EN_PHASE_MAX && tmp_delay < *work_mid;
15153da42859SDinh Nguyen 		(*p)++, tmp_delay += IO_DELAY_PER_OPA_TAP)
15163da42859SDinh Nguyen 		;
15173da42859SDinh Nguyen 	tmp_delay -= IO_DELAY_PER_OPA_TAP;
15183da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "new p %d, tmp_delay=%d\n", (*p) - 1, tmp_delay);
15193da42859SDinh Nguyen 	for (*d = 0; *d <= IO_DQS_EN_DELAY_MAX && tmp_delay < *work_mid; (*d)++,
15203da42859SDinh Nguyen 		tmp_delay += IO_DELAY_PER_DQS_EN_DCHAIN_TAP)
15213da42859SDinh Nguyen 		;
15223da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "new d %d, tmp_delay=%d\n", *d, tmp_delay);
15233da42859SDinh Nguyen 
15243da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(*grp, (*p) - 1);
15253da42859SDinh Nguyen 	scc_mgr_set_dqs_en_delay_all_ranks(*grp, *d);
15263da42859SDinh Nguyen 
15273da42859SDinh Nguyen 	/*
15283da42859SDinh Nguyen 	 * push vfifo until we can successfully calibrate. We can do this
15293da42859SDinh Nguyen 	 * because the largest possible margin in 1 VFIFO cycle.
15303da42859SDinh Nguyen 	 */
15313da42859SDinh Nguyen 	for (i = 0; i < VFIFO_SIZE; i++) {
15323da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "find_dqs_en_phase: center: vfifo=%u\n",
15333da42859SDinh Nguyen 			   *v);
15343da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_read_test_all_ranks(*grp, 1,
15353da42859SDinh Nguyen 							     PASS_ONE_BIT,
15363da42859SDinh Nguyen 							     bit_chk, 0)) {
15373da42859SDinh Nguyen 			break;
15383da42859SDinh Nguyen 		}
15393da42859SDinh Nguyen 
15403da42859SDinh Nguyen 		/* fiddle with FIFO */
15413da42859SDinh Nguyen 		rw_mgr_incr_vfifo(*grp, v);
15423da42859SDinh Nguyen 	}
15433da42859SDinh Nguyen 
15443da42859SDinh Nguyen 	if (i >= VFIFO_SIZE) {
15453da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: center: \
15463da42859SDinh Nguyen 			   failed\n", __func__, __LINE__);
15473da42859SDinh Nguyen 		return 0;
15483da42859SDinh Nguyen 	} else {
15493da42859SDinh Nguyen 		return 1;
15503da42859SDinh Nguyen 	}
15513da42859SDinh Nguyen }
15523da42859SDinh Nguyen 
15533da42859SDinh Nguyen /* find a good dqs enable to use */
15543da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase(uint32_t grp)
15553da42859SDinh Nguyen {
15563da42859SDinh Nguyen 	uint32_t v, d, p, i;
15573da42859SDinh Nguyen 	uint32_t max_working_cnt;
15583da42859SDinh Nguyen 	uint32_t bit_chk;
15593da42859SDinh Nguyen 	uint32_t dtaps_per_ptap;
15603da42859SDinh Nguyen 	uint32_t work_bgn, work_mid, work_end;
15613da42859SDinh Nguyen 	uint32_t found_passing_read, found_failing_read, initial_failing_dtap;
15623da42859SDinh Nguyen 
15633da42859SDinh Nguyen 	debug("%s:%d %u\n", __func__, __LINE__, grp);
15643da42859SDinh Nguyen 
15653da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_VFIFO_CENTER);
15663da42859SDinh Nguyen 
15673da42859SDinh Nguyen 	scc_mgr_set_dqs_en_delay_all_ranks(grp, 0);
15683da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(grp, 0);
15693da42859SDinh Nguyen 
15703da42859SDinh Nguyen 	/* ************************************************************** */
15713da42859SDinh Nguyen 	/* * Step 0 : Determine number of delay taps for each phase tap * */
15723da42859SDinh Nguyen 	dtaps_per_ptap = IO_DELAY_PER_OPA_TAP/IO_DELAY_PER_DQS_EN_DCHAIN_TAP;
15733da42859SDinh Nguyen 
15743da42859SDinh Nguyen 	/* ********************************************************* */
15753da42859SDinh Nguyen 	/* * Step 1 : First push vfifo until we get a failing read * */
15763da42859SDinh Nguyen 	v = find_vfifo_read(grp, &bit_chk);
15773da42859SDinh Nguyen 
15783da42859SDinh Nguyen 	max_working_cnt = 0;
15793da42859SDinh Nguyen 
15803da42859SDinh Nguyen 	/* ******************************************************** */
15813da42859SDinh Nguyen 	/* * step 2: find first working phase, increment in ptaps * */
15823da42859SDinh Nguyen 	work_bgn = 0;
15833da42859SDinh Nguyen 	if (find_working_phase(&grp, &bit_chk, dtaps_per_ptap, &work_bgn, &v, &d,
15843da42859SDinh Nguyen 				&p, &i, &max_working_cnt) == 0)
15853da42859SDinh Nguyen 		return 0;
15863da42859SDinh Nguyen 
15873da42859SDinh Nguyen 	work_end = work_bgn;
15883da42859SDinh Nguyen 
15893da42859SDinh Nguyen 	/*
15903da42859SDinh Nguyen 	 * If d is 0 then the working window covers a phase tap and
15913da42859SDinh Nguyen 	 * we can follow the old procedure otherwise, we've found the beginning,
15923da42859SDinh Nguyen 	 * and we need to increment the dtaps until we find the end.
15933da42859SDinh Nguyen 	 */
15943da42859SDinh Nguyen 	if (d == 0) {
15953da42859SDinh Nguyen 		/* ********************************************************* */
15963da42859SDinh Nguyen 		/* * step 3a: if we have room, back off by one and
15973da42859SDinh Nguyen 		increment in dtaps * */
15983da42859SDinh Nguyen 
15993da42859SDinh Nguyen 		sdr_backup_phase(&grp, &bit_chk, &work_bgn, &v, &d, &p,
16003da42859SDinh Nguyen 				 &max_working_cnt);
16013da42859SDinh Nguyen 
16023da42859SDinh Nguyen 		/* ********************************************************* */
16033da42859SDinh Nguyen 		/* * step 4a: go forward from working phase to non working
16043da42859SDinh Nguyen 		phase, increment in ptaps * */
16053da42859SDinh Nguyen 		if (sdr_nonworking_phase(&grp, &bit_chk, &work_bgn, &v, &d, &p,
16063da42859SDinh Nguyen 					 &i, &max_working_cnt, &work_end) == 0)
16073da42859SDinh Nguyen 			return 0;
16083da42859SDinh Nguyen 
16093da42859SDinh Nguyen 		/* ********************************************************* */
16103da42859SDinh Nguyen 		/* * step 5a:  back off one from last, increment in dtaps  * */
16113da42859SDinh Nguyen 
16123da42859SDinh Nguyen 		/* Special case code for backing up a phase */
16133da42859SDinh Nguyen 		if (p == 0) {
16143da42859SDinh Nguyen 			p = IO_DQS_EN_PHASE_MAX;
16153da42859SDinh Nguyen 			rw_mgr_decr_vfifo(grp, &v);
16163da42859SDinh Nguyen 		} else {
16173da42859SDinh Nguyen 			p = p - 1;
16183da42859SDinh Nguyen 		}
16193da42859SDinh Nguyen 
16203da42859SDinh Nguyen 		work_end -= IO_DELAY_PER_OPA_TAP;
16213da42859SDinh Nguyen 		scc_mgr_set_dqs_en_phase_all_ranks(grp, p);
16223da42859SDinh Nguyen 
16233da42859SDinh Nguyen 		/* * The actual increment of dtaps is done outside of
16243da42859SDinh Nguyen 		the if/else loop to share code */
16253da42859SDinh Nguyen 		d = 0;
16263da42859SDinh Nguyen 
16273da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: v/p: \
16283da42859SDinh Nguyen 			   vfifo=%u ptap=%u\n", __func__, __LINE__,
16293da42859SDinh Nguyen 			   v, p);
16303da42859SDinh Nguyen 	} else {
16313da42859SDinh Nguyen 		/* ******************************************************* */
16323da42859SDinh Nguyen 		/* * step 3-5b:  Find the right edge of the window using
16333da42859SDinh Nguyen 		delay taps   * */
16343da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase:vfifo=%u \
16353da42859SDinh Nguyen 			   ptap=%u dtap=%u bgn=%u\n", __func__, __LINE__,
16363da42859SDinh Nguyen 			   v, p, d, work_bgn);
16373da42859SDinh Nguyen 
16383da42859SDinh Nguyen 		work_end = work_bgn;
16393da42859SDinh Nguyen 
16403da42859SDinh Nguyen 		/* * The actual increment of dtaps is done outside of the
16413da42859SDinh Nguyen 		if/else loop to share code */
16423da42859SDinh Nguyen 
16433da42859SDinh Nguyen 		/* Only here to counterbalance a subtract later on which is
16443da42859SDinh Nguyen 		not needed if this branch of the algorithm is taken */
16453da42859SDinh Nguyen 		max_working_cnt++;
16463da42859SDinh Nguyen 	}
16473da42859SDinh Nguyen 
16483da42859SDinh Nguyen 	/* The dtap increment to find the failing edge is done here */
16493da42859SDinh Nguyen 	for (; d <= IO_DQS_EN_DELAY_MAX; d++, work_end +=
16503da42859SDinh Nguyen 		IO_DELAY_PER_DQS_EN_DCHAIN_TAP) {
16513da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: \
16523da42859SDinh Nguyen 				   end-2: dtap=%u\n", __func__, __LINE__, d);
16533da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay_all_ranks(grp, d);
16543da42859SDinh Nguyen 
16553da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_read_test_all_ranks(grp, 1,
16563da42859SDinh Nguyen 								      PASS_ONE_BIT,
16573da42859SDinh Nguyen 								      &bit_chk, 0)) {
16583da42859SDinh Nguyen 				break;
16593da42859SDinh Nguyen 			}
16603da42859SDinh Nguyen 	}
16613da42859SDinh Nguyen 
16623da42859SDinh Nguyen 	/* Go back to working dtap */
16633da42859SDinh Nguyen 	if (d != 0)
16643da42859SDinh Nguyen 		work_end -= IO_DELAY_PER_DQS_EN_DCHAIN_TAP;
16653da42859SDinh Nguyen 
16663da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: v/p/d: vfifo=%u \
16673da42859SDinh Nguyen 		   ptap=%u dtap=%u end=%u\n", __func__, __LINE__,
16683da42859SDinh Nguyen 		   v, p, d-1, work_end);
16693da42859SDinh Nguyen 
16703da42859SDinh Nguyen 	if (work_end < work_bgn) {
16713da42859SDinh Nguyen 		/* nil range */
16723da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: end-2: \
16733da42859SDinh Nguyen 			   failed\n", __func__, __LINE__);
16743da42859SDinh Nguyen 		return 0;
16753da42859SDinh Nguyen 	}
16763da42859SDinh Nguyen 
16773da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: found range [%u,%u]\n",
16783da42859SDinh Nguyen 		   __func__, __LINE__, work_bgn, work_end);
16793da42859SDinh Nguyen 
16803da42859SDinh Nguyen 	/* *************************************************************** */
16813da42859SDinh Nguyen 	/*
16823da42859SDinh Nguyen 	 * * We need to calculate the number of dtaps that equal a ptap
16833da42859SDinh Nguyen 	 * * To do that we'll back up a ptap and re-find the edge of the
16843da42859SDinh Nguyen 	 * * window using dtaps
16853da42859SDinh Nguyen 	 */
16863da42859SDinh Nguyen 
16873da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: calculate dtaps_per_ptap \
16883da42859SDinh Nguyen 		   for tracking\n", __func__, __LINE__);
16893da42859SDinh Nguyen 
16903da42859SDinh Nguyen 	/* Special case code for backing up a phase */
16913da42859SDinh Nguyen 	if (p == 0) {
16923da42859SDinh Nguyen 		p = IO_DQS_EN_PHASE_MAX;
16933da42859SDinh Nguyen 		rw_mgr_decr_vfifo(grp, &v);
16943da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: backedup \
16953da42859SDinh Nguyen 			   cycle/phase: v=%u p=%u\n", __func__, __LINE__,
16963da42859SDinh Nguyen 			   v, p);
16973da42859SDinh Nguyen 	} else {
16983da42859SDinh Nguyen 		p = p - 1;
16993da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: backedup \
17003da42859SDinh Nguyen 			   phase only: v=%u p=%u", __func__, __LINE__,
17013da42859SDinh Nguyen 			   v, p);
17023da42859SDinh Nguyen 	}
17033da42859SDinh Nguyen 
17043da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(grp, p);
17053da42859SDinh Nguyen 
17063da42859SDinh Nguyen 	/*
17073da42859SDinh Nguyen 	 * Increase dtap until we first see a passing read (in case the
17083da42859SDinh Nguyen 	 * window is smaller than a ptap),
17093da42859SDinh Nguyen 	 * and then a failing read to mark the edge of the window again
17103da42859SDinh Nguyen 	 */
17113da42859SDinh Nguyen 
17123da42859SDinh Nguyen 	/* Find a passing read */
17133da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: find passing read\n",
17143da42859SDinh Nguyen 		   __func__, __LINE__);
17153da42859SDinh Nguyen 	found_passing_read = 0;
17163da42859SDinh Nguyen 	found_failing_read = 0;
17173da42859SDinh Nguyen 	initial_failing_dtap = d;
17183da42859SDinh Nguyen 	for (; d <= IO_DQS_EN_DELAY_MAX; d++) {
17193da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: testing \
17203da42859SDinh Nguyen 			   read d=%u\n", __func__, __LINE__, d);
17213da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay_all_ranks(grp, d);
17223da42859SDinh Nguyen 
17233da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_read_test_all_ranks(grp, 1,
17243da42859SDinh Nguyen 							     PASS_ONE_BIT,
17253da42859SDinh Nguyen 							     &bit_chk, 0)) {
17263da42859SDinh Nguyen 			found_passing_read = 1;
17273da42859SDinh Nguyen 			break;
17283da42859SDinh Nguyen 		}
17293da42859SDinh Nguyen 	}
17303da42859SDinh Nguyen 
17313da42859SDinh Nguyen 	if (found_passing_read) {
17323da42859SDinh Nguyen 		/* Find a failing read */
17333da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: find failing \
17343da42859SDinh Nguyen 			   read\n", __func__, __LINE__);
17353da42859SDinh Nguyen 		for (d = d + 1; d <= IO_DQS_EN_DELAY_MAX; d++) {
17363da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: \
17373da42859SDinh Nguyen 				   testing read d=%u\n", __func__, __LINE__, d);
17383da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay_all_ranks(grp, d);
17393da42859SDinh Nguyen 
17403da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_read_test_all_ranks
17413da42859SDinh Nguyen 				(grp, 1, PASS_ONE_BIT, &bit_chk, 0)) {
17423da42859SDinh Nguyen 				found_failing_read = 1;
17433da42859SDinh Nguyen 				break;
17443da42859SDinh Nguyen 			}
17453da42859SDinh Nguyen 		}
17463da42859SDinh Nguyen 	} else {
17473da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d find_dqs_en_phase: failed to \
17483da42859SDinh Nguyen 			   calculate dtaps", __func__, __LINE__);
17493da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "per ptap. Fall back on static value\n");
17503da42859SDinh Nguyen 	}
17513da42859SDinh Nguyen 
17523da42859SDinh Nguyen 	/*
17533da42859SDinh Nguyen 	 * The dynamically calculated dtaps_per_ptap is only valid if we
17543da42859SDinh Nguyen 	 * found a passing/failing read. If we didn't, it means d hit the max
17553da42859SDinh Nguyen 	 * (IO_DQS_EN_DELAY_MAX). Otherwise, dtaps_per_ptap retains its
17563da42859SDinh Nguyen 	 * statically calculated value.
17573da42859SDinh Nguyen 	 */
17583da42859SDinh Nguyen 	if (found_passing_read && found_failing_read)
17593da42859SDinh Nguyen 		dtaps_per_ptap = d - initial_failing_dtap;
17603da42859SDinh Nguyen 
17611273dd9eSMarek Vasut 	writel(dtaps_per_ptap, &sdr_reg_file->dtaps_per_ptap);
17623da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: dtaps_per_ptap=%u \
17633da42859SDinh Nguyen 		   - %u = %u",  __func__, __LINE__, d,
17643da42859SDinh Nguyen 		   initial_failing_dtap, dtaps_per_ptap);
17653da42859SDinh Nguyen 
17663da42859SDinh Nguyen 	/* ******************************************** */
17673da42859SDinh Nguyen 	/* * step 6:  Find the centre of the window   * */
17683da42859SDinh Nguyen 	if (sdr_find_window_centre(&grp, &bit_chk, &work_bgn, &v, &d, &p,
17693da42859SDinh Nguyen 				   &work_mid, &work_end) == 0)
17703da42859SDinh Nguyen 		return 0;
17713da42859SDinh Nguyen 
17723da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: center found: \
17733da42859SDinh Nguyen 		   vfifo=%u ptap=%u dtap=%u\n", __func__, __LINE__,
17743da42859SDinh Nguyen 		   v, p-1, d);
17753da42859SDinh Nguyen 	return 1;
17763da42859SDinh Nguyen }
17773da42859SDinh Nguyen 
17783da42859SDinh Nguyen /*
17793da42859SDinh Nguyen  * Try rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase across different
17803da42859SDinh Nguyen  * dq_in_delay values
17813da42859SDinh Nguyen  */
17823da42859SDinh Nguyen static uint32_t
17833da42859SDinh Nguyen rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase_sweep_dq_in_delay
17843da42859SDinh Nguyen (uint32_t write_group, uint32_t read_group, uint32_t test_bgn)
17853da42859SDinh Nguyen {
17863da42859SDinh Nguyen 	uint32_t found;
17873da42859SDinh Nguyen 	uint32_t i;
17883da42859SDinh Nguyen 	uint32_t p;
17893da42859SDinh Nguyen 	uint32_t d;
17903da42859SDinh Nguyen 	uint32_t r;
17913da42859SDinh Nguyen 
17923da42859SDinh Nguyen 	const uint32_t delay_step = IO_IO_IN_DELAY_MAX /
17933da42859SDinh Nguyen 		(RW_MGR_MEM_DQ_PER_READ_DQS-1);
17943da42859SDinh Nguyen 		/* we start at zero, so have one less dq to devide among */
17953da42859SDinh Nguyen 
17963da42859SDinh Nguyen 	debug("%s:%d (%u,%u,%u)", __func__, __LINE__, write_group, read_group,
17973da42859SDinh Nguyen 	      test_bgn);
17983da42859SDinh Nguyen 
17993da42859SDinh Nguyen 	/* try different dq_in_delays since the dq path is shorter than dqs */
18003da42859SDinh Nguyen 
18013da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
18023da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
18033da42859SDinh Nguyen 		for (i = 0, p = test_bgn, d = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS;
18043da42859SDinh Nguyen 			i++, p++, d += delay_step) {
18053da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d rw_mgr_mem_calibrate_\
18063da42859SDinh Nguyen 				   vfifo_find_dqs_", __func__, __LINE__);
18073da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "en_phase_sweep_dq_in_delay: g=%u/%u ",
18083da42859SDinh Nguyen 			       write_group, read_group);
18093da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "r=%u, i=%u p=%u d=%u\n", r, i , p, d);
181007aee5bdSMarek Vasut 			scc_mgr_set_dq_in_delay(p, d);
18113da42859SDinh Nguyen 			scc_mgr_load_dq(p);
18123da42859SDinh Nguyen 		}
18131273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
18143da42859SDinh Nguyen 	}
18153da42859SDinh Nguyen 
18163da42859SDinh Nguyen 	found = rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase(read_group);
18173da42859SDinh Nguyen 
18183da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d rw_mgr_mem_calibrate_vfifo_find_dqs_\
18193da42859SDinh Nguyen 		   en_phase_sweep_dq", __func__, __LINE__);
18203da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "_in_delay: g=%u/%u found=%u; Reseting delay \
18213da42859SDinh Nguyen 		   chain to zero\n", write_group, read_group, found);
18223da42859SDinh Nguyen 
18233da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
18243da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
18253da42859SDinh Nguyen 		for (i = 0, p = test_bgn; i < RW_MGR_MEM_DQ_PER_READ_DQS;
18263da42859SDinh Nguyen 			i++, p++) {
182707aee5bdSMarek Vasut 			scc_mgr_set_dq_in_delay(p, 0);
18283da42859SDinh Nguyen 			scc_mgr_load_dq(p);
18293da42859SDinh Nguyen 		}
18301273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
18313da42859SDinh Nguyen 	}
18323da42859SDinh Nguyen 
18333da42859SDinh Nguyen 	return found;
18343da42859SDinh Nguyen }
18353da42859SDinh Nguyen 
18363da42859SDinh Nguyen /* per-bit deskew DQ and center */
18373da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo_center(uint32_t rank_bgn,
18383da42859SDinh Nguyen 	uint32_t write_group, uint32_t read_group, uint32_t test_bgn,
18393da42859SDinh Nguyen 	uint32_t use_read_test, uint32_t update_fom)
18403da42859SDinh Nguyen {
18413da42859SDinh Nguyen 	uint32_t i, p, d, min_index;
18423da42859SDinh Nguyen 	/*
18433da42859SDinh Nguyen 	 * Store these as signed since there are comparisons with
18443da42859SDinh Nguyen 	 * signed numbers.
18453da42859SDinh Nguyen 	 */
18463da42859SDinh Nguyen 	uint32_t bit_chk;
18473da42859SDinh Nguyen 	uint32_t sticky_bit_chk;
18483da42859SDinh Nguyen 	int32_t left_edge[RW_MGR_MEM_DQ_PER_READ_DQS];
18493da42859SDinh Nguyen 	int32_t right_edge[RW_MGR_MEM_DQ_PER_READ_DQS];
18503da42859SDinh Nguyen 	int32_t final_dq[RW_MGR_MEM_DQ_PER_READ_DQS];
18513da42859SDinh Nguyen 	int32_t mid;
18523da42859SDinh Nguyen 	int32_t orig_mid_min, mid_min;
18533da42859SDinh Nguyen 	int32_t new_dqs, start_dqs, start_dqs_en, shift_dq, final_dqs,
18543da42859SDinh Nguyen 		final_dqs_en;
18553da42859SDinh Nguyen 	int32_t dq_margin, dqs_margin;
18563da42859SDinh Nguyen 	uint32_t stop;
18573da42859SDinh Nguyen 	uint32_t temp_dq_in_delay1, temp_dq_in_delay2;
18583da42859SDinh Nguyen 	uint32_t addr;
18593da42859SDinh Nguyen 
18603da42859SDinh Nguyen 	debug("%s:%d: %u %u", __func__, __LINE__, read_group, test_bgn);
18613da42859SDinh Nguyen 
1862c4815f76SMarek Vasut 	addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQS_IN_DELAY_OFFSET;
186317fdc916SMarek Vasut 	start_dqs = readl(addr + (read_group << 2));
18643da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS)
186517fdc916SMarek Vasut 		start_dqs_en = readl(addr + ((read_group << 2)
18663da42859SDinh Nguyen 				     - IO_DQS_EN_DELAY_OFFSET));
18673da42859SDinh Nguyen 
18683da42859SDinh Nguyen 	/* set the left and right edge of each bit to an illegal value */
18693da42859SDinh Nguyen 	/* use (IO_IO_IN_DELAY_MAX + 1) as an illegal value */
18703da42859SDinh Nguyen 	sticky_bit_chk = 0;
18713da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
18723da42859SDinh Nguyen 		left_edge[i]  = IO_IO_IN_DELAY_MAX + 1;
18733da42859SDinh Nguyen 		right_edge[i] = IO_IO_IN_DELAY_MAX + 1;
18743da42859SDinh Nguyen 	}
18753da42859SDinh Nguyen 
18763da42859SDinh Nguyen 	/* Search for the left edge of the window for each bit */
18773da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_IN_DELAY_MAX; d++) {
18783da42859SDinh Nguyen 		scc_mgr_apply_group_dq_in_delay(write_group, test_bgn, d);
18793da42859SDinh Nguyen 
18801273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
18813da42859SDinh Nguyen 
18823da42859SDinh Nguyen 		/*
18833da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
18843da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
18853da42859SDinh Nguyen 		 */
18863da42859SDinh Nguyen 		if (use_read_test) {
18873da42859SDinh Nguyen 			stop = !rw_mgr_mem_calibrate_read_test(rank_bgn,
18883da42859SDinh Nguyen 				read_group, NUM_READ_PB_TESTS, PASS_ONE_BIT,
18893da42859SDinh Nguyen 				&bit_chk, 0, 0);
18903da42859SDinh Nguyen 		} else {
18913da42859SDinh Nguyen 			rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
18923da42859SDinh Nguyen 							0, PASS_ONE_BIT,
18933da42859SDinh Nguyen 							&bit_chk, 0);
18943da42859SDinh Nguyen 			bit_chk = bit_chk >> (RW_MGR_MEM_DQ_PER_READ_DQS *
18953da42859SDinh Nguyen 				(read_group - (write_group *
18963da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
18973da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH)));
18983da42859SDinh Nguyen 			stop = (bit_chk == 0);
18993da42859SDinh Nguyen 		}
19003da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
19013da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->read_correct_mask);
19023da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center(left): dtap=%u => %u == %u \
19033da42859SDinh Nguyen 			   && %u", __func__, __LINE__, d,
19043da42859SDinh Nguyen 			   sticky_bit_chk,
19053da42859SDinh Nguyen 			param->read_correct_mask, stop);
19063da42859SDinh Nguyen 
19073da42859SDinh Nguyen 		if (stop == 1) {
19083da42859SDinh Nguyen 			break;
19093da42859SDinh Nguyen 		} else {
19103da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
19113da42859SDinh Nguyen 				if (bit_chk & 1) {
19123da42859SDinh Nguyen 					/* Remember a passing test as the
19133da42859SDinh Nguyen 					left_edge */
19143da42859SDinh Nguyen 					left_edge[i] = d;
19153da42859SDinh Nguyen 				} else {
19163da42859SDinh Nguyen 					/* If a left edge has not been seen yet,
19173da42859SDinh Nguyen 					then a future passing test will mark
19183da42859SDinh Nguyen 					this edge as the right edge */
19193da42859SDinh Nguyen 					if (left_edge[i] ==
19203da42859SDinh Nguyen 						IO_IO_IN_DELAY_MAX + 1) {
19213da42859SDinh Nguyen 						right_edge[i] = -(d + 1);
19223da42859SDinh Nguyen 					}
19233da42859SDinh Nguyen 				}
19243da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
19253da42859SDinh Nguyen 			}
19263da42859SDinh Nguyen 		}
19273da42859SDinh Nguyen 	}
19283da42859SDinh Nguyen 
19293da42859SDinh Nguyen 	/* Reset DQ delay chains to 0 */
19303da42859SDinh Nguyen 	scc_mgr_apply_group_dq_in_delay(write_group, test_bgn, 0);
19313da42859SDinh Nguyen 	sticky_bit_chk = 0;
19323da42859SDinh Nguyen 	for (i = RW_MGR_MEM_DQ_PER_READ_DQS - 1;; i--) {
19333da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center: left_edge[%u]: \
19343da42859SDinh Nguyen 			   %d right_edge[%u]: %d\n", __func__, __LINE__,
19353da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
19363da42859SDinh Nguyen 
19373da42859SDinh Nguyen 		/*
19383da42859SDinh Nguyen 		 * Check for cases where we haven't found the left edge,
19393da42859SDinh Nguyen 		 * which makes our assignment of the the right edge invalid.
19403da42859SDinh Nguyen 		 * Reset it to the illegal value.
19413da42859SDinh Nguyen 		 */
19423da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_IN_DELAY_MAX + 1) && (
19433da42859SDinh Nguyen 			right_edge[i] != IO_IO_IN_DELAY_MAX + 1)) {
19443da42859SDinh Nguyen 			right_edge[i] = IO_IO_IN_DELAY_MAX + 1;
19453da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d vfifo_center: reset \
19463da42859SDinh Nguyen 				   right_edge[%u]: %d\n", __func__, __LINE__,
19473da42859SDinh Nguyen 				   i, right_edge[i]);
19483da42859SDinh Nguyen 		}
19493da42859SDinh Nguyen 
19503da42859SDinh Nguyen 		/*
19513da42859SDinh Nguyen 		 * Reset sticky bit (except for bits where we have seen
19523da42859SDinh Nguyen 		 * both the left and right edge).
19533da42859SDinh Nguyen 		 */
19543da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk << 1;
19553da42859SDinh Nguyen 		if ((left_edge[i] != IO_IO_IN_DELAY_MAX + 1) &&
19563da42859SDinh Nguyen 		    (right_edge[i] != IO_IO_IN_DELAY_MAX + 1)) {
19573da42859SDinh Nguyen 			sticky_bit_chk = sticky_bit_chk | 1;
19583da42859SDinh Nguyen 		}
19593da42859SDinh Nguyen 
19603da42859SDinh Nguyen 		if (i == 0)
19613da42859SDinh Nguyen 			break;
19623da42859SDinh Nguyen 	}
19633da42859SDinh Nguyen 
19643da42859SDinh Nguyen 	/* Search for the right edge of the window for each bit */
19653da42859SDinh Nguyen 	for (d = 0; d <= IO_DQS_IN_DELAY_MAX - start_dqs; d++) {
19663da42859SDinh Nguyen 		scc_mgr_set_dqs_bus_in_delay(read_group, d + start_dqs);
19673da42859SDinh Nguyen 		if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
19683da42859SDinh Nguyen 			uint32_t delay = d + start_dqs_en;
19693da42859SDinh Nguyen 			if (delay > IO_DQS_EN_DELAY_MAX)
19703da42859SDinh Nguyen 				delay = IO_DQS_EN_DELAY_MAX;
19713da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay(read_group, delay);
19723da42859SDinh Nguyen 		}
19733da42859SDinh Nguyen 		scc_mgr_load_dqs(read_group);
19743da42859SDinh Nguyen 
19751273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
19763da42859SDinh Nguyen 
19773da42859SDinh Nguyen 		/*
19783da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
19793da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
19803da42859SDinh Nguyen 		 */
19813da42859SDinh Nguyen 		if (use_read_test) {
19823da42859SDinh Nguyen 			stop = !rw_mgr_mem_calibrate_read_test(rank_bgn,
19833da42859SDinh Nguyen 				read_group, NUM_READ_PB_TESTS, PASS_ONE_BIT,
19843da42859SDinh Nguyen 				&bit_chk, 0, 0);
19853da42859SDinh Nguyen 		} else {
19863da42859SDinh Nguyen 			rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
19873da42859SDinh Nguyen 							0, PASS_ONE_BIT,
19883da42859SDinh Nguyen 							&bit_chk, 0);
19893da42859SDinh Nguyen 			bit_chk = bit_chk >> (RW_MGR_MEM_DQ_PER_READ_DQS *
19903da42859SDinh Nguyen 				(read_group - (write_group *
19913da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
19923da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH)));
19933da42859SDinh Nguyen 			stop = (bit_chk == 0);
19943da42859SDinh Nguyen 		}
19953da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
19963da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->read_correct_mask);
19973da42859SDinh Nguyen 
19983da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center(right): dtap=%u => %u == \
19993da42859SDinh Nguyen 			   %u && %u", __func__, __LINE__, d,
20003da42859SDinh Nguyen 			   sticky_bit_chk, param->read_correct_mask, stop);
20013da42859SDinh Nguyen 
20023da42859SDinh Nguyen 		if (stop == 1) {
20033da42859SDinh Nguyen 			break;
20043da42859SDinh Nguyen 		} else {
20053da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
20063da42859SDinh Nguyen 				if (bit_chk & 1) {
20073da42859SDinh Nguyen 					/* Remember a passing test as
20083da42859SDinh Nguyen 					the right_edge */
20093da42859SDinh Nguyen 					right_edge[i] = d;
20103da42859SDinh Nguyen 				} else {
20113da42859SDinh Nguyen 					if (d != 0) {
20123da42859SDinh Nguyen 						/* If a right edge has not been
20133da42859SDinh Nguyen 						seen yet, then a future passing
20143da42859SDinh Nguyen 						test will mark this edge as the
20153da42859SDinh Nguyen 						left edge */
20163da42859SDinh Nguyen 						if (right_edge[i] ==
20173da42859SDinh Nguyen 						IO_IO_IN_DELAY_MAX + 1) {
20183da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
20193da42859SDinh Nguyen 						}
20203da42859SDinh Nguyen 					} else {
20213da42859SDinh Nguyen 						/* d = 0 failed, but it passed
20223da42859SDinh Nguyen 						when testing the left edge,
20233da42859SDinh Nguyen 						so it must be marginal,
20243da42859SDinh Nguyen 						set it to -1 */
20253da42859SDinh Nguyen 						if (right_edge[i] ==
20263da42859SDinh Nguyen 							IO_IO_IN_DELAY_MAX + 1 &&
20273da42859SDinh Nguyen 							left_edge[i] !=
20283da42859SDinh Nguyen 							IO_IO_IN_DELAY_MAX
20293da42859SDinh Nguyen 							+ 1) {
20303da42859SDinh Nguyen 							right_edge[i] = -1;
20313da42859SDinh Nguyen 						}
20323da42859SDinh Nguyen 						/* If a right edge has not been
20333da42859SDinh Nguyen 						seen yet, then a future passing
20343da42859SDinh Nguyen 						test will mark this edge as the
20353da42859SDinh Nguyen 						left edge */
20363da42859SDinh Nguyen 						else if (right_edge[i] ==
20373da42859SDinh Nguyen 							IO_IO_IN_DELAY_MAX +
20383da42859SDinh Nguyen 							1) {
20393da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
20403da42859SDinh Nguyen 						}
20413da42859SDinh Nguyen 					}
20423da42859SDinh Nguyen 				}
20433da42859SDinh Nguyen 
20443da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "%s:%d vfifo_center[r,\
20453da42859SDinh Nguyen 					   d=%u]: ", __func__, __LINE__, d);
20463da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "bit_chk_test=%d left_edge[%u]: %d ",
20473da42859SDinh Nguyen 					   (int)(bit_chk & 1), i, left_edge[i]);
20483da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "right_edge[%u]: %d\n", i,
20493da42859SDinh Nguyen 					   right_edge[i]);
20503da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
20513da42859SDinh Nguyen 			}
20523da42859SDinh Nguyen 		}
20533da42859SDinh Nguyen 	}
20543da42859SDinh Nguyen 
20553da42859SDinh Nguyen 	/* Check that all bits have a window */
20563da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
20573da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center: left_edge[%u]: \
20583da42859SDinh Nguyen 			   %d right_edge[%u]: %d", __func__, __LINE__,
20593da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
20603da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_IN_DELAY_MAX + 1) || (right_edge[i]
20613da42859SDinh Nguyen 			== IO_IO_IN_DELAY_MAX + 1)) {
20623da42859SDinh Nguyen 			/*
20633da42859SDinh Nguyen 			 * Restore delay chain settings before letting the loop
20643da42859SDinh Nguyen 			 * in rw_mgr_mem_calibrate_vfifo to retry different
20653da42859SDinh Nguyen 			 * dqs/ck relationships.
20663da42859SDinh Nguyen 			 */
20673da42859SDinh Nguyen 			scc_mgr_set_dqs_bus_in_delay(read_group, start_dqs);
20683da42859SDinh Nguyen 			if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
20693da42859SDinh Nguyen 				scc_mgr_set_dqs_en_delay(read_group,
20703da42859SDinh Nguyen 							 start_dqs_en);
20713da42859SDinh Nguyen 			}
20723da42859SDinh Nguyen 			scc_mgr_load_dqs(read_group);
20731273dd9eSMarek Vasut 			writel(0, &sdr_scc_mgr->update);
20743da42859SDinh Nguyen 
20753da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d vfifo_center: failed to \
20763da42859SDinh Nguyen 				   find edge [%u]: %d %d", __func__, __LINE__,
20773da42859SDinh Nguyen 				   i, left_edge[i], right_edge[i]);
20783da42859SDinh Nguyen 			if (use_read_test) {
20793da42859SDinh Nguyen 				set_failing_group_stage(read_group *
20803da42859SDinh Nguyen 					RW_MGR_MEM_DQ_PER_READ_DQS + i,
20813da42859SDinh Nguyen 					CAL_STAGE_VFIFO,
20823da42859SDinh Nguyen 					CAL_SUBSTAGE_VFIFO_CENTER);
20833da42859SDinh Nguyen 			} else {
20843da42859SDinh Nguyen 				set_failing_group_stage(read_group *
20853da42859SDinh Nguyen 					RW_MGR_MEM_DQ_PER_READ_DQS + i,
20863da42859SDinh Nguyen 					CAL_STAGE_VFIFO_AFTER_WRITES,
20873da42859SDinh Nguyen 					CAL_SUBSTAGE_VFIFO_CENTER);
20883da42859SDinh Nguyen 			}
20893da42859SDinh Nguyen 			return 0;
20903da42859SDinh Nguyen 		}
20913da42859SDinh Nguyen 	}
20923da42859SDinh Nguyen 
20933da42859SDinh Nguyen 	/* Find middle of window for each DQ bit */
20943da42859SDinh Nguyen 	mid_min = left_edge[0] - right_edge[0];
20953da42859SDinh Nguyen 	min_index = 0;
20963da42859SDinh Nguyen 	for (i = 1; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
20973da42859SDinh Nguyen 		mid = left_edge[i] - right_edge[i];
20983da42859SDinh Nguyen 		if (mid < mid_min) {
20993da42859SDinh Nguyen 			mid_min = mid;
21003da42859SDinh Nguyen 			min_index = i;
21013da42859SDinh Nguyen 		}
21023da42859SDinh Nguyen 	}
21033da42859SDinh Nguyen 
21043da42859SDinh Nguyen 	/*
21053da42859SDinh Nguyen 	 * -mid_min/2 represents the amount that we need to move DQS.
21063da42859SDinh Nguyen 	 * If mid_min is odd and positive we'll need to add one to
21073da42859SDinh Nguyen 	 * make sure the rounding in further calculations is correct
21083da42859SDinh Nguyen 	 * (always bias to the right), so just add 1 for all positive values.
21093da42859SDinh Nguyen 	 */
21103da42859SDinh Nguyen 	if (mid_min > 0)
21113da42859SDinh Nguyen 		mid_min++;
21123da42859SDinh Nguyen 
21133da42859SDinh Nguyen 	mid_min = mid_min / 2;
21143da42859SDinh Nguyen 
21153da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d vfifo_center: mid_min=%d (index=%u)\n",
21163da42859SDinh Nguyen 		   __func__, __LINE__, mid_min, min_index);
21173da42859SDinh Nguyen 
21183da42859SDinh Nguyen 	/* Determine the amount we can change DQS (which is -mid_min) */
21193da42859SDinh Nguyen 	orig_mid_min = mid_min;
21203da42859SDinh Nguyen 	new_dqs = start_dqs - mid_min;
21213da42859SDinh Nguyen 	if (new_dqs > IO_DQS_IN_DELAY_MAX)
21223da42859SDinh Nguyen 		new_dqs = IO_DQS_IN_DELAY_MAX;
21233da42859SDinh Nguyen 	else if (new_dqs < 0)
21243da42859SDinh Nguyen 		new_dqs = 0;
21253da42859SDinh Nguyen 
21263da42859SDinh Nguyen 	mid_min = start_dqs - new_dqs;
21273da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "vfifo_center: new mid_min=%d new_dqs=%d\n",
21283da42859SDinh Nguyen 		   mid_min, new_dqs);
21293da42859SDinh Nguyen 
21303da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
21313da42859SDinh Nguyen 		if (start_dqs_en - mid_min > IO_DQS_EN_DELAY_MAX)
21323da42859SDinh Nguyen 			mid_min += start_dqs_en - mid_min - IO_DQS_EN_DELAY_MAX;
21333da42859SDinh Nguyen 		else if (start_dqs_en - mid_min < 0)
21343da42859SDinh Nguyen 			mid_min += start_dqs_en - mid_min;
21353da42859SDinh Nguyen 	}
21363da42859SDinh Nguyen 	new_dqs = start_dqs - mid_min;
21373da42859SDinh Nguyen 
21383da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "vfifo_center: start_dqs=%d start_dqs_en=%d \
21393da42859SDinh Nguyen 		   new_dqs=%d mid_min=%d\n", start_dqs,
21403da42859SDinh Nguyen 		   IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS ? start_dqs_en : -1,
21413da42859SDinh Nguyen 		   new_dqs, mid_min);
21423da42859SDinh Nguyen 
21433da42859SDinh Nguyen 	/* Initialize data for export structures */
21443da42859SDinh Nguyen 	dqs_margin = IO_IO_IN_DELAY_MAX + 1;
21453da42859SDinh Nguyen 	dq_margin  = IO_IO_IN_DELAY_MAX + 1;
21463da42859SDinh Nguyen 
21473da42859SDinh Nguyen 	/* add delay to bring centre of all DQ windows to the same "level" */
21483da42859SDinh Nguyen 	for (i = 0, p = test_bgn; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++, p++) {
21493da42859SDinh Nguyen 		/* Use values before divide by 2 to reduce round off error */
21503da42859SDinh Nguyen 		shift_dq = (left_edge[i] - right_edge[i] -
21513da42859SDinh Nguyen 			(left_edge[min_index] - right_edge[min_index]))/2  +
21523da42859SDinh Nguyen 			(orig_mid_min - mid_min);
21533da42859SDinh Nguyen 
21543da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "vfifo_center: before: \
21553da42859SDinh Nguyen 			   shift_dq[%u]=%d\n", i, shift_dq);
21563da42859SDinh Nguyen 
21571273dd9eSMarek Vasut 		addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_IN_DELAY_OFFSET;
215817fdc916SMarek Vasut 		temp_dq_in_delay1 = readl(addr + (p << 2));
215917fdc916SMarek Vasut 		temp_dq_in_delay2 = readl(addr + (i << 2));
21603da42859SDinh Nguyen 
21613da42859SDinh Nguyen 		if (shift_dq + (int32_t)temp_dq_in_delay1 >
21623da42859SDinh Nguyen 			(int32_t)IO_IO_IN_DELAY_MAX) {
21633da42859SDinh Nguyen 			shift_dq = (int32_t)IO_IO_IN_DELAY_MAX - temp_dq_in_delay2;
21643da42859SDinh Nguyen 		} else if (shift_dq + (int32_t)temp_dq_in_delay1 < 0) {
21653da42859SDinh Nguyen 			shift_dq = -(int32_t)temp_dq_in_delay1;
21663da42859SDinh Nguyen 		}
21673da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "vfifo_center: after: \
21683da42859SDinh Nguyen 			   shift_dq[%u]=%d\n", i, shift_dq);
21693da42859SDinh Nguyen 		final_dq[i] = temp_dq_in_delay1 + shift_dq;
217007aee5bdSMarek Vasut 		scc_mgr_set_dq_in_delay(p, final_dq[i]);
21713da42859SDinh Nguyen 		scc_mgr_load_dq(p);
21723da42859SDinh Nguyen 
21733da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "vfifo_center: margin[%u]=[%d,%d]\n", i,
21743da42859SDinh Nguyen 			   left_edge[i] - shift_dq + (-mid_min),
21753da42859SDinh Nguyen 			   right_edge[i] + shift_dq - (-mid_min));
21763da42859SDinh Nguyen 		/* To determine values for export structures */
21773da42859SDinh Nguyen 		if (left_edge[i] - shift_dq + (-mid_min) < dq_margin)
21783da42859SDinh Nguyen 			dq_margin = left_edge[i] - shift_dq + (-mid_min);
21793da42859SDinh Nguyen 
21803da42859SDinh Nguyen 		if (right_edge[i] + shift_dq - (-mid_min) < dqs_margin)
21813da42859SDinh Nguyen 			dqs_margin = right_edge[i] + shift_dq - (-mid_min);
21823da42859SDinh Nguyen 	}
21833da42859SDinh Nguyen 
21843da42859SDinh Nguyen 	final_dqs = new_dqs;
21853da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS)
21863da42859SDinh Nguyen 		final_dqs_en = start_dqs_en - mid_min;
21873da42859SDinh Nguyen 
21883da42859SDinh Nguyen 	/* Move DQS-en */
21893da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
21903da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay(read_group, final_dqs_en);
21913da42859SDinh Nguyen 		scc_mgr_load_dqs(read_group);
21923da42859SDinh Nguyen 	}
21933da42859SDinh Nguyen 
21943da42859SDinh Nguyen 	/* Move DQS */
21953da42859SDinh Nguyen 	scc_mgr_set_dqs_bus_in_delay(read_group, final_dqs);
21963da42859SDinh Nguyen 	scc_mgr_load_dqs(read_group);
21973da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d vfifo_center: dq_margin=%d \
21983da42859SDinh Nguyen 		   dqs_margin=%d", __func__, __LINE__,
21993da42859SDinh Nguyen 		   dq_margin, dqs_margin);
22003da42859SDinh Nguyen 
22013da42859SDinh Nguyen 	/*
22023da42859SDinh Nguyen 	 * Do not remove this line as it makes sure all of our decisions
22033da42859SDinh Nguyen 	 * have been applied. Apply the update bit.
22043da42859SDinh Nguyen 	 */
22051273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
22063da42859SDinh Nguyen 
22073da42859SDinh Nguyen 	return (dq_margin >= 0) && (dqs_margin >= 0);
22083da42859SDinh Nguyen }
22093da42859SDinh Nguyen 
22103da42859SDinh Nguyen /*
22113da42859SDinh Nguyen  * calibrate the read valid prediction FIFO.
22123da42859SDinh Nguyen  *
22133da42859SDinh Nguyen  *  - read valid prediction will consist of finding a good DQS enable phase,
22143da42859SDinh Nguyen  * DQS enable delay, DQS input phase, and DQS input delay.
22153da42859SDinh Nguyen  *  - we also do a per-bit deskew on the DQ lines.
22163da42859SDinh Nguyen  */
22173da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo(uint32_t read_group,
22183da42859SDinh Nguyen 					   uint32_t test_bgn)
22193da42859SDinh Nguyen {
22203da42859SDinh Nguyen 	uint32_t p, d, rank_bgn, sr;
22213da42859SDinh Nguyen 	uint32_t dtaps_per_ptap;
22223da42859SDinh Nguyen 	uint32_t tmp_delay;
22233da42859SDinh Nguyen 	uint32_t bit_chk;
22243da42859SDinh Nguyen 	uint32_t grp_calibrated;
22253da42859SDinh Nguyen 	uint32_t write_group, write_test_bgn;
22263da42859SDinh Nguyen 	uint32_t failed_substage;
22273da42859SDinh Nguyen 
22287ac40d25SMarek Vasut 	debug("%s:%d: %u %u\n", __func__, __LINE__, read_group, test_bgn);
22293da42859SDinh Nguyen 
22303da42859SDinh Nguyen 	/* update info for sims */
22313da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_VFIFO);
22323da42859SDinh Nguyen 
22333da42859SDinh Nguyen 	write_group = read_group;
22343da42859SDinh Nguyen 	write_test_bgn = test_bgn;
22353da42859SDinh Nguyen 
22363da42859SDinh Nguyen 	/* USER Determine number of delay taps for each phase tap */
22373da42859SDinh Nguyen 	dtaps_per_ptap = 0;
22383da42859SDinh Nguyen 	tmp_delay = 0;
22393da42859SDinh Nguyen 	while (tmp_delay < IO_DELAY_PER_OPA_TAP) {
22403da42859SDinh Nguyen 		dtaps_per_ptap++;
22413da42859SDinh Nguyen 		tmp_delay += IO_DELAY_PER_DQS_EN_DCHAIN_TAP;
22423da42859SDinh Nguyen 	}
22433da42859SDinh Nguyen 	dtaps_per_ptap--;
22443da42859SDinh Nguyen 	tmp_delay = 0;
22453da42859SDinh Nguyen 
22463da42859SDinh Nguyen 	/* update info for sims */
22473da42859SDinh Nguyen 	reg_file_set_group(read_group);
22483da42859SDinh Nguyen 
22493da42859SDinh Nguyen 	grp_calibrated = 0;
22503da42859SDinh Nguyen 
22513da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_GUARANTEED_READ);
22523da42859SDinh Nguyen 	failed_substage = CAL_SUBSTAGE_GUARANTEED_READ;
22533da42859SDinh Nguyen 
22543da42859SDinh Nguyen 	for (d = 0; d <= dtaps_per_ptap && grp_calibrated == 0; d += 2) {
22553da42859SDinh Nguyen 		/*
22563da42859SDinh Nguyen 		 * In RLDRAMX we may be messing the delay of pins in
22573da42859SDinh Nguyen 		 * the same write group but outside of the current read
22583da42859SDinh Nguyen 		 * the group, but that's ok because we haven't
22593da42859SDinh Nguyen 		 * calibrated output side yet.
22603da42859SDinh Nguyen 		 */
22613da42859SDinh Nguyen 		if (d > 0) {
22623da42859SDinh Nguyen 			scc_mgr_apply_group_all_out_delay_add_all_ranks
22633da42859SDinh Nguyen 			(write_group, write_test_bgn, d);
22643da42859SDinh Nguyen 		}
22653da42859SDinh Nguyen 
22663da42859SDinh Nguyen 		for (p = 0; p <= IO_DQDQS_OUT_PHASE_MAX && grp_calibrated == 0;
22673da42859SDinh Nguyen 			p++) {
22683da42859SDinh Nguyen 			/* set a particular dqdqs phase */
22693da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase_all_ranks(read_group, p);
22703da42859SDinh Nguyen 
22713da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d calibrate_vfifo: g=%u \
22723da42859SDinh Nguyen 				   p=%u d=%u\n", __func__, __LINE__,
22733da42859SDinh Nguyen 				   read_group, p, d);
22743da42859SDinh Nguyen 
22753da42859SDinh Nguyen 			/*
22763da42859SDinh Nguyen 			 * Load up the patterns used by read calibration
22773da42859SDinh Nguyen 			 * using current DQDQS phase.
22783da42859SDinh Nguyen 			 */
22793da42859SDinh Nguyen 			rw_mgr_mem_calibrate_read_load_patterns(0, 1);
22803da42859SDinh Nguyen 			if (!(gbl->phy_debug_mode_flags &
22813da42859SDinh Nguyen 				PHY_DEBUG_DISABLE_GUARANTEED_READ)) {
22823da42859SDinh Nguyen 				if (!rw_mgr_mem_calibrate_read_test_patterns_all_ranks
22833da42859SDinh Nguyen 				    (read_group, 1, &bit_chk)) {
22843da42859SDinh Nguyen 					debug_cond(DLEVEL == 1, "%s:%d Guaranteed read test failed:",
22853da42859SDinh Nguyen 						   __func__, __LINE__);
22863da42859SDinh Nguyen 					debug_cond(DLEVEL == 1, " g=%u p=%u d=%u\n",
22873da42859SDinh Nguyen 						   read_group, p, d);
22883da42859SDinh Nguyen 					break;
22893da42859SDinh Nguyen 				}
22903da42859SDinh Nguyen 			}
22913da42859SDinh Nguyen 
22923da42859SDinh Nguyen /* case:56390 */
22933da42859SDinh Nguyen 			grp_calibrated = 1;
22943da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase_sweep_dq_in_delay
22953da42859SDinh Nguyen 		    (write_group, read_group, test_bgn)) {
22963da42859SDinh Nguyen 				/*
22973da42859SDinh Nguyen 				 * USER Read per-bit deskew can be done on a
22983da42859SDinh Nguyen 				 * per shadow register basis.
22993da42859SDinh Nguyen 				 */
23003da42859SDinh Nguyen 				for (rank_bgn = 0, sr = 0;
23013da42859SDinh Nguyen 					rank_bgn < RW_MGR_MEM_NUMBER_OF_RANKS;
23023da42859SDinh Nguyen 					rank_bgn += NUM_RANKS_PER_SHADOW_REG,
23033da42859SDinh Nguyen 					++sr) {
23043da42859SDinh Nguyen 					/*
23053da42859SDinh Nguyen 					 * Determine if this set of ranks
23063da42859SDinh Nguyen 					 * should be skipped entirely.
23073da42859SDinh Nguyen 					 */
23083da42859SDinh Nguyen 					if (!param->skip_shadow_regs[sr]) {
23093da42859SDinh Nguyen 						/*
23103da42859SDinh Nguyen 						 * If doing read after write
23113da42859SDinh Nguyen 						 * calibration, do not update
23123da42859SDinh Nguyen 						 * FOM, now - do it then.
23133da42859SDinh Nguyen 						 */
23143da42859SDinh Nguyen 					if (!rw_mgr_mem_calibrate_vfifo_center
23153da42859SDinh Nguyen 						(rank_bgn, write_group,
23163da42859SDinh Nguyen 						read_group, test_bgn, 1, 0)) {
23173da42859SDinh Nguyen 							grp_calibrated = 0;
23183da42859SDinh Nguyen 							failed_substage =
23193da42859SDinh Nguyen 						CAL_SUBSTAGE_VFIFO_CENTER;
23203da42859SDinh Nguyen 						}
23213da42859SDinh Nguyen 					}
23223da42859SDinh Nguyen 				}
23233da42859SDinh Nguyen 			} else {
23243da42859SDinh Nguyen 				grp_calibrated = 0;
23253da42859SDinh Nguyen 				failed_substage = CAL_SUBSTAGE_DQS_EN_PHASE;
23263da42859SDinh Nguyen 			}
23273da42859SDinh Nguyen 		}
23283da42859SDinh Nguyen 	}
23293da42859SDinh Nguyen 
23303da42859SDinh Nguyen 	if (grp_calibrated == 0) {
23313da42859SDinh Nguyen 		set_failing_group_stage(write_group, CAL_STAGE_VFIFO,
23323da42859SDinh Nguyen 					failed_substage);
23333da42859SDinh Nguyen 		return 0;
23343da42859SDinh Nguyen 	}
23353da42859SDinh Nguyen 
23363da42859SDinh Nguyen 	/*
23373da42859SDinh Nguyen 	 * Reset the delay chains back to zero if they have moved > 1
23383da42859SDinh Nguyen 	 * (check for > 1 because loop will increase d even when pass in
23393da42859SDinh Nguyen 	 * first case).
23403da42859SDinh Nguyen 	 */
23413da42859SDinh Nguyen 	if (d > 2)
23423da42859SDinh Nguyen 		scc_mgr_zero_group(write_group, write_test_bgn, 1);
23433da42859SDinh Nguyen 
23443da42859SDinh Nguyen 	return 1;
23453da42859SDinh Nguyen }
23463da42859SDinh Nguyen 
23473da42859SDinh Nguyen /* VFIFO Calibration -- Read Deskew Calibration after write deskew */
23483da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo_end(uint32_t read_group,
23493da42859SDinh Nguyen 					       uint32_t test_bgn)
23503da42859SDinh Nguyen {
23513da42859SDinh Nguyen 	uint32_t rank_bgn, sr;
23523da42859SDinh Nguyen 	uint32_t grp_calibrated;
23533da42859SDinh Nguyen 	uint32_t write_group;
23543da42859SDinh Nguyen 
23553da42859SDinh Nguyen 	debug("%s:%d %u %u", __func__, __LINE__, read_group, test_bgn);
23563da42859SDinh Nguyen 
23573da42859SDinh Nguyen 	/* update info for sims */
23583da42859SDinh Nguyen 
23593da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_VFIFO_AFTER_WRITES);
23603da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_VFIFO_CENTER);
23613da42859SDinh Nguyen 
23623da42859SDinh Nguyen 	write_group = read_group;
23633da42859SDinh Nguyen 
23643da42859SDinh Nguyen 	/* update info for sims */
23653da42859SDinh Nguyen 	reg_file_set_group(read_group);
23663da42859SDinh Nguyen 
23673da42859SDinh Nguyen 	grp_calibrated = 1;
23683da42859SDinh Nguyen 	/* Read per-bit deskew can be done on a per shadow register basis */
23693da42859SDinh Nguyen 	for (rank_bgn = 0, sr = 0; rank_bgn < RW_MGR_MEM_NUMBER_OF_RANKS;
23703da42859SDinh Nguyen 		rank_bgn += NUM_RANKS_PER_SHADOW_REG, ++sr) {
23713da42859SDinh Nguyen 		/* Determine if this set of ranks should be skipped entirely */
23723da42859SDinh Nguyen 		if (!param->skip_shadow_regs[sr]) {
23733da42859SDinh Nguyen 		/* This is the last calibration round, update FOM here */
23743da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_vfifo_center(rank_bgn,
23753da42859SDinh Nguyen 								write_group,
23763da42859SDinh Nguyen 								read_group,
23773da42859SDinh Nguyen 								test_bgn, 0,
23783da42859SDinh Nguyen 								1)) {
23793da42859SDinh Nguyen 				grp_calibrated = 0;
23803da42859SDinh Nguyen 			}
23813da42859SDinh Nguyen 		}
23823da42859SDinh Nguyen 	}
23833da42859SDinh Nguyen 
23843da42859SDinh Nguyen 
23853da42859SDinh Nguyen 	if (grp_calibrated == 0) {
23863da42859SDinh Nguyen 		set_failing_group_stage(write_group,
23873da42859SDinh Nguyen 					CAL_STAGE_VFIFO_AFTER_WRITES,
23883da42859SDinh Nguyen 					CAL_SUBSTAGE_VFIFO_CENTER);
23893da42859SDinh Nguyen 		return 0;
23903da42859SDinh Nguyen 	}
23913da42859SDinh Nguyen 
23923da42859SDinh Nguyen 	return 1;
23933da42859SDinh Nguyen }
23943da42859SDinh Nguyen 
23953da42859SDinh Nguyen /* Calibrate LFIFO to find smallest read latency */
23963da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_lfifo(void)
23973da42859SDinh Nguyen {
23983da42859SDinh Nguyen 	uint32_t found_one;
23993da42859SDinh Nguyen 	uint32_t bit_chk;
24003da42859SDinh Nguyen 
24013da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
24023da42859SDinh Nguyen 
24033da42859SDinh Nguyen 	/* update info for sims */
24043da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_LFIFO);
24053da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_READ_LATENCY);
24063da42859SDinh Nguyen 
24073da42859SDinh Nguyen 	/* Load up the patterns used by read calibration for all ranks */
24083da42859SDinh Nguyen 	rw_mgr_mem_calibrate_read_load_patterns(0, 1);
24093da42859SDinh Nguyen 	found_one = 0;
24103da42859SDinh Nguyen 
24113da42859SDinh Nguyen 	do {
24121273dd9eSMarek Vasut 		writel(gbl->curr_read_lat, &phy_mgr_cfg->phy_rlat);
24133da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d lfifo: read_lat=%u",
24143da42859SDinh Nguyen 			   __func__, __LINE__, gbl->curr_read_lat);
24153da42859SDinh Nguyen 
24163da42859SDinh Nguyen 		if (!rw_mgr_mem_calibrate_read_test_all_ranks(0,
24173da42859SDinh Nguyen 							      NUM_READ_TESTS,
24183da42859SDinh Nguyen 							      PASS_ALL_BITS,
24193da42859SDinh Nguyen 							      &bit_chk, 1)) {
24203da42859SDinh Nguyen 			break;
24213da42859SDinh Nguyen 		}
24223da42859SDinh Nguyen 
24233da42859SDinh Nguyen 		found_one = 1;
24243da42859SDinh Nguyen 		/* reduce read latency and see if things are working */
24253da42859SDinh Nguyen 		/* correctly */
24263da42859SDinh Nguyen 		gbl->curr_read_lat--;
24273da42859SDinh Nguyen 	} while (gbl->curr_read_lat > 0);
24283da42859SDinh Nguyen 
24293da42859SDinh Nguyen 	/* reset the fifos to get pointers to known state */
24303da42859SDinh Nguyen 
24311273dd9eSMarek Vasut 	writel(0, &phy_mgr_cmd->fifo_reset);
24323da42859SDinh Nguyen 
24333da42859SDinh Nguyen 	if (found_one) {
24343da42859SDinh Nguyen 		/* add a fudge factor to the read latency that was determined */
24353da42859SDinh Nguyen 		gbl->curr_read_lat += 2;
24361273dd9eSMarek Vasut 		writel(gbl->curr_read_lat, &phy_mgr_cfg->phy_rlat);
24373da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d lfifo: success: using \
24383da42859SDinh Nguyen 			   read_lat=%u\n", __func__, __LINE__,
24393da42859SDinh Nguyen 			   gbl->curr_read_lat);
24403da42859SDinh Nguyen 		return 1;
24413da42859SDinh Nguyen 	} else {
24423da42859SDinh Nguyen 		set_failing_group_stage(0xff, CAL_STAGE_LFIFO,
24433da42859SDinh Nguyen 					CAL_SUBSTAGE_READ_LATENCY);
24443da42859SDinh Nguyen 
24453da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d lfifo: failed at initial \
24463da42859SDinh Nguyen 			   read_lat=%u\n", __func__, __LINE__,
24473da42859SDinh Nguyen 			   gbl->curr_read_lat);
24483da42859SDinh Nguyen 		return 0;
24493da42859SDinh Nguyen 	}
24503da42859SDinh Nguyen }
24513da42859SDinh Nguyen 
24523da42859SDinh Nguyen /*
24533da42859SDinh Nguyen  * issue write test command.
24543da42859SDinh Nguyen  * two variants are provided. one that just tests a write pattern and
24553da42859SDinh Nguyen  * another that tests datamask functionality.
24563da42859SDinh Nguyen  */
24573da42859SDinh Nguyen static void rw_mgr_mem_calibrate_write_test_issue(uint32_t group,
24583da42859SDinh Nguyen 						  uint32_t test_dm)
24593da42859SDinh Nguyen {
24603da42859SDinh Nguyen 	uint32_t mcc_instruction;
24613da42859SDinh Nguyen 	uint32_t quick_write_mode = (((STATIC_CALIB_STEPS) & CALIB_SKIP_WRITES) &&
24623da42859SDinh Nguyen 		ENABLE_SUPER_QUICK_CALIBRATION);
24633da42859SDinh Nguyen 	uint32_t rw_wl_nop_cycles;
24643da42859SDinh Nguyen 	uint32_t addr;
24653da42859SDinh Nguyen 
24663da42859SDinh Nguyen 	/*
24673da42859SDinh Nguyen 	 * Set counter and jump addresses for the right
24683da42859SDinh Nguyen 	 * number of NOP cycles.
24693da42859SDinh Nguyen 	 * The number of supported NOP cycles can range from -1 to infinity
24703da42859SDinh Nguyen 	 * Three different cases are handled:
24713da42859SDinh Nguyen 	 *
24723da42859SDinh Nguyen 	 * 1. For a number of NOP cycles greater than 0, the RW Mgr looping
24733da42859SDinh Nguyen 	 *    mechanism will be used to insert the right number of NOPs
24743da42859SDinh Nguyen 	 *
24753da42859SDinh Nguyen 	 * 2. For a number of NOP cycles equals to 0, the micro-instruction
24763da42859SDinh Nguyen 	 *    issuing the write command will jump straight to the
24773da42859SDinh Nguyen 	 *    micro-instruction that turns on DQS (for DDRx), or outputs write
24783da42859SDinh Nguyen 	 *    data (for RLD), skipping
24793da42859SDinh Nguyen 	 *    the NOP micro-instruction all together
24803da42859SDinh Nguyen 	 *
24813da42859SDinh Nguyen 	 * 3. A number of NOP cycles equal to -1 indicates that DQS must be
24823da42859SDinh Nguyen 	 *    turned on in the same micro-instruction that issues the write
24833da42859SDinh Nguyen 	 *    command. Then we need
24843da42859SDinh Nguyen 	 *    to directly jump to the micro-instruction that sends out the data
24853da42859SDinh Nguyen 	 *
24863da42859SDinh Nguyen 	 * NOTE: Implementing this mechanism uses 2 RW Mgr jump-counters
24873da42859SDinh Nguyen 	 *       (2 and 3). One jump-counter (0) is used to perform multiple
24883da42859SDinh Nguyen 	 *       write-read operations.
24893da42859SDinh Nguyen 	 *       one counter left to issue this command in "multiple-group" mode
24903da42859SDinh Nguyen 	 */
24913da42859SDinh Nguyen 
24923da42859SDinh Nguyen 	rw_wl_nop_cycles = gbl->rw_wl_nop_cycles;
24933da42859SDinh Nguyen 
24943da42859SDinh Nguyen 	if (rw_wl_nop_cycles == -1) {
24953da42859SDinh Nguyen 		/*
24963da42859SDinh Nguyen 		 * CNTR 2 - We want to execute the special write operation that
24973da42859SDinh Nguyen 		 * turns on DQS right away and then skip directly to the
24983da42859SDinh Nguyen 		 * instruction that sends out the data. We set the counter to a
24993da42859SDinh Nguyen 		 * large number so that the jump is always taken.
25003da42859SDinh Nguyen 		 */
25011273dd9eSMarek Vasut 		writel(0xFF, &sdr_rw_load_mgr_regs->load_cntr2);
25023da42859SDinh Nguyen 
25033da42859SDinh Nguyen 		/* CNTR 3 - Not used */
25043da42859SDinh Nguyen 		if (test_dm) {
25053da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_DM_BANK_0_WL_1;
25063da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_DATA,
25071273dd9eSMarek Vasut 			       &sdr_rw_load_jump_mgr_regs->load_jump_add2);
25083da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_NOP,
25091273dd9eSMarek Vasut 			       &sdr_rw_load_jump_mgr_regs->load_jump_add3);
25103da42859SDinh Nguyen 		} else {
25113da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_BANK_0_WL_1;
25121273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_BANK_0_DATA,
25131273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add2);
25141273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_BANK_0_NOP,
25151273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add3);
25163da42859SDinh Nguyen 		}
25173da42859SDinh Nguyen 	} else if (rw_wl_nop_cycles == 0) {
25183da42859SDinh Nguyen 		/*
25193da42859SDinh Nguyen 		 * CNTR 2 - We want to skip the NOP operation and go straight
25203da42859SDinh Nguyen 		 * to the DQS enable instruction. We set the counter to a large
25213da42859SDinh Nguyen 		 * number so that the jump is always taken.
25223da42859SDinh Nguyen 		 */
25231273dd9eSMarek Vasut 		writel(0xFF, &sdr_rw_load_mgr_regs->load_cntr2);
25243da42859SDinh Nguyen 
25253da42859SDinh Nguyen 		/* CNTR 3 - Not used */
25263da42859SDinh Nguyen 		if (test_dm) {
25273da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_DM_BANK_0;
25283da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_DQS,
25291273dd9eSMarek Vasut 			       &sdr_rw_load_jump_mgr_regs->load_jump_add2);
25303da42859SDinh Nguyen 		} else {
25313da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_BANK_0;
25321273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_BANK_0_DQS,
25331273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add2);
25343da42859SDinh Nguyen 		}
25353da42859SDinh Nguyen 	} else {
25363da42859SDinh Nguyen 		/*
25373da42859SDinh Nguyen 		 * CNTR 2 - In this case we want to execute the next instruction
25383da42859SDinh Nguyen 		 * and NOT take the jump. So we set the counter to 0. The jump
25393da42859SDinh Nguyen 		 * address doesn't count.
25403da42859SDinh Nguyen 		 */
25411273dd9eSMarek Vasut 		writel(0x0, &sdr_rw_load_mgr_regs->load_cntr2);
25421273dd9eSMarek Vasut 		writel(0x0, &sdr_rw_load_jump_mgr_regs->load_jump_add2);
25433da42859SDinh Nguyen 
25443da42859SDinh Nguyen 		/*
25453da42859SDinh Nguyen 		 * CNTR 3 - Set the nop counter to the number of cycles we
25463da42859SDinh Nguyen 		 * need to loop for, minus 1.
25473da42859SDinh Nguyen 		 */
25481273dd9eSMarek Vasut 		writel(rw_wl_nop_cycles - 1, &sdr_rw_load_mgr_regs->load_cntr3);
25493da42859SDinh Nguyen 		if (test_dm) {
25503da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_DM_BANK_0;
25511273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_NOP,
25521273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add3);
25533da42859SDinh Nguyen 		} else {
25543da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_BANK_0;
25551273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_BANK_0_NOP,
25561273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add3);
25573da42859SDinh Nguyen 		}
25583da42859SDinh Nguyen 	}
25593da42859SDinh Nguyen 
25601273dd9eSMarek Vasut 	writel(0, SDR_PHYGRP_RWMGRGRP_ADDRESS |
25611273dd9eSMarek Vasut 		  RW_MGR_RESET_READ_DATAPATH_OFFSET);
25623da42859SDinh Nguyen 
25633da42859SDinh Nguyen 	if (quick_write_mode)
25641273dd9eSMarek Vasut 		writel(0x08, &sdr_rw_load_mgr_regs->load_cntr0);
25653da42859SDinh Nguyen 	else
25661273dd9eSMarek Vasut 		writel(0x40, &sdr_rw_load_mgr_regs->load_cntr0);
25673da42859SDinh Nguyen 
25681273dd9eSMarek Vasut 	writel(mcc_instruction, &sdr_rw_load_jump_mgr_regs->load_jump_add0);
25693da42859SDinh Nguyen 
25703da42859SDinh Nguyen 	/*
25713da42859SDinh Nguyen 	 * CNTR 1 - This is used to ensure enough time elapses
25723da42859SDinh Nguyen 	 * for read data to come back.
25733da42859SDinh Nguyen 	 */
25741273dd9eSMarek Vasut 	writel(0x30, &sdr_rw_load_mgr_regs->load_cntr1);
25753da42859SDinh Nguyen 
25763da42859SDinh Nguyen 	if (test_dm) {
25771273dd9eSMarek Vasut 		writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_WAIT,
25781273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
25793da42859SDinh Nguyen 	} else {
25801273dd9eSMarek Vasut 		writel(RW_MGR_LFSR_WR_RD_BANK_0_WAIT,
25811273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
25823da42859SDinh Nguyen 	}
25833da42859SDinh Nguyen 
2584c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
258517fdc916SMarek Vasut 	writel(mcc_instruction, addr + (group << 2));
25863da42859SDinh Nguyen }
25873da42859SDinh Nguyen 
25883da42859SDinh Nguyen /* Test writes, can check for a single bit pass or multiple bit pass */
25893da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_write_test(uint32_t rank_bgn,
25903da42859SDinh Nguyen 	uint32_t write_group, uint32_t use_dm, uint32_t all_correct,
25913da42859SDinh Nguyen 	uint32_t *bit_chk, uint32_t all_ranks)
25923da42859SDinh Nguyen {
25933da42859SDinh Nguyen 	uint32_t r;
25943da42859SDinh Nguyen 	uint32_t correct_mask_vg;
25953da42859SDinh Nguyen 	uint32_t tmp_bit_chk;
25963da42859SDinh Nguyen 	uint32_t vg;
25973da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
25983da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
25993da42859SDinh Nguyen 	uint32_t addr_rw_mgr;
26003da42859SDinh Nguyen 	uint32_t base_rw_mgr;
26013da42859SDinh Nguyen 
26023da42859SDinh Nguyen 	*bit_chk = param->write_correct_mask;
26033da42859SDinh Nguyen 	correct_mask_vg = param->write_correct_mask_vg;
26043da42859SDinh Nguyen 
26053da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
26063da42859SDinh Nguyen 		if (param->skip_ranks[r]) {
26073da42859SDinh Nguyen 			/* request to skip the rank */
26083da42859SDinh Nguyen 			continue;
26093da42859SDinh Nguyen 		}
26103da42859SDinh Nguyen 
26113da42859SDinh Nguyen 		/* set rank */
26123da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
26133da42859SDinh Nguyen 
26143da42859SDinh Nguyen 		tmp_bit_chk = 0;
2615a4bfa463SMarek Vasut 		addr_rw_mgr = SDR_PHYGRP_RWMGRGRP_ADDRESS;
26163da42859SDinh Nguyen 		for (vg = RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS-1; ; vg--) {
26173da42859SDinh Nguyen 			/* reset the fifos to get pointers to known state */
26181273dd9eSMarek Vasut 			writel(0, &phy_mgr_cmd->fifo_reset);
26193da42859SDinh Nguyen 
26203da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk <<
26213da42859SDinh Nguyen 				(RW_MGR_MEM_DQ_PER_WRITE_DQS /
26223da42859SDinh Nguyen 				RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS);
26233da42859SDinh Nguyen 			rw_mgr_mem_calibrate_write_test_issue(write_group *
26243da42859SDinh Nguyen 				RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS+vg,
26253da42859SDinh Nguyen 				use_dm);
26263da42859SDinh Nguyen 
262717fdc916SMarek Vasut 			base_rw_mgr = readl(addr_rw_mgr);
26283da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk | (correct_mask_vg & ~(base_rw_mgr));
26293da42859SDinh Nguyen 			if (vg == 0)
26303da42859SDinh Nguyen 				break;
26313da42859SDinh Nguyen 		}
26323da42859SDinh Nguyen 		*bit_chk &= tmp_bit_chk;
26333da42859SDinh Nguyen 	}
26343da42859SDinh Nguyen 
26353da42859SDinh Nguyen 	if (all_correct) {
26363da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
26373da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_test(%u,%u,ALL) : %u == \
26383da42859SDinh Nguyen 			   %u => %lu", write_group, use_dm,
26393da42859SDinh Nguyen 			   *bit_chk, param->write_correct_mask,
26403da42859SDinh Nguyen 			   (long unsigned int)(*bit_chk ==
26413da42859SDinh Nguyen 			   param->write_correct_mask));
26423da42859SDinh Nguyen 		return *bit_chk == param->write_correct_mask;
26433da42859SDinh Nguyen 	} else {
26443da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
26453da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_test(%u,%u,ONE) : %u != ",
26463da42859SDinh Nguyen 		       write_group, use_dm, *bit_chk);
26473da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%lu" " => %lu", (long unsigned int)0,
26483da42859SDinh Nguyen 			(long unsigned int)(*bit_chk != 0));
26493da42859SDinh Nguyen 		return *bit_chk != 0x00;
26503da42859SDinh Nguyen 	}
26513da42859SDinh Nguyen }
26523da42859SDinh Nguyen 
26533da42859SDinh Nguyen /*
26543da42859SDinh Nguyen  * center all windows. do per-bit-deskew to possibly increase size of
26553da42859SDinh Nguyen  * certain windows.
26563da42859SDinh Nguyen  */
26573da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_writes_center(uint32_t rank_bgn,
26583da42859SDinh Nguyen 	uint32_t write_group, uint32_t test_bgn)
26593da42859SDinh Nguyen {
26603da42859SDinh Nguyen 	uint32_t i, p, min_index;
26613da42859SDinh Nguyen 	int32_t d;
26623da42859SDinh Nguyen 	/*
26633da42859SDinh Nguyen 	 * Store these as signed since there are comparisons with
26643da42859SDinh Nguyen 	 * signed numbers.
26653da42859SDinh Nguyen 	 */
26663da42859SDinh Nguyen 	uint32_t bit_chk;
26673da42859SDinh Nguyen 	uint32_t sticky_bit_chk;
26683da42859SDinh Nguyen 	int32_t left_edge[RW_MGR_MEM_DQ_PER_WRITE_DQS];
26693da42859SDinh Nguyen 	int32_t right_edge[RW_MGR_MEM_DQ_PER_WRITE_DQS];
26703da42859SDinh Nguyen 	int32_t mid;
26713da42859SDinh Nguyen 	int32_t mid_min, orig_mid_min;
26723da42859SDinh Nguyen 	int32_t new_dqs, start_dqs, shift_dq;
26733da42859SDinh Nguyen 	int32_t dq_margin, dqs_margin, dm_margin;
26743da42859SDinh Nguyen 	uint32_t stop;
26753da42859SDinh Nguyen 	uint32_t temp_dq_out1_delay;
26763da42859SDinh Nguyen 	uint32_t addr;
26773da42859SDinh Nguyen 
26783da42859SDinh Nguyen 	debug("%s:%d %u %u", __func__, __LINE__, write_group, test_bgn);
26793da42859SDinh Nguyen 
26803da42859SDinh Nguyen 	dm_margin = 0;
26813da42859SDinh Nguyen 
2682c4815f76SMarek Vasut 	addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
268317fdc916SMarek Vasut 	start_dqs = readl(addr +
26843da42859SDinh Nguyen 			  (RW_MGR_MEM_DQ_PER_WRITE_DQS << 2));
26853da42859SDinh Nguyen 
26863da42859SDinh Nguyen 	/* per-bit deskew */
26873da42859SDinh Nguyen 
26883da42859SDinh Nguyen 	/*
26893da42859SDinh Nguyen 	 * set the left and right edge of each bit to an illegal value
26903da42859SDinh Nguyen 	 * use (IO_IO_OUT1_DELAY_MAX + 1) as an illegal value.
26913da42859SDinh Nguyen 	 */
26923da42859SDinh Nguyen 	sticky_bit_chk = 0;
26933da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
26943da42859SDinh Nguyen 		left_edge[i]  = IO_IO_OUT1_DELAY_MAX + 1;
26953da42859SDinh Nguyen 		right_edge[i] = IO_IO_OUT1_DELAY_MAX + 1;
26963da42859SDinh Nguyen 	}
26973da42859SDinh Nguyen 
26983da42859SDinh Nguyen 	/* Search for the left edge of the window for each bit */
26993da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_OUT1_DELAY_MAX; d++) {
27003da42859SDinh Nguyen 		scc_mgr_apply_group_dq_out1_delay(write_group, test_bgn, d);
27013da42859SDinh Nguyen 
27021273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
27033da42859SDinh Nguyen 
27043da42859SDinh Nguyen 		/*
27053da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
27063da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
27073da42859SDinh Nguyen 		 */
27083da42859SDinh Nguyen 		stop = !rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
27093da42859SDinh Nguyen 			0, PASS_ONE_BIT, &bit_chk, 0);
27103da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
27113da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->write_correct_mask);
27123da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center(left): dtap=%d => %u \
27133da42859SDinh Nguyen 			   == %u && %u [bit_chk= %u ]\n",
27143da42859SDinh Nguyen 			d, sticky_bit_chk, param->write_correct_mask,
27153da42859SDinh Nguyen 			stop, bit_chk);
27163da42859SDinh Nguyen 
27173da42859SDinh Nguyen 		if (stop == 1) {
27183da42859SDinh Nguyen 			break;
27193da42859SDinh Nguyen 		} else {
27203da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
27213da42859SDinh Nguyen 				if (bit_chk & 1) {
27223da42859SDinh Nguyen 					/*
27233da42859SDinh Nguyen 					 * Remember a passing test as the
27243da42859SDinh Nguyen 					 * left_edge.
27253da42859SDinh Nguyen 					 */
27263da42859SDinh Nguyen 					left_edge[i] = d;
27273da42859SDinh Nguyen 				} else {
27283da42859SDinh Nguyen 					/*
27293da42859SDinh Nguyen 					 * If a left edge has not been seen
27303da42859SDinh Nguyen 					 * yet, then a future passing test will
27313da42859SDinh Nguyen 					 * mark this edge as the right edge.
27323da42859SDinh Nguyen 					 */
27333da42859SDinh Nguyen 					if (left_edge[i] ==
27343da42859SDinh Nguyen 						IO_IO_OUT1_DELAY_MAX + 1) {
27353da42859SDinh Nguyen 						right_edge[i] = -(d + 1);
27363da42859SDinh Nguyen 					}
27373da42859SDinh Nguyen 				}
27383da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "write_center[l,d=%d):", d);
27393da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "bit_chk_test=%d left_edge[%u]: %d",
27403da42859SDinh Nguyen 					   (int)(bit_chk & 1), i, left_edge[i]);
27413da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "right_edge[%u]: %d\n", i,
27423da42859SDinh Nguyen 				       right_edge[i]);
27433da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
27443da42859SDinh Nguyen 			}
27453da42859SDinh Nguyen 		}
27463da42859SDinh Nguyen 	}
27473da42859SDinh Nguyen 
27483da42859SDinh Nguyen 	/* Reset DQ delay chains to 0 */
27493da42859SDinh Nguyen 	scc_mgr_apply_group_dq_out1_delay(write_group, test_bgn, 0);
27503da42859SDinh Nguyen 	sticky_bit_chk = 0;
27513da42859SDinh Nguyen 	for (i = RW_MGR_MEM_DQ_PER_WRITE_DQS - 1;; i--) {
27523da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d write_center: left_edge[%u]: \
27533da42859SDinh Nguyen 			   %d right_edge[%u]: %d\n", __func__, __LINE__,
27543da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
27553da42859SDinh Nguyen 
27563da42859SDinh Nguyen 		/*
27573da42859SDinh Nguyen 		 * Check for cases where we haven't found the left edge,
27583da42859SDinh Nguyen 		 * which makes our assignment of the the right edge invalid.
27593da42859SDinh Nguyen 		 * Reset it to the illegal value.
27603da42859SDinh Nguyen 		 */
27613da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_OUT1_DELAY_MAX + 1) &&
27623da42859SDinh Nguyen 		    (right_edge[i] != IO_IO_OUT1_DELAY_MAX + 1)) {
27633da42859SDinh Nguyen 			right_edge[i] = IO_IO_OUT1_DELAY_MAX + 1;
27643da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d write_center: reset \
27653da42859SDinh Nguyen 				   right_edge[%u]: %d\n", __func__, __LINE__,
27663da42859SDinh Nguyen 				   i, right_edge[i]);
27673da42859SDinh Nguyen 		}
27683da42859SDinh Nguyen 
27693da42859SDinh Nguyen 		/*
27703da42859SDinh Nguyen 		 * Reset sticky bit (except for bits where we have
27713da42859SDinh Nguyen 		 * seen the left edge).
27723da42859SDinh Nguyen 		 */
27733da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk << 1;
27743da42859SDinh Nguyen 		if ((left_edge[i] != IO_IO_OUT1_DELAY_MAX + 1))
27753da42859SDinh Nguyen 			sticky_bit_chk = sticky_bit_chk | 1;
27763da42859SDinh Nguyen 
27773da42859SDinh Nguyen 		if (i == 0)
27783da42859SDinh Nguyen 			break;
27793da42859SDinh Nguyen 	}
27803da42859SDinh Nguyen 
27813da42859SDinh Nguyen 	/* Search for the right edge of the window for each bit */
27823da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_OUT1_DELAY_MAX - start_dqs; d++) {
27833da42859SDinh Nguyen 		scc_mgr_apply_group_dqs_io_and_oct_out1(write_group,
27843da42859SDinh Nguyen 							d + start_dqs);
27853da42859SDinh Nguyen 
27861273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
27873da42859SDinh Nguyen 
27883da42859SDinh Nguyen 		/*
27893da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
27903da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
27913da42859SDinh Nguyen 		 */
27923da42859SDinh Nguyen 		stop = !rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
27933da42859SDinh Nguyen 			0, PASS_ONE_BIT, &bit_chk, 0);
27943da42859SDinh Nguyen 
27953da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
27963da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->write_correct_mask);
27973da42859SDinh Nguyen 
27983da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center (right): dtap=%u => %u == \
27993da42859SDinh Nguyen 			   %u && %u\n", d, sticky_bit_chk,
28003da42859SDinh Nguyen 			   param->write_correct_mask, stop);
28013da42859SDinh Nguyen 
28023da42859SDinh Nguyen 		if (stop == 1) {
28033da42859SDinh Nguyen 			if (d == 0) {
28043da42859SDinh Nguyen 				for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS;
28053da42859SDinh Nguyen 					i++) {
28063da42859SDinh Nguyen 					/* d = 0 failed, but it passed when
28073da42859SDinh Nguyen 					testing the left edge, so it must be
28083da42859SDinh Nguyen 					marginal, set it to -1 */
28093da42859SDinh Nguyen 					if (right_edge[i] ==
28103da42859SDinh Nguyen 						IO_IO_OUT1_DELAY_MAX + 1 &&
28113da42859SDinh Nguyen 						left_edge[i] !=
28123da42859SDinh Nguyen 						IO_IO_OUT1_DELAY_MAX + 1) {
28133da42859SDinh Nguyen 						right_edge[i] = -1;
28143da42859SDinh Nguyen 					}
28153da42859SDinh Nguyen 				}
28163da42859SDinh Nguyen 			}
28173da42859SDinh Nguyen 			break;
28183da42859SDinh Nguyen 		} else {
28193da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
28203da42859SDinh Nguyen 				if (bit_chk & 1) {
28213da42859SDinh Nguyen 					/*
28223da42859SDinh Nguyen 					 * Remember a passing test as
28233da42859SDinh Nguyen 					 * the right_edge.
28243da42859SDinh Nguyen 					 */
28253da42859SDinh Nguyen 					right_edge[i] = d;
28263da42859SDinh Nguyen 				} else {
28273da42859SDinh Nguyen 					if (d != 0) {
28283da42859SDinh Nguyen 						/*
28293da42859SDinh Nguyen 						 * If a right edge has not
28303da42859SDinh Nguyen 						 * been seen yet, then a future
28313da42859SDinh Nguyen 						 * passing test will mark this
28323da42859SDinh Nguyen 						 * edge as the left edge.
28333da42859SDinh Nguyen 						 */
28343da42859SDinh Nguyen 						if (right_edge[i] ==
28353da42859SDinh Nguyen 						    IO_IO_OUT1_DELAY_MAX + 1)
28363da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
28373da42859SDinh Nguyen 					} else {
28383da42859SDinh Nguyen 						/*
28393da42859SDinh Nguyen 						 * d = 0 failed, but it passed
28403da42859SDinh Nguyen 						 * when testing the left edge,
28413da42859SDinh Nguyen 						 * so it must be marginal, set
28423da42859SDinh Nguyen 						 * it to -1.
28433da42859SDinh Nguyen 						 */
28443da42859SDinh Nguyen 						if (right_edge[i] ==
28453da42859SDinh Nguyen 						    IO_IO_OUT1_DELAY_MAX + 1 &&
28463da42859SDinh Nguyen 						    left_edge[i] !=
28473da42859SDinh Nguyen 						    IO_IO_OUT1_DELAY_MAX + 1)
28483da42859SDinh Nguyen 							right_edge[i] = -1;
28493da42859SDinh Nguyen 						/*
28503da42859SDinh Nguyen 						 * If a right edge has not been
28513da42859SDinh Nguyen 						 * seen yet, then a future
28523da42859SDinh Nguyen 						 * passing test will mark this
28533da42859SDinh Nguyen 						 * edge as the left edge.
28543da42859SDinh Nguyen 						 */
28553da42859SDinh Nguyen 						else if (right_edge[i] ==
28563da42859SDinh Nguyen 							IO_IO_OUT1_DELAY_MAX +
28573da42859SDinh Nguyen 							1)
28583da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
28593da42859SDinh Nguyen 					}
28603da42859SDinh Nguyen 				}
28613da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "write_center[r,d=%d):", d);
28623da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "bit_chk_test=%d left_edge[%u]: %d",
28633da42859SDinh Nguyen 					   (int)(bit_chk & 1), i, left_edge[i]);
28643da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "right_edge[%u]: %d\n", i,
28653da42859SDinh Nguyen 					   right_edge[i]);
28663da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
28673da42859SDinh Nguyen 			}
28683da42859SDinh Nguyen 		}
28693da42859SDinh Nguyen 	}
28703da42859SDinh Nguyen 
28713da42859SDinh Nguyen 	/* Check that all bits have a window */
28723da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
28733da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d write_center: left_edge[%u]: \
28743da42859SDinh Nguyen 			   %d right_edge[%u]: %d", __func__, __LINE__,
28753da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
28763da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_OUT1_DELAY_MAX + 1) ||
28773da42859SDinh Nguyen 		    (right_edge[i] == IO_IO_OUT1_DELAY_MAX + 1)) {
28783da42859SDinh Nguyen 			set_failing_group_stage(test_bgn + i,
28793da42859SDinh Nguyen 						CAL_STAGE_WRITES,
28803da42859SDinh Nguyen 						CAL_SUBSTAGE_WRITES_CENTER);
28813da42859SDinh Nguyen 			return 0;
28823da42859SDinh Nguyen 		}
28833da42859SDinh Nguyen 	}
28843da42859SDinh Nguyen 
28853da42859SDinh Nguyen 	/* Find middle of window for each DQ bit */
28863da42859SDinh Nguyen 	mid_min = left_edge[0] - right_edge[0];
28873da42859SDinh Nguyen 	min_index = 0;
28883da42859SDinh Nguyen 	for (i = 1; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
28893da42859SDinh Nguyen 		mid = left_edge[i] - right_edge[i];
28903da42859SDinh Nguyen 		if (mid < mid_min) {
28913da42859SDinh Nguyen 			mid_min = mid;
28923da42859SDinh Nguyen 			min_index = i;
28933da42859SDinh Nguyen 		}
28943da42859SDinh Nguyen 	}
28953da42859SDinh Nguyen 
28963da42859SDinh Nguyen 	/*
28973da42859SDinh Nguyen 	 * -mid_min/2 represents the amount that we need to move DQS.
28983da42859SDinh Nguyen 	 * If mid_min is odd and positive we'll need to add one to
28993da42859SDinh Nguyen 	 * make sure the rounding in further calculations is correct
29003da42859SDinh Nguyen 	 * (always bias to the right), so just add 1 for all positive values.
29013da42859SDinh Nguyen 	 */
29023da42859SDinh Nguyen 	if (mid_min > 0)
29033da42859SDinh Nguyen 		mid_min++;
29043da42859SDinh Nguyen 	mid_min = mid_min / 2;
29053da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d write_center: mid_min=%d\n", __func__,
29063da42859SDinh Nguyen 		   __LINE__, mid_min);
29073da42859SDinh Nguyen 
29083da42859SDinh Nguyen 	/* Determine the amount we can change DQS (which is -mid_min) */
29093da42859SDinh Nguyen 	orig_mid_min = mid_min;
29103da42859SDinh Nguyen 	new_dqs = start_dqs;
29113da42859SDinh Nguyen 	mid_min = 0;
29123da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d write_center: start_dqs=%d new_dqs=%d \
29133da42859SDinh Nguyen 		   mid_min=%d\n", __func__, __LINE__, start_dqs, new_dqs, mid_min);
29143da42859SDinh Nguyen 	/* Initialize data for export structures */
29153da42859SDinh Nguyen 	dqs_margin = IO_IO_OUT1_DELAY_MAX + 1;
29163da42859SDinh Nguyen 	dq_margin  = IO_IO_OUT1_DELAY_MAX + 1;
29173da42859SDinh Nguyen 
29183da42859SDinh Nguyen 	/* add delay to bring centre of all DQ windows to the same "level" */
29193da42859SDinh Nguyen 	for (i = 0, p = test_bgn; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++, p++) {
29203da42859SDinh Nguyen 		/* Use values before divide by 2 to reduce round off error */
29213da42859SDinh Nguyen 		shift_dq = (left_edge[i] - right_edge[i] -
29223da42859SDinh Nguyen 			(left_edge[min_index] - right_edge[min_index]))/2  +
29233da42859SDinh Nguyen 		(orig_mid_min - mid_min);
29243da42859SDinh Nguyen 
29253da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d write_center: before: shift_dq \
29263da42859SDinh Nguyen 			   [%u]=%d\n", __func__, __LINE__, i, shift_dq);
29273da42859SDinh Nguyen 
29281273dd9eSMarek Vasut 		addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
292917fdc916SMarek Vasut 		temp_dq_out1_delay = readl(addr + (i << 2));
29303da42859SDinh Nguyen 		if (shift_dq + (int32_t)temp_dq_out1_delay >
29313da42859SDinh Nguyen 			(int32_t)IO_IO_OUT1_DELAY_MAX) {
29323da42859SDinh Nguyen 			shift_dq = (int32_t)IO_IO_OUT1_DELAY_MAX - temp_dq_out1_delay;
29333da42859SDinh Nguyen 		} else if (shift_dq + (int32_t)temp_dq_out1_delay < 0) {
29343da42859SDinh Nguyen 			shift_dq = -(int32_t)temp_dq_out1_delay;
29353da42859SDinh Nguyen 		}
29363da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center: after: shift_dq[%u]=%d\n",
29373da42859SDinh Nguyen 			   i, shift_dq);
293807aee5bdSMarek Vasut 		scc_mgr_set_dq_out1_delay(i, temp_dq_out1_delay + shift_dq);
29393da42859SDinh Nguyen 		scc_mgr_load_dq(i);
29403da42859SDinh Nguyen 
29413da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center: margin[%u]=[%d,%d]\n", i,
29423da42859SDinh Nguyen 			   left_edge[i] - shift_dq + (-mid_min),
29433da42859SDinh Nguyen 			   right_edge[i] + shift_dq - (-mid_min));
29443da42859SDinh Nguyen 		/* To determine values for export structures */
29453da42859SDinh Nguyen 		if (left_edge[i] - shift_dq + (-mid_min) < dq_margin)
29463da42859SDinh Nguyen 			dq_margin = left_edge[i] - shift_dq + (-mid_min);
29473da42859SDinh Nguyen 
29483da42859SDinh Nguyen 		if (right_edge[i] + shift_dq - (-mid_min) < dqs_margin)
29493da42859SDinh Nguyen 			dqs_margin = right_edge[i] + shift_dq - (-mid_min);
29503da42859SDinh Nguyen 	}
29513da42859SDinh Nguyen 
29523da42859SDinh Nguyen 	/* Move DQS */
29533da42859SDinh Nguyen 	scc_mgr_apply_group_dqs_io_and_oct_out1(write_group, new_dqs);
29541273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
29553da42859SDinh Nguyen 
29563da42859SDinh Nguyen 	/* Centre DM */
29573da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d write_center: DM\n", __func__, __LINE__);
29583da42859SDinh Nguyen 
29593da42859SDinh Nguyen 	/*
29603da42859SDinh Nguyen 	 * set the left and right edge of each bit to an illegal value,
29613da42859SDinh Nguyen 	 * use (IO_IO_OUT1_DELAY_MAX + 1) as an illegal value,
29623da42859SDinh Nguyen 	 */
29633da42859SDinh Nguyen 	left_edge[0]  = IO_IO_OUT1_DELAY_MAX + 1;
29643da42859SDinh Nguyen 	right_edge[0] = IO_IO_OUT1_DELAY_MAX + 1;
29653da42859SDinh Nguyen 	int32_t bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
29663da42859SDinh Nguyen 	int32_t end_curr = IO_IO_OUT1_DELAY_MAX + 1;
29673da42859SDinh Nguyen 	int32_t bgn_best = IO_IO_OUT1_DELAY_MAX + 1;
29683da42859SDinh Nguyen 	int32_t end_best = IO_IO_OUT1_DELAY_MAX + 1;
29693da42859SDinh Nguyen 	int32_t win_best = 0;
29703da42859SDinh Nguyen 
29713da42859SDinh Nguyen 	/* Search for the/part of the window with DM shift */
29723da42859SDinh Nguyen 	for (d = IO_IO_OUT1_DELAY_MAX; d >= 0; d -= DELTA_D) {
29733da42859SDinh Nguyen 		scc_mgr_apply_group_dm_out1_delay(write_group, d);
29741273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
29753da42859SDinh Nguyen 
29763da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_write_test(rank_bgn, write_group, 1,
29773da42859SDinh Nguyen 						    PASS_ALL_BITS, &bit_chk,
29783da42859SDinh Nguyen 						    0)) {
29793da42859SDinh Nguyen 			/* USE Set current end of the window */
29803da42859SDinh Nguyen 			end_curr = -d;
29813da42859SDinh Nguyen 			/*
29823da42859SDinh Nguyen 			 * If a starting edge of our window has not been seen
29833da42859SDinh Nguyen 			 * this is our current start of the DM window.
29843da42859SDinh Nguyen 			 */
29853da42859SDinh Nguyen 			if (bgn_curr == IO_IO_OUT1_DELAY_MAX + 1)
29863da42859SDinh Nguyen 				bgn_curr = -d;
29873da42859SDinh Nguyen 
29883da42859SDinh Nguyen 			/*
29893da42859SDinh Nguyen 			 * If current window is bigger than best seen.
29903da42859SDinh Nguyen 			 * Set best seen to be current window.
29913da42859SDinh Nguyen 			 */
29923da42859SDinh Nguyen 			if ((end_curr-bgn_curr+1) > win_best) {
29933da42859SDinh Nguyen 				win_best = end_curr-bgn_curr+1;
29943da42859SDinh Nguyen 				bgn_best = bgn_curr;
29953da42859SDinh Nguyen 				end_best = end_curr;
29963da42859SDinh Nguyen 			}
29973da42859SDinh Nguyen 		} else {
29983da42859SDinh Nguyen 			/* We just saw a failing test. Reset temp edge */
29993da42859SDinh Nguyen 			bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
30003da42859SDinh Nguyen 			end_curr = IO_IO_OUT1_DELAY_MAX + 1;
30013da42859SDinh Nguyen 			}
30023da42859SDinh Nguyen 		}
30033da42859SDinh Nguyen 
30043da42859SDinh Nguyen 
30053da42859SDinh Nguyen 	/* Reset DM delay chains to 0 */
30063da42859SDinh Nguyen 	scc_mgr_apply_group_dm_out1_delay(write_group, 0);
30073da42859SDinh Nguyen 
30083da42859SDinh Nguyen 	/*
30093da42859SDinh Nguyen 	 * Check to see if the current window nudges up aganist 0 delay.
30103da42859SDinh Nguyen 	 * If so we need to continue the search by shifting DQS otherwise DQS
30113da42859SDinh Nguyen 	 * search begins as a new search. */
30123da42859SDinh Nguyen 	if (end_curr != 0) {
30133da42859SDinh Nguyen 		bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
30143da42859SDinh Nguyen 		end_curr = IO_IO_OUT1_DELAY_MAX + 1;
30153da42859SDinh Nguyen 	}
30163da42859SDinh Nguyen 
30173da42859SDinh Nguyen 	/* Search for the/part of the window with DQS shifts */
30183da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_OUT1_DELAY_MAX - new_dqs; d += DELTA_D) {
30193da42859SDinh Nguyen 		/*
30203da42859SDinh Nguyen 		 * Note: This only shifts DQS, so are we limiting ourselve to
30213da42859SDinh Nguyen 		 * width of DQ unnecessarily.
30223da42859SDinh Nguyen 		 */
30233da42859SDinh Nguyen 		scc_mgr_apply_group_dqs_io_and_oct_out1(write_group,
30243da42859SDinh Nguyen 							d + new_dqs);
30253da42859SDinh Nguyen 
30261273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
30273da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_write_test(rank_bgn, write_group, 1,
30283da42859SDinh Nguyen 						    PASS_ALL_BITS, &bit_chk,
30293da42859SDinh Nguyen 						    0)) {
30303da42859SDinh Nguyen 			/* USE Set current end of the window */
30313da42859SDinh Nguyen 			end_curr = d;
30323da42859SDinh Nguyen 			/*
30333da42859SDinh Nguyen 			 * If a beginning edge of our window has not been seen
30343da42859SDinh Nguyen 			 * this is our current begin of the DM window.
30353da42859SDinh Nguyen 			 */
30363da42859SDinh Nguyen 			if (bgn_curr == IO_IO_OUT1_DELAY_MAX + 1)
30373da42859SDinh Nguyen 				bgn_curr = d;
30383da42859SDinh Nguyen 
30393da42859SDinh Nguyen 			/*
30403da42859SDinh Nguyen 			 * If current window is bigger than best seen. Set best
30413da42859SDinh Nguyen 			 * seen to be current window.
30423da42859SDinh Nguyen 			 */
30433da42859SDinh Nguyen 			if ((end_curr-bgn_curr+1) > win_best) {
30443da42859SDinh Nguyen 				win_best = end_curr-bgn_curr+1;
30453da42859SDinh Nguyen 				bgn_best = bgn_curr;
30463da42859SDinh Nguyen 				end_best = end_curr;
30473da42859SDinh Nguyen 			}
30483da42859SDinh Nguyen 		} else {
30493da42859SDinh Nguyen 			/* We just saw a failing test. Reset temp edge */
30503da42859SDinh Nguyen 			bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
30513da42859SDinh Nguyen 			end_curr = IO_IO_OUT1_DELAY_MAX + 1;
30523da42859SDinh Nguyen 
30533da42859SDinh Nguyen 			/* Early exit optimization: if ther remaining delay
30543da42859SDinh Nguyen 			chain space is less than already seen largest window
30553da42859SDinh Nguyen 			we can exit */
30563da42859SDinh Nguyen 			if ((win_best-1) >
30573da42859SDinh Nguyen 				(IO_IO_OUT1_DELAY_MAX - new_dqs - d)) {
30583da42859SDinh Nguyen 					break;
30593da42859SDinh Nguyen 				}
30603da42859SDinh Nguyen 			}
30613da42859SDinh Nguyen 		}
30623da42859SDinh Nguyen 
30633da42859SDinh Nguyen 	/* assign left and right edge for cal and reporting; */
30643da42859SDinh Nguyen 	left_edge[0] = -1*bgn_best;
30653da42859SDinh Nguyen 	right_edge[0] = end_best;
30663da42859SDinh Nguyen 
30673da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d dm_calib: left=%d right=%d\n", __func__,
30683da42859SDinh Nguyen 		   __LINE__, left_edge[0], right_edge[0]);
30693da42859SDinh Nguyen 
30703da42859SDinh Nguyen 	/* Move DQS (back to orig) */
30713da42859SDinh Nguyen 	scc_mgr_apply_group_dqs_io_and_oct_out1(write_group, new_dqs);
30723da42859SDinh Nguyen 
30733da42859SDinh Nguyen 	/* Move DM */
30743da42859SDinh Nguyen 
30753da42859SDinh Nguyen 	/* Find middle of window for the DM bit */
30763da42859SDinh Nguyen 	mid = (left_edge[0] - right_edge[0]) / 2;
30773da42859SDinh Nguyen 
30783da42859SDinh Nguyen 	/* only move right, since we are not moving DQS/DQ */
30793da42859SDinh Nguyen 	if (mid < 0)
30803da42859SDinh Nguyen 		mid = 0;
30813da42859SDinh Nguyen 
30823da42859SDinh Nguyen 	/* dm_marign should fail if we never find a window */
30833da42859SDinh Nguyen 	if (win_best == 0)
30843da42859SDinh Nguyen 		dm_margin = -1;
30853da42859SDinh Nguyen 	else
30863da42859SDinh Nguyen 		dm_margin = left_edge[0] - mid;
30873da42859SDinh Nguyen 
30883da42859SDinh Nguyen 	scc_mgr_apply_group_dm_out1_delay(write_group, mid);
30891273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
30903da42859SDinh Nguyen 
30913da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d dm_calib: left=%d right=%d mid=%d \
30923da42859SDinh Nguyen 		   dm_margin=%d\n", __func__, __LINE__, left_edge[0],
30933da42859SDinh Nguyen 		   right_edge[0], mid, dm_margin);
30943da42859SDinh Nguyen 	/* Export values */
30953da42859SDinh Nguyen 	gbl->fom_out += dq_margin + dqs_margin;
30963da42859SDinh Nguyen 
30973da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d write_center: dq_margin=%d \
30983da42859SDinh Nguyen 		   dqs_margin=%d dm_margin=%d\n", __func__, __LINE__,
30993da42859SDinh Nguyen 		   dq_margin, dqs_margin, dm_margin);
31003da42859SDinh Nguyen 
31013da42859SDinh Nguyen 	/*
31023da42859SDinh Nguyen 	 * Do not remove this line as it makes sure all of our
31033da42859SDinh Nguyen 	 * decisions have been applied.
31043da42859SDinh Nguyen 	 */
31051273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
31063da42859SDinh Nguyen 	return (dq_margin >= 0) && (dqs_margin >= 0) && (dm_margin >= 0);
31073da42859SDinh Nguyen }
31083da42859SDinh Nguyen 
31093da42859SDinh Nguyen /* calibrate the write operations */
31103da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_writes(uint32_t rank_bgn, uint32_t g,
31113da42859SDinh Nguyen 	uint32_t test_bgn)
31123da42859SDinh Nguyen {
31133da42859SDinh Nguyen 	/* update info for sims */
31143da42859SDinh Nguyen 	debug("%s:%d %u %u\n", __func__, __LINE__, g, test_bgn);
31153da42859SDinh Nguyen 
31163da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_WRITES);
31173da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_WRITES_CENTER);
31183da42859SDinh Nguyen 
31193da42859SDinh Nguyen 	reg_file_set_group(g);
31203da42859SDinh Nguyen 
31213da42859SDinh Nguyen 	if (!rw_mgr_mem_calibrate_writes_center(rank_bgn, g, test_bgn)) {
31223da42859SDinh Nguyen 		set_failing_group_stage(g, CAL_STAGE_WRITES,
31233da42859SDinh Nguyen 					CAL_SUBSTAGE_WRITES_CENTER);
31243da42859SDinh Nguyen 		return 0;
31253da42859SDinh Nguyen 	}
31263da42859SDinh Nguyen 
31273da42859SDinh Nguyen 	return 1;
31283da42859SDinh Nguyen }
31293da42859SDinh Nguyen 
31303da42859SDinh Nguyen /* precharge all banks and activate row 0 in bank "000..." and bank "111..." */
31313da42859SDinh Nguyen static void mem_precharge_and_activate(void)
31323da42859SDinh Nguyen {
31333da42859SDinh Nguyen 	uint32_t r;
31343da42859SDinh Nguyen 
31353da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r++) {
31363da42859SDinh Nguyen 		if (param->skip_ranks[r]) {
31373da42859SDinh Nguyen 			/* request to skip the rank */
31383da42859SDinh Nguyen 			continue;
31393da42859SDinh Nguyen 		}
31403da42859SDinh Nguyen 
31413da42859SDinh Nguyen 		/* set rank */
31423da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_OFF);
31433da42859SDinh Nguyen 
31443da42859SDinh Nguyen 		/* precharge all banks ... */
31451273dd9eSMarek Vasut 		writel(RW_MGR_PRECHARGE_ALL, SDR_PHYGRP_RWMGRGRP_ADDRESS |
31461273dd9eSMarek Vasut 					     RW_MGR_RUN_SINGLE_GROUP_OFFSET);
31473da42859SDinh Nguyen 
31481273dd9eSMarek Vasut 		writel(0x0F, &sdr_rw_load_mgr_regs->load_cntr0);
31491273dd9eSMarek Vasut 		writel(RW_MGR_ACTIVATE_0_AND_1_WAIT1,
31501273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
31513da42859SDinh Nguyen 
31521273dd9eSMarek Vasut 		writel(0x0F, &sdr_rw_load_mgr_regs->load_cntr1);
31531273dd9eSMarek Vasut 		writel(RW_MGR_ACTIVATE_0_AND_1_WAIT2,
31541273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
31553da42859SDinh Nguyen 
31563da42859SDinh Nguyen 		/* activate rows */
31571273dd9eSMarek Vasut 		writel(RW_MGR_ACTIVATE_0_AND_1, SDR_PHYGRP_RWMGRGRP_ADDRESS |
31581273dd9eSMarek Vasut 						RW_MGR_RUN_SINGLE_GROUP_OFFSET);
31593da42859SDinh Nguyen 	}
31603da42859SDinh Nguyen }
31613da42859SDinh Nguyen 
31623da42859SDinh Nguyen /* Configure various memory related parameters. */
31633da42859SDinh Nguyen static void mem_config(void)
31643da42859SDinh Nguyen {
31653da42859SDinh Nguyen 	uint32_t rlat, wlat;
31663da42859SDinh Nguyen 	uint32_t rw_wl_nop_cycles;
31673da42859SDinh Nguyen 	uint32_t max_latency;
31683da42859SDinh Nguyen 
31693da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
31703da42859SDinh Nguyen 	/* read in write and read latency */
31711273dd9eSMarek Vasut 	wlat = readl(&data_mgr->t_wl_add);
31721273dd9eSMarek Vasut 	wlat += readl(&data_mgr->mem_t_add);
31733da42859SDinh Nguyen 
31743da42859SDinh Nguyen 	/* WL for hard phy does not include additive latency */
31753da42859SDinh Nguyen 
31763da42859SDinh Nguyen 	/*
31773da42859SDinh Nguyen 	 * add addtional write latency to offset the address/command extra
31783da42859SDinh Nguyen 	 * clock cycle. We change the AC mux setting causing AC to be delayed
31793da42859SDinh Nguyen 	 * by one mem clock cycle. Only do this for DDR3
31803da42859SDinh Nguyen 	 */
31813da42859SDinh Nguyen 	wlat = wlat + 1;
31823da42859SDinh Nguyen 
31831273dd9eSMarek Vasut 	rlat = readl(&data_mgr->t_rl_add);
31843da42859SDinh Nguyen 
31853da42859SDinh Nguyen 	rw_wl_nop_cycles = wlat - 2;
31863da42859SDinh Nguyen 	gbl->rw_wl_nop_cycles = rw_wl_nop_cycles;
31873da42859SDinh Nguyen 
31883da42859SDinh Nguyen 	/*
31893da42859SDinh Nguyen 	 * For AV/CV, lfifo is hardened and always runs at full rate so
31903da42859SDinh Nguyen 	 * max latency in AFI clocks, used here, is correspondingly smaller.
31913da42859SDinh Nguyen 	 */
31923da42859SDinh Nguyen 	max_latency = (1<<MAX_LATENCY_COUNT_WIDTH)/1 - 1;
31933da42859SDinh Nguyen 	/* configure for a burst length of 8 */
31943da42859SDinh Nguyen 
31953da42859SDinh Nguyen 	/* write latency */
31963da42859SDinh Nguyen 	/* Adjust Write Latency for Hard PHY */
31973da42859SDinh Nguyen 	wlat = wlat + 1;
31983da42859SDinh Nguyen 
31993da42859SDinh Nguyen 	/* set a pretty high read latency initially */
32003da42859SDinh Nguyen 	gbl->curr_read_lat = rlat + 16;
32013da42859SDinh Nguyen 
32023da42859SDinh Nguyen 	if (gbl->curr_read_lat > max_latency)
32033da42859SDinh Nguyen 		gbl->curr_read_lat = max_latency;
32043da42859SDinh Nguyen 
32051273dd9eSMarek Vasut 	writel(gbl->curr_read_lat, &phy_mgr_cfg->phy_rlat);
32063da42859SDinh Nguyen 
32073da42859SDinh Nguyen 	/* advertise write latency */
32083da42859SDinh Nguyen 	gbl->curr_write_lat = wlat;
32091273dd9eSMarek Vasut 	writel(wlat - 2, &phy_mgr_cfg->afi_wlat);
32103da42859SDinh Nguyen 
32113da42859SDinh Nguyen 	/* initialize bit slips */
32123da42859SDinh Nguyen 	mem_precharge_and_activate();
32133da42859SDinh Nguyen }
32143da42859SDinh Nguyen 
32153da42859SDinh Nguyen /* Set VFIFO and LFIFO to instant-on settings in skip calibration mode */
32163da42859SDinh Nguyen static void mem_skip_calibrate(void)
32173da42859SDinh Nguyen {
32183da42859SDinh Nguyen 	uint32_t vfifo_offset;
32193da42859SDinh Nguyen 	uint32_t i, j, r;
32203da42859SDinh Nguyen 
32213da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
32223da42859SDinh Nguyen 	/* Need to update every shadow register set used by the interface */
32233da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
32243da42859SDinh Nguyen 		r += NUM_RANKS_PER_SHADOW_REG) {
32253da42859SDinh Nguyen 		/*
32263da42859SDinh Nguyen 		 * Set output phase alignment settings appropriate for
32273da42859SDinh Nguyen 		 * skip calibration.
32283da42859SDinh Nguyen 		 */
32293da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
32303da42859SDinh Nguyen 			scc_mgr_set_dqs_en_phase(i, 0);
32313da42859SDinh Nguyen #if IO_DLL_CHAIN_LENGTH == 6
32323da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, 6);
32333da42859SDinh Nguyen #else
32343da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, 7);
32353da42859SDinh Nguyen #endif
32363da42859SDinh Nguyen 			/*
32373da42859SDinh Nguyen 			 * Case:33398
32383da42859SDinh Nguyen 			 *
32393da42859SDinh Nguyen 			 * Write data arrives to the I/O two cycles before write
32403da42859SDinh Nguyen 			 * latency is reached (720 deg).
32413da42859SDinh Nguyen 			 *   -> due to bit-slip in a/c bus
32423da42859SDinh Nguyen 			 *   -> to allow board skew where dqs is longer than ck
32433da42859SDinh Nguyen 			 *      -> how often can this happen!?
32443da42859SDinh Nguyen 			 *      -> can claim back some ptaps for high freq
32453da42859SDinh Nguyen 			 *       support if we can relax this, but i digress...
32463da42859SDinh Nguyen 			 *
32473da42859SDinh Nguyen 			 * The write_clk leads mem_ck by 90 deg
32483da42859SDinh Nguyen 			 * The minimum ptap of the OPA is 180 deg
32493da42859SDinh Nguyen 			 * Each ptap has (360 / IO_DLL_CHAIN_LENGH) deg of delay
32503da42859SDinh Nguyen 			 * The write_clk is always delayed by 2 ptaps
32513da42859SDinh Nguyen 			 *
32523da42859SDinh Nguyen 			 * Hence, to make DQS aligned to CK, we need to delay
32533da42859SDinh Nguyen 			 * DQS by:
32543da42859SDinh Nguyen 			 *    (720 - 90 - 180 - 2 * (360 / IO_DLL_CHAIN_LENGTH))
32553da42859SDinh Nguyen 			 *
32563da42859SDinh Nguyen 			 * Dividing the above by (360 / IO_DLL_CHAIN_LENGTH)
32573da42859SDinh Nguyen 			 * gives us the number of ptaps, which simplies to:
32583da42859SDinh Nguyen 			 *
32593da42859SDinh Nguyen 			 *    (1.25 * IO_DLL_CHAIN_LENGTH - 2)
32603da42859SDinh Nguyen 			 */
32613da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, (1.25 *
32623da42859SDinh Nguyen 				IO_DLL_CHAIN_LENGTH - 2));
32633da42859SDinh Nguyen 		}
32641273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dqs_ena);
32651273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dqs_io_ena);
32663da42859SDinh Nguyen 
32673da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_WRITE_DQS_WIDTH; i++) {
32681273dd9eSMarek Vasut 			writel(i, SDR_PHYGRP_SCCGRP_ADDRESS |
32691273dd9eSMarek Vasut 				  SCC_MGR_GROUP_COUNTER_OFFSET);
32703da42859SDinh Nguyen 		}
32711273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dq_ena);
32721273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dm_ena);
32731273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
32743da42859SDinh Nguyen 	}
32753da42859SDinh Nguyen 
32763da42859SDinh Nguyen 	/* Compensate for simulation model behaviour */
32773da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
32783da42859SDinh Nguyen 		scc_mgr_set_dqs_bus_in_delay(i, 10);
32793da42859SDinh Nguyen 		scc_mgr_load_dqs(i);
32803da42859SDinh Nguyen 	}
32811273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
32823da42859SDinh Nguyen 
32833da42859SDinh Nguyen 	/*
32843da42859SDinh Nguyen 	 * ArriaV has hard FIFOs that can only be initialized by incrementing
32853da42859SDinh Nguyen 	 * in sequencer.
32863da42859SDinh Nguyen 	 */
32873da42859SDinh Nguyen 	vfifo_offset = CALIB_VFIFO_OFFSET;
32883da42859SDinh Nguyen 	for (j = 0; j < vfifo_offset; j++) {
32891273dd9eSMarek Vasut 		writel(0xff, &phy_mgr_cmd->inc_vfifo_hard_phy);
32903da42859SDinh Nguyen 	}
32911273dd9eSMarek Vasut 	writel(0, &phy_mgr_cmd->fifo_reset);
32923da42859SDinh Nguyen 
32933da42859SDinh Nguyen 	/*
32943da42859SDinh Nguyen 	 * For ACV with hard lfifo, we get the skip-cal setting from
32953da42859SDinh Nguyen 	 * generation-time constant.
32963da42859SDinh Nguyen 	 */
32973da42859SDinh Nguyen 	gbl->curr_read_lat = CALIB_LFIFO_OFFSET;
32981273dd9eSMarek Vasut 	writel(gbl->curr_read_lat, &phy_mgr_cfg->phy_rlat);
32993da42859SDinh Nguyen }
33003da42859SDinh Nguyen 
33013da42859SDinh Nguyen /* Memory calibration entry point */
33023da42859SDinh Nguyen static uint32_t mem_calibrate(void)
33033da42859SDinh Nguyen {
33043da42859SDinh Nguyen 	uint32_t i;
33053da42859SDinh Nguyen 	uint32_t rank_bgn, sr;
33063da42859SDinh Nguyen 	uint32_t write_group, write_test_bgn;
33073da42859SDinh Nguyen 	uint32_t read_group, read_test_bgn;
33083da42859SDinh Nguyen 	uint32_t run_groups, current_run;
33093da42859SDinh Nguyen 	uint32_t failing_groups = 0;
33103da42859SDinh Nguyen 	uint32_t group_failed = 0;
33113da42859SDinh Nguyen 	uint32_t sr_failed = 0;
33123da42859SDinh Nguyen 
33133da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
33143da42859SDinh Nguyen 	/* Initialize the data settings */
33153da42859SDinh Nguyen 
33163da42859SDinh Nguyen 	gbl->error_substage = CAL_SUBSTAGE_NIL;
33173da42859SDinh Nguyen 	gbl->error_stage = CAL_STAGE_NIL;
33183da42859SDinh Nguyen 	gbl->error_group = 0xff;
33193da42859SDinh Nguyen 	gbl->fom_in = 0;
33203da42859SDinh Nguyen 	gbl->fom_out = 0;
33213da42859SDinh Nguyen 
33223da42859SDinh Nguyen 	mem_config();
33233da42859SDinh Nguyen 
33243da42859SDinh Nguyen 	uint32_t bypass_mode = 0x1;
33253da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
33261273dd9eSMarek Vasut 		writel(i, SDR_PHYGRP_SCCGRP_ADDRESS |
33271273dd9eSMarek Vasut 			  SCC_MGR_GROUP_COUNTER_OFFSET);
33283da42859SDinh Nguyen 		scc_set_bypass_mode(i, bypass_mode);
33293da42859SDinh Nguyen 	}
33303da42859SDinh Nguyen 
33313da42859SDinh Nguyen 	if ((dyn_calib_steps & CALIB_SKIP_ALL) == CALIB_SKIP_ALL) {
33323da42859SDinh Nguyen 		/*
33333da42859SDinh Nguyen 		 * Set VFIFO and LFIFO to instant-on settings in skip
33343da42859SDinh Nguyen 		 * calibration mode.
33353da42859SDinh Nguyen 		 */
33363da42859SDinh Nguyen 		mem_skip_calibrate();
33373da42859SDinh Nguyen 	} else {
33383da42859SDinh Nguyen 		for (i = 0; i < NUM_CALIB_REPEAT; i++) {
33393da42859SDinh Nguyen 			/*
33403da42859SDinh Nguyen 			 * Zero all delay chain/phase settings for all
33413da42859SDinh Nguyen 			 * groups and all shadow register sets.
33423da42859SDinh Nguyen 			 */
33433da42859SDinh Nguyen 			scc_mgr_zero_all();
33443da42859SDinh Nguyen 
33453da42859SDinh Nguyen 			run_groups = ~param->skip_groups;
33463da42859SDinh Nguyen 
33473da42859SDinh Nguyen 			for (write_group = 0, write_test_bgn = 0; write_group
33483da42859SDinh Nguyen 				< RW_MGR_MEM_IF_WRITE_DQS_WIDTH; write_group++,
33493da42859SDinh Nguyen 				write_test_bgn += RW_MGR_MEM_DQ_PER_WRITE_DQS) {
33503da42859SDinh Nguyen 				/* Initialized the group failure */
33513da42859SDinh Nguyen 				group_failed = 0;
33523da42859SDinh Nguyen 
33533da42859SDinh Nguyen 				current_run = run_groups & ((1 <<
33543da42859SDinh Nguyen 					RW_MGR_NUM_DQS_PER_WRITE_GROUP) - 1);
33553da42859SDinh Nguyen 				run_groups = run_groups >>
33563da42859SDinh Nguyen 					RW_MGR_NUM_DQS_PER_WRITE_GROUP;
33573da42859SDinh Nguyen 
33583da42859SDinh Nguyen 				if (current_run == 0)
33593da42859SDinh Nguyen 					continue;
33603da42859SDinh Nguyen 
33611273dd9eSMarek Vasut 				writel(write_group, SDR_PHYGRP_SCCGRP_ADDRESS |
33621273dd9eSMarek Vasut 						    SCC_MGR_GROUP_COUNTER_OFFSET);
33633da42859SDinh Nguyen 				scc_mgr_zero_group(write_group, write_test_bgn,
33643da42859SDinh Nguyen 						   0);
33653da42859SDinh Nguyen 
33663da42859SDinh Nguyen 				for (read_group = write_group *
33673da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
33683da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH,
33693da42859SDinh Nguyen 					read_test_bgn = 0;
33703da42859SDinh Nguyen 					read_group < (write_group + 1) *
33713da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
33723da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH &&
33733da42859SDinh Nguyen 					group_failed == 0;
33743da42859SDinh Nguyen 					read_group++, read_test_bgn +=
33753da42859SDinh Nguyen 					RW_MGR_MEM_DQ_PER_READ_DQS) {
33763da42859SDinh Nguyen 					/* Calibrate the VFIFO */
33773da42859SDinh Nguyen 					if (!((STATIC_CALIB_STEPS) &
33783da42859SDinh Nguyen 						CALIB_SKIP_VFIFO)) {
33793da42859SDinh Nguyen 						if (!rw_mgr_mem_calibrate_vfifo
33803da42859SDinh Nguyen 							(read_group,
33813da42859SDinh Nguyen 							read_test_bgn)) {
33823da42859SDinh Nguyen 							group_failed = 1;
33833da42859SDinh Nguyen 
33843da42859SDinh Nguyen 							if (!(gbl->
33853da42859SDinh Nguyen 							phy_debug_mode_flags &
33863da42859SDinh Nguyen 						PHY_DEBUG_SWEEP_ALL_GROUPS)) {
33873da42859SDinh Nguyen 								return 0;
33883da42859SDinh Nguyen 							}
33893da42859SDinh Nguyen 						}
33903da42859SDinh Nguyen 					}
33913da42859SDinh Nguyen 				}
33923da42859SDinh Nguyen 
33933da42859SDinh Nguyen 				/* Calibrate the output side */
33943da42859SDinh Nguyen 				if (group_failed == 0)	{
33953da42859SDinh Nguyen 					for (rank_bgn = 0, sr = 0; rank_bgn
33963da42859SDinh Nguyen 						< RW_MGR_MEM_NUMBER_OF_RANKS;
33973da42859SDinh Nguyen 						rank_bgn +=
33983da42859SDinh Nguyen 						NUM_RANKS_PER_SHADOW_REG,
33993da42859SDinh Nguyen 						++sr) {
34003da42859SDinh Nguyen 						sr_failed = 0;
34013da42859SDinh Nguyen 						if (!((STATIC_CALIB_STEPS) &
34023da42859SDinh Nguyen 						CALIB_SKIP_WRITES)) {
34033da42859SDinh Nguyen 							if ((STATIC_CALIB_STEPS)
34043da42859SDinh Nguyen 						& CALIB_SKIP_DELAY_SWEEPS) {
34053da42859SDinh Nguyen 						/* not needed in quick mode! */
34063da42859SDinh Nguyen 							} else {
34073da42859SDinh Nguyen 						/*
34083da42859SDinh Nguyen 						 * Determine if this set of
34093da42859SDinh Nguyen 						 * ranks should be skipped
34103da42859SDinh Nguyen 						 * entirely.
34113da42859SDinh Nguyen 						 */
34123da42859SDinh Nguyen 					if (!param->skip_shadow_regs[sr]) {
34133da42859SDinh Nguyen 						if (!rw_mgr_mem_calibrate_writes
34143da42859SDinh Nguyen 						(rank_bgn, write_group,
34153da42859SDinh Nguyen 						write_test_bgn)) {
34163da42859SDinh Nguyen 							sr_failed = 1;
34173da42859SDinh Nguyen 							if (!(gbl->
34183da42859SDinh Nguyen 							phy_debug_mode_flags &
34193da42859SDinh Nguyen 						PHY_DEBUG_SWEEP_ALL_GROUPS)) {
34203da42859SDinh Nguyen 								return 0;
34213da42859SDinh Nguyen 									}
34223da42859SDinh Nguyen 									}
34233da42859SDinh Nguyen 								}
34243da42859SDinh Nguyen 							}
34253da42859SDinh Nguyen 						}
34263da42859SDinh Nguyen 						if (sr_failed != 0)
34273da42859SDinh Nguyen 							group_failed = 1;
34283da42859SDinh Nguyen 					}
34293da42859SDinh Nguyen 				}
34303da42859SDinh Nguyen 
34313da42859SDinh Nguyen 				if (group_failed == 0) {
34323da42859SDinh Nguyen 					for (read_group = write_group *
34333da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
34343da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH,
34353da42859SDinh Nguyen 					read_test_bgn = 0;
34363da42859SDinh Nguyen 						read_group < (write_group + 1)
34373da42859SDinh Nguyen 						* RW_MGR_MEM_IF_READ_DQS_WIDTH
34383da42859SDinh Nguyen 						/ RW_MGR_MEM_IF_WRITE_DQS_WIDTH &&
34393da42859SDinh Nguyen 						group_failed == 0;
34403da42859SDinh Nguyen 						read_group++, read_test_bgn +=
34413da42859SDinh Nguyen 						RW_MGR_MEM_DQ_PER_READ_DQS) {
34423da42859SDinh Nguyen 						if (!((STATIC_CALIB_STEPS) &
34433da42859SDinh Nguyen 							CALIB_SKIP_WRITES)) {
34443da42859SDinh Nguyen 					if (!rw_mgr_mem_calibrate_vfifo_end
34453da42859SDinh Nguyen 						(read_group, read_test_bgn)) {
34463da42859SDinh Nguyen 							group_failed = 1;
34473da42859SDinh Nguyen 
34483da42859SDinh Nguyen 						if (!(gbl->phy_debug_mode_flags
34493da42859SDinh Nguyen 						& PHY_DEBUG_SWEEP_ALL_GROUPS)) {
34503da42859SDinh Nguyen 								return 0;
34513da42859SDinh Nguyen 								}
34523da42859SDinh Nguyen 							}
34533da42859SDinh Nguyen 						}
34543da42859SDinh Nguyen 					}
34553da42859SDinh Nguyen 				}
34563da42859SDinh Nguyen 
34573da42859SDinh Nguyen 				if (group_failed != 0)
34583da42859SDinh Nguyen 					failing_groups++;
34593da42859SDinh Nguyen 			}
34603da42859SDinh Nguyen 
34613da42859SDinh Nguyen 			/*
34623da42859SDinh Nguyen 			 * USER If there are any failing groups then report
34633da42859SDinh Nguyen 			 * the failure.
34643da42859SDinh Nguyen 			 */
34653da42859SDinh Nguyen 			if (failing_groups != 0)
34663da42859SDinh Nguyen 				return 0;
34673da42859SDinh Nguyen 
34683da42859SDinh Nguyen 			/* Calibrate the LFIFO */
34693da42859SDinh Nguyen 			if (!((STATIC_CALIB_STEPS) & CALIB_SKIP_LFIFO)) {
34703da42859SDinh Nguyen 				/*
34713da42859SDinh Nguyen 				 * If we're skipping groups as part of debug,
34723da42859SDinh Nguyen 				 * don't calibrate LFIFO.
34733da42859SDinh Nguyen 				 */
34743da42859SDinh Nguyen 				if (param->skip_groups == 0) {
34753da42859SDinh Nguyen 					if (!rw_mgr_mem_calibrate_lfifo())
34763da42859SDinh Nguyen 						return 0;
34773da42859SDinh Nguyen 				}
34783da42859SDinh Nguyen 			}
34793da42859SDinh Nguyen 		}
34803da42859SDinh Nguyen 	}
34813da42859SDinh Nguyen 
34823da42859SDinh Nguyen 	/*
34833da42859SDinh Nguyen 	 * Do not remove this line as it makes sure all of our decisions
34843da42859SDinh Nguyen 	 * have been applied.
34853da42859SDinh Nguyen 	 */
34861273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
34873da42859SDinh Nguyen 	return 1;
34883da42859SDinh Nguyen }
34893da42859SDinh Nguyen 
34903da42859SDinh Nguyen static uint32_t run_mem_calibrate(void)
34913da42859SDinh Nguyen {
34923da42859SDinh Nguyen 	uint32_t pass;
34933da42859SDinh Nguyen 	uint32_t debug_info;
34943da42859SDinh Nguyen 
34953da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
34963da42859SDinh Nguyen 
34973da42859SDinh Nguyen 	/* Reset pass/fail status shown on afi_cal_success/fail */
34981273dd9eSMarek Vasut 	writel(PHY_MGR_CAL_RESET, &phy_mgr_cfg->cal_status);
34993da42859SDinh Nguyen 
35003da42859SDinh Nguyen 	/* stop tracking manger */
35016cb9f167SMarek Vasut 	uint32_t ctrlcfg = readl(&sdr_ctrl->ctrl_cfg);
35023da42859SDinh Nguyen 
35036cb9f167SMarek Vasut 	writel(ctrlcfg & 0xFFBFFFFF, &sdr_ctrl->ctrl_cfg);
35043da42859SDinh Nguyen 
35053da42859SDinh Nguyen 	initialize();
35063da42859SDinh Nguyen 	rw_mgr_mem_initialize();
35073da42859SDinh Nguyen 
35083da42859SDinh Nguyen 	pass = mem_calibrate();
35093da42859SDinh Nguyen 
35103da42859SDinh Nguyen 	mem_precharge_and_activate();
35111273dd9eSMarek Vasut 	writel(0, &phy_mgr_cmd->fifo_reset);
35123da42859SDinh Nguyen 
35133da42859SDinh Nguyen 	/*
35143da42859SDinh Nguyen 	 * Handoff:
35153da42859SDinh Nguyen 	 * Don't return control of the PHY back to AFI when in debug mode.
35163da42859SDinh Nguyen 	 */
35173da42859SDinh Nguyen 	if ((gbl->phy_debug_mode_flags & PHY_DEBUG_IN_DEBUG_MODE) == 0) {
35183da42859SDinh Nguyen 		rw_mgr_mem_handoff();
35193da42859SDinh Nguyen 		/*
35203da42859SDinh Nguyen 		 * In Hard PHY this is a 2-bit control:
35213da42859SDinh Nguyen 		 * 0: AFI Mux Select
35223da42859SDinh Nguyen 		 * 1: DDIO Mux Select
35233da42859SDinh Nguyen 		 */
35241273dd9eSMarek Vasut 		writel(0x2, &phy_mgr_cfg->mux_sel);
35253da42859SDinh Nguyen 	}
35263da42859SDinh Nguyen 
35276cb9f167SMarek Vasut 	writel(ctrlcfg, &sdr_ctrl->ctrl_cfg);
35283da42859SDinh Nguyen 
35293da42859SDinh Nguyen 	if (pass) {
35303da42859SDinh Nguyen 		printf("%s: CALIBRATION PASSED\n", __FILE__);
35313da42859SDinh Nguyen 
35323da42859SDinh Nguyen 		gbl->fom_in /= 2;
35333da42859SDinh Nguyen 		gbl->fom_out /= 2;
35343da42859SDinh Nguyen 
35353da42859SDinh Nguyen 		if (gbl->fom_in > 0xff)
35363da42859SDinh Nguyen 			gbl->fom_in = 0xff;
35373da42859SDinh Nguyen 
35383da42859SDinh Nguyen 		if (gbl->fom_out > 0xff)
35393da42859SDinh Nguyen 			gbl->fom_out = 0xff;
35403da42859SDinh Nguyen 
35413da42859SDinh Nguyen 		/* Update the FOM in the register file */
35423da42859SDinh Nguyen 		debug_info = gbl->fom_in;
35433da42859SDinh Nguyen 		debug_info |= gbl->fom_out << 8;
35441273dd9eSMarek Vasut 		writel(debug_info, &sdr_reg_file->fom);
35453da42859SDinh Nguyen 
35461273dd9eSMarek Vasut 		writel(debug_info, &phy_mgr_cfg->cal_debug_info);
35471273dd9eSMarek Vasut 		writel(PHY_MGR_CAL_SUCCESS, &phy_mgr_cfg->cal_status);
35483da42859SDinh Nguyen 	} else {
35493da42859SDinh Nguyen 		printf("%s: CALIBRATION FAILED\n", __FILE__);
35503da42859SDinh Nguyen 
35513da42859SDinh Nguyen 		debug_info = gbl->error_stage;
35523da42859SDinh Nguyen 		debug_info |= gbl->error_substage << 8;
35533da42859SDinh Nguyen 		debug_info |= gbl->error_group << 16;
35543da42859SDinh Nguyen 
35551273dd9eSMarek Vasut 		writel(debug_info, &sdr_reg_file->failing_stage);
35561273dd9eSMarek Vasut 		writel(debug_info, &phy_mgr_cfg->cal_debug_info);
35571273dd9eSMarek Vasut 		writel(PHY_MGR_CAL_FAIL, &phy_mgr_cfg->cal_status);
35583da42859SDinh Nguyen 
35593da42859SDinh Nguyen 		/* Update the failing group/stage in the register file */
35603da42859SDinh Nguyen 		debug_info = gbl->error_stage;
35613da42859SDinh Nguyen 		debug_info |= gbl->error_substage << 8;
35623da42859SDinh Nguyen 		debug_info |= gbl->error_group << 16;
35631273dd9eSMarek Vasut 		writel(debug_info, &sdr_reg_file->failing_stage);
35643da42859SDinh Nguyen 	}
35653da42859SDinh Nguyen 
35663da42859SDinh Nguyen 	return pass;
35673da42859SDinh Nguyen }
35683da42859SDinh Nguyen 
3569bb06434bSMarek Vasut /**
3570bb06434bSMarek Vasut  * hc_initialize_rom_data() - Initialize ROM data
3571bb06434bSMarek Vasut  *
3572bb06434bSMarek Vasut  * Initialize ROM data.
3573bb06434bSMarek Vasut  */
35743da42859SDinh Nguyen static void hc_initialize_rom_data(void)
35753da42859SDinh Nguyen {
3576bb06434bSMarek Vasut 	u32 i, addr;
35773da42859SDinh Nguyen 
3578c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_INST_ROM_WRITE_OFFSET;
3579bb06434bSMarek Vasut 	for (i = 0; i < ARRAY_SIZE(inst_rom_init); i++)
3580bb06434bSMarek Vasut 		writel(inst_rom_init[i], addr + (i << 2));
35813da42859SDinh Nguyen 
3582c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_AC_ROM_WRITE_OFFSET;
3583bb06434bSMarek Vasut 	for (i = 0; i < ARRAY_SIZE(ac_rom_init); i++)
3584bb06434bSMarek Vasut 		writel(ac_rom_init[i], addr + (i << 2));
35853da42859SDinh Nguyen }
35863da42859SDinh Nguyen 
35879c1ab2caSMarek Vasut /**
35889c1ab2caSMarek Vasut  * initialize_reg_file() - Initialize SDR register file
35899c1ab2caSMarek Vasut  *
35909c1ab2caSMarek Vasut  * Initialize SDR register file.
35919c1ab2caSMarek Vasut  */
35923da42859SDinh Nguyen static void initialize_reg_file(void)
35933da42859SDinh Nguyen {
35943da42859SDinh Nguyen 	/* Initialize the register file with the correct data */
35951273dd9eSMarek Vasut 	writel(REG_FILE_INIT_SEQ_SIGNATURE, &sdr_reg_file->signature);
35961273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->debug_data_addr);
35971273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->cur_stage);
35981273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->fom);
35991273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->failing_stage);
36001273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->debug1);
36011273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->debug2);
36023da42859SDinh Nguyen }
36033da42859SDinh Nguyen 
36042ca151f8SMarek Vasut /**
36052ca151f8SMarek Vasut  * initialize_hps_phy() - Initialize HPS PHY
36062ca151f8SMarek Vasut  *
36072ca151f8SMarek Vasut  * Initialize HPS PHY.
36082ca151f8SMarek Vasut  */
36093da42859SDinh Nguyen static void initialize_hps_phy(void)
36103da42859SDinh Nguyen {
36113da42859SDinh Nguyen 	uint32_t reg;
36123da42859SDinh Nguyen 	/*
36133da42859SDinh Nguyen 	 * Tracking also gets configured here because it's in the
36143da42859SDinh Nguyen 	 * same register.
36153da42859SDinh Nguyen 	 */
36163da42859SDinh Nguyen 	uint32_t trk_sample_count = 7500;
36173da42859SDinh Nguyen 	uint32_t trk_long_idle_sample_count = (10 << 16) | 100;
36183da42859SDinh Nguyen 	/*
36193da42859SDinh Nguyen 	 * Format is number of outer loops in the 16 MSB, sample
36203da42859SDinh Nguyen 	 * count in 16 LSB.
36213da42859SDinh Nguyen 	 */
36223da42859SDinh Nguyen 
36233da42859SDinh Nguyen 	reg = 0;
36243da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_ACDELAYEN_SET(2);
36253da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_DQDELAYEN_SET(1);
36263da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_DQSDELAYEN_SET(1);
36273da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_DQSLOGICDELAYEN_SET(1);
36283da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_RESETDELAYEN_SET(0);
36293da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_LPDDRDIS_SET(1);
36303da42859SDinh Nguyen 	/*
36313da42859SDinh Nguyen 	 * This field selects the intrinsic latency to RDATA_EN/FULL path.
36323da42859SDinh Nguyen 	 * 00-bypass, 01- add 5 cycles, 10- add 10 cycles, 11- add 15 cycles.
36333da42859SDinh Nguyen 	 */
36343da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_ADDLATSEL_SET(0);
36353da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_SAMPLECOUNT_19_0_SET(
36363da42859SDinh Nguyen 		trk_sample_count);
36376cb9f167SMarek Vasut 	writel(reg, &sdr_ctrl->phy_ctrl0);
36383da42859SDinh Nguyen 
36393da42859SDinh Nguyen 	reg = 0;
36403da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_SAMPLECOUNT_31_20_SET(
36413da42859SDinh Nguyen 		trk_sample_count >>
36423da42859SDinh Nguyen 		SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_SAMPLECOUNT_19_0_WIDTH);
36433da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_LONGIDLESAMPLECOUNT_19_0_SET(
36443da42859SDinh Nguyen 		trk_long_idle_sample_count);
36456cb9f167SMarek Vasut 	writel(reg, &sdr_ctrl->phy_ctrl1);
36463da42859SDinh Nguyen 
36473da42859SDinh Nguyen 	reg = 0;
36483da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_2_LONGIDLESAMPLECOUNT_31_20_SET(
36493da42859SDinh Nguyen 		trk_long_idle_sample_count >>
36503da42859SDinh Nguyen 		SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_LONGIDLESAMPLECOUNT_19_0_WIDTH);
36516cb9f167SMarek Vasut 	writel(reg, &sdr_ctrl->phy_ctrl2);
36523da42859SDinh Nguyen }
36533da42859SDinh Nguyen 
36543da42859SDinh Nguyen static void initialize_tracking(void)
36553da42859SDinh Nguyen {
36563da42859SDinh Nguyen 	uint32_t concatenated_longidle = 0x0;
36573da42859SDinh Nguyen 	uint32_t concatenated_delays = 0x0;
36583da42859SDinh Nguyen 	uint32_t concatenated_rw_addr = 0x0;
36593da42859SDinh Nguyen 	uint32_t concatenated_refresh = 0x0;
36603da42859SDinh Nguyen 	uint32_t trk_sample_count = 7500;
36613da42859SDinh Nguyen 	uint32_t dtaps_per_ptap;
36623da42859SDinh Nguyen 	uint32_t tmp_delay;
36633da42859SDinh Nguyen 
36643da42859SDinh Nguyen 	/*
36653da42859SDinh Nguyen 	 * compute usable version of value in case we skip full
36663da42859SDinh Nguyen 	 * computation later
36673da42859SDinh Nguyen 	 */
36683da42859SDinh Nguyen 	dtaps_per_ptap = 0;
36693da42859SDinh Nguyen 	tmp_delay = 0;
36703da42859SDinh Nguyen 	while (tmp_delay < IO_DELAY_PER_OPA_TAP) {
36713da42859SDinh Nguyen 		dtaps_per_ptap++;
36723da42859SDinh Nguyen 		tmp_delay += IO_DELAY_PER_DCHAIN_TAP;
36733da42859SDinh Nguyen 	}
36743da42859SDinh Nguyen 	dtaps_per_ptap--;
36753da42859SDinh Nguyen 
36763da42859SDinh Nguyen 	concatenated_longidle = concatenated_longidle ^ 10;
36773da42859SDinh Nguyen 		/*longidle outer loop */
36783da42859SDinh Nguyen 	concatenated_longidle = concatenated_longidle << 16;
36793da42859SDinh Nguyen 	concatenated_longidle = concatenated_longidle ^ 100;
36803da42859SDinh Nguyen 		/*longidle sample count */
36813da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 243;
36823da42859SDinh Nguyen 		/* trfc, worst case of 933Mhz 4Gb */
36833da42859SDinh Nguyen 	concatenated_delays = concatenated_delays << 8;
36843da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 14;
36853da42859SDinh Nguyen 		/* trcd, worst case */
36863da42859SDinh Nguyen 	concatenated_delays = concatenated_delays << 8;
36873da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 10;
36883da42859SDinh Nguyen 		/* vfifo wait */
36893da42859SDinh Nguyen 	concatenated_delays = concatenated_delays << 8;
36903da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 4;
36913da42859SDinh Nguyen 		/* mux delay */
36923da42859SDinh Nguyen 
36933da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_IDLE;
36943da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr << 8;
36953da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_ACTIVATE_1;
36963da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr << 8;
36973da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_SGLE_READ;
36983da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr << 8;
36993da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_PRECHARGE_ALL;
37003da42859SDinh Nguyen 
37013da42859SDinh Nguyen 	concatenated_refresh = concatenated_refresh ^ RW_MGR_REFRESH_ALL;
37023da42859SDinh Nguyen 	concatenated_refresh = concatenated_refresh << 24;
37033da42859SDinh Nguyen 	concatenated_refresh = concatenated_refresh ^ 1000; /* trefi */
37043da42859SDinh Nguyen 
37053da42859SDinh Nguyen 	/* Initialize the register file with the correct data */
37061273dd9eSMarek Vasut 	writel(dtaps_per_ptap, &sdr_reg_file->dtaps_per_ptap);
37071273dd9eSMarek Vasut 	writel(trk_sample_count, &sdr_reg_file->trk_sample_count);
37081273dd9eSMarek Vasut 	writel(concatenated_longidle, &sdr_reg_file->trk_longidle);
37091273dd9eSMarek Vasut 	writel(concatenated_delays, &sdr_reg_file->delays);
37101273dd9eSMarek Vasut 	writel(concatenated_rw_addr, &sdr_reg_file->trk_rw_mgr_addr);
37111273dd9eSMarek Vasut 	writel(RW_MGR_MEM_IF_READ_DQS_WIDTH, &sdr_reg_file->trk_read_dqs_width);
37121273dd9eSMarek Vasut 	writel(concatenated_refresh, &sdr_reg_file->trk_rfsh);
37133da42859SDinh Nguyen }
37143da42859SDinh Nguyen 
37153da42859SDinh Nguyen int sdram_calibration_full(void)
37163da42859SDinh Nguyen {
37173da42859SDinh Nguyen 	struct param_type my_param;
37183da42859SDinh Nguyen 	struct gbl_type my_gbl;
37193da42859SDinh Nguyen 	uint32_t pass;
37203da42859SDinh Nguyen 	uint32_t i;
37213da42859SDinh Nguyen 
37223da42859SDinh Nguyen 	param = &my_param;
37233da42859SDinh Nguyen 	gbl = &my_gbl;
37243da42859SDinh Nguyen 
37253da42859SDinh Nguyen 	/* Initialize the debug mode flags */
37263da42859SDinh Nguyen 	gbl->phy_debug_mode_flags = 0;
37273da42859SDinh Nguyen 	/* Set the calibration enabled by default */
37283da42859SDinh Nguyen 	gbl->phy_debug_mode_flags |= PHY_DEBUG_ENABLE_CAL_RPT;
37293da42859SDinh Nguyen 	/*
37303da42859SDinh Nguyen 	 * Only sweep all groups (regardless of fail state) by default
37313da42859SDinh Nguyen 	 * Set enabled read test by default.
37323da42859SDinh Nguyen 	 */
37333da42859SDinh Nguyen #if DISABLE_GUARANTEED_READ
37343da42859SDinh Nguyen 	gbl->phy_debug_mode_flags |= PHY_DEBUG_DISABLE_GUARANTEED_READ;
37353da42859SDinh Nguyen #endif
37363da42859SDinh Nguyen 	/* Initialize the register file */
37373da42859SDinh Nguyen 	initialize_reg_file();
37383da42859SDinh Nguyen 
37393da42859SDinh Nguyen 	/* Initialize any PHY CSR */
37403da42859SDinh Nguyen 	initialize_hps_phy();
37413da42859SDinh Nguyen 
37423da42859SDinh Nguyen 	scc_mgr_initialize();
37433da42859SDinh Nguyen 
37443da42859SDinh Nguyen 	initialize_tracking();
37453da42859SDinh Nguyen 
37463da42859SDinh Nguyen 	/* USER Enable all ranks, groups */
37473da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_NUMBER_OF_RANKS; i++)
37483da42859SDinh Nguyen 		param->skip_ranks[i] = 0;
37493da42859SDinh Nguyen 	for (i = 0; i < NUM_SHADOW_REGS; ++i)
37503da42859SDinh Nguyen 		param->skip_shadow_regs[i] = 0;
37513da42859SDinh Nguyen 	param->skip_groups = 0;
37523da42859SDinh Nguyen 
37533da42859SDinh Nguyen 	printf("%s: Preparing to start memory calibration\n", __FILE__);
37543da42859SDinh Nguyen 
37553da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
375623f62b36SMarek Vasut 	debug_cond(DLEVEL == 1,
375723f62b36SMarek Vasut 		   "DDR3 FULL_RATE ranks=%u cs/dimm=%u dq/dqs=%u,%u vg/dqs=%u,%u ",
375823f62b36SMarek Vasut 		   RW_MGR_MEM_NUMBER_OF_RANKS, RW_MGR_MEM_NUMBER_OF_CS_PER_DIMM,
375923f62b36SMarek Vasut 		   RW_MGR_MEM_DQ_PER_READ_DQS, RW_MGR_MEM_DQ_PER_WRITE_DQS,
376023f62b36SMarek Vasut 		   RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS,
376123f62b36SMarek Vasut 		   RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS);
376223f62b36SMarek Vasut 	debug_cond(DLEVEL == 1,
376323f62b36SMarek Vasut 		   "dqs=%u,%u dq=%u dm=%u ptap_delay=%u dtap_delay=%u ",
376423f62b36SMarek Vasut 		   RW_MGR_MEM_IF_READ_DQS_WIDTH, RW_MGR_MEM_IF_WRITE_DQS_WIDTH,
376523f62b36SMarek Vasut 		   RW_MGR_MEM_DATA_WIDTH, RW_MGR_MEM_DATA_MASK_WIDTH,
376623f62b36SMarek Vasut 		   IO_DELAY_PER_OPA_TAP, IO_DELAY_PER_DCHAIN_TAP);
376723f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "dtap_dqsen_delay=%u, dll=%u",
376823f62b36SMarek Vasut 		   IO_DELAY_PER_DQS_EN_DCHAIN_TAP, IO_DLL_CHAIN_LENGTH);
376923f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "max values: en_p=%u dqdqs_p=%u en_d=%u dqs_in_d=%u ",
377023f62b36SMarek Vasut 		   IO_DQS_EN_PHASE_MAX, IO_DQDQS_OUT_PHASE_MAX,
377123f62b36SMarek Vasut 		   IO_DQS_EN_DELAY_MAX, IO_DQS_IN_DELAY_MAX);
377223f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "io_in_d=%u io_out1_d=%u io_out2_d=%u ",
377323f62b36SMarek Vasut 		   IO_IO_IN_DELAY_MAX, IO_IO_OUT1_DELAY_MAX,
377423f62b36SMarek Vasut 		   IO_IO_OUT2_DELAY_MAX);
377523f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "dqs_in_reserve=%u dqs_out_reserve=%u\n",
377623f62b36SMarek Vasut 		   IO_DQS_IN_RESERVE, IO_DQS_OUT_RESERVE);
37773da42859SDinh Nguyen 
37783da42859SDinh Nguyen 	hc_initialize_rom_data();
37793da42859SDinh Nguyen 
37803da42859SDinh Nguyen 	/* update info for sims */
37813da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_NIL);
37823da42859SDinh Nguyen 	reg_file_set_group(0);
37833da42859SDinh Nguyen 
37843da42859SDinh Nguyen 	/*
37853da42859SDinh Nguyen 	 * Load global needed for those actions that require
37863da42859SDinh Nguyen 	 * some dynamic calibration support.
37873da42859SDinh Nguyen 	 */
37883da42859SDinh Nguyen 	dyn_calib_steps = STATIC_CALIB_STEPS;
37893da42859SDinh Nguyen 	/*
37903da42859SDinh Nguyen 	 * Load global to allow dynamic selection of delay loop settings
37913da42859SDinh Nguyen 	 * based on calibration mode.
37923da42859SDinh Nguyen 	 */
37933da42859SDinh Nguyen 	if (!(dyn_calib_steps & CALIB_SKIP_DELAY_LOOPS))
37943da42859SDinh Nguyen 		skip_delay_mask = 0xff;
37953da42859SDinh Nguyen 	else
37963da42859SDinh Nguyen 		skip_delay_mask = 0x0;
37973da42859SDinh Nguyen 
37983da42859SDinh Nguyen 	pass = run_mem_calibrate();
37993da42859SDinh Nguyen 
38003da42859SDinh Nguyen 	printf("%s: Calibration complete\n", __FILE__);
38013da42859SDinh Nguyen 	return pass;
38023da42859SDinh Nguyen }
3803