xref: /rk3399_rockchip-uboot/drivers/ddr/altera/sequencer.c (revision 1273dd9ea3b15f2db45f5f4d9a065a849d1d301a)
13da42859SDinh Nguyen /*
23da42859SDinh Nguyen  * Copyright Altera Corporation (C) 2012-2015
33da42859SDinh Nguyen  *
43da42859SDinh Nguyen  * SPDX-License-Identifier:    BSD-3-Clause
53da42859SDinh Nguyen  */
63da42859SDinh Nguyen 
73da42859SDinh Nguyen #include <common.h>
83da42859SDinh Nguyen #include <asm/io.h>
93da42859SDinh Nguyen #include <asm/arch/sdram.h>
103da42859SDinh Nguyen #include "sequencer.h"
113da42859SDinh Nguyen #include "sequencer_auto.h"
123da42859SDinh Nguyen #include "sequencer_auto_ac_init.h"
133da42859SDinh Nguyen #include "sequencer_auto_inst_init.h"
143da42859SDinh Nguyen #include "sequencer_defines.h"
153da42859SDinh Nguyen 
163da42859SDinh Nguyen static void scc_mgr_load_dqs_for_write_group(uint32_t write_group);
173da42859SDinh Nguyen 
183da42859SDinh Nguyen static struct socfpga_sdr_rw_load_manager *sdr_rw_load_mgr_regs =
196afb4fe2SMarek Vasut 	(struct socfpga_sdr_rw_load_manager *)(SDR_PHYGRP_RWMGRGRP_ADDRESS | 0x800);
203da42859SDinh Nguyen 
213da42859SDinh Nguyen static struct socfpga_sdr_rw_load_jump_manager *sdr_rw_load_jump_mgr_regs =
226afb4fe2SMarek Vasut 	(struct socfpga_sdr_rw_load_jump_manager *)(SDR_PHYGRP_RWMGRGRP_ADDRESS | 0xC00);
233da42859SDinh Nguyen 
243da42859SDinh Nguyen static struct socfpga_sdr_reg_file *sdr_reg_file =
25a1c654a8SMarek Vasut 	(struct socfpga_sdr_reg_file *)SDR_PHYGRP_REGFILEGRP_ADDRESS;
263da42859SDinh Nguyen 
273da42859SDinh Nguyen static struct socfpga_sdr_scc_mgr *sdr_scc_mgr =
28e79025a7SMarek Vasut 	(struct socfpga_sdr_scc_mgr *)(SDR_PHYGRP_SCCGRP_ADDRESS | 0xe00);
293da42859SDinh Nguyen 
303da42859SDinh Nguyen static struct socfpga_phy_mgr_cmd *phy_mgr_cmd =
311bc6f14aSMarek Vasut 	(struct socfpga_phy_mgr_cmd *)SDR_PHYGRP_PHYMGRGRP_ADDRESS;
323da42859SDinh Nguyen 
333da42859SDinh Nguyen static struct socfpga_phy_mgr_cfg *phy_mgr_cfg =
341bc6f14aSMarek Vasut 	(struct socfpga_phy_mgr_cfg *)(SDR_PHYGRP_PHYMGRGRP_ADDRESS | 0x40);
353da42859SDinh Nguyen 
363da42859SDinh Nguyen static struct socfpga_data_mgr *data_mgr =
37c4815f76SMarek Vasut 	(struct socfpga_data_mgr *)SDR_PHYGRP_DATAMGRGRP_ADDRESS;
383da42859SDinh Nguyen 
396cb9f167SMarek Vasut static struct socfpga_sdr_ctrl *sdr_ctrl =
406cb9f167SMarek Vasut 	(struct socfpga_sdr_ctrl *)SDR_CTRLGRP_ADDRESS;
416cb9f167SMarek Vasut 
423da42859SDinh Nguyen #define DELTA_D		1
433da42859SDinh Nguyen 
443da42859SDinh Nguyen /*
453da42859SDinh Nguyen  * In order to reduce ROM size, most of the selectable calibration steps are
463da42859SDinh Nguyen  * decided at compile time based on the user's calibration mode selection,
473da42859SDinh Nguyen  * as captured by the STATIC_CALIB_STEPS selection below.
483da42859SDinh Nguyen  *
493da42859SDinh Nguyen  * However, to support simulation-time selection of fast simulation mode, where
503da42859SDinh Nguyen  * we skip everything except the bare minimum, we need a few of the steps to
513da42859SDinh Nguyen  * be dynamic.  In those cases, we either use the DYNAMIC_CALIB_STEPS for the
523da42859SDinh Nguyen  * check, which is based on the rtl-supplied value, or we dynamically compute
533da42859SDinh Nguyen  * the value to use based on the dynamically-chosen calibration mode
543da42859SDinh Nguyen  */
553da42859SDinh Nguyen 
563da42859SDinh Nguyen #define DLEVEL 0
573da42859SDinh Nguyen #define STATIC_IN_RTL_SIM 0
583da42859SDinh Nguyen #define STATIC_SKIP_DELAY_LOOPS 0
593da42859SDinh Nguyen 
603da42859SDinh Nguyen #define STATIC_CALIB_STEPS (STATIC_IN_RTL_SIM | CALIB_SKIP_FULL_TEST | \
613da42859SDinh Nguyen 	STATIC_SKIP_DELAY_LOOPS)
623da42859SDinh Nguyen 
633da42859SDinh Nguyen /* calibration steps requested by the rtl */
643da42859SDinh Nguyen uint16_t dyn_calib_steps;
653da42859SDinh Nguyen 
663da42859SDinh Nguyen /*
673da42859SDinh Nguyen  * To make CALIB_SKIP_DELAY_LOOPS a dynamic conditional option
683da42859SDinh Nguyen  * instead of static, we use boolean logic to select between
693da42859SDinh Nguyen  * non-skip and skip values
703da42859SDinh Nguyen  *
713da42859SDinh Nguyen  * The mask is set to include all bits when not-skipping, but is
723da42859SDinh Nguyen  * zero when skipping
733da42859SDinh Nguyen  */
743da42859SDinh Nguyen 
753da42859SDinh Nguyen uint16_t skip_delay_mask;	/* mask off bits when skipping/not-skipping */
763da42859SDinh Nguyen 
773da42859SDinh Nguyen #define SKIP_DELAY_LOOP_VALUE_OR_ZERO(non_skip_value) \
783da42859SDinh Nguyen 	((non_skip_value) & skip_delay_mask)
793da42859SDinh Nguyen 
803da42859SDinh Nguyen struct gbl_type *gbl;
813da42859SDinh Nguyen struct param_type *param;
823da42859SDinh Nguyen uint32_t curr_shadow_reg;
833da42859SDinh Nguyen 
843da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_write_test(uint32_t rank_bgn,
853da42859SDinh Nguyen 	uint32_t write_group, uint32_t use_dm,
863da42859SDinh Nguyen 	uint32_t all_correct, uint32_t *bit_chk, uint32_t all_ranks);
873da42859SDinh Nguyen 
883da42859SDinh Nguyen static void set_failing_group_stage(uint32_t group, uint32_t stage,
893da42859SDinh Nguyen 	uint32_t substage)
903da42859SDinh Nguyen {
913da42859SDinh Nguyen 	/*
923da42859SDinh Nguyen 	 * Only set the global stage if there was not been any other
933da42859SDinh Nguyen 	 * failing group
943da42859SDinh Nguyen 	 */
953da42859SDinh Nguyen 	if (gbl->error_stage == CAL_STAGE_NIL)	{
963da42859SDinh Nguyen 		gbl->error_substage = substage;
973da42859SDinh Nguyen 		gbl->error_stage = stage;
983da42859SDinh Nguyen 		gbl->error_group = group;
993da42859SDinh Nguyen 	}
1003da42859SDinh Nguyen }
1013da42859SDinh Nguyen 
1023da42859SDinh Nguyen static void reg_file_set_group(uint32_t set_group)
1033da42859SDinh Nguyen {
1043da42859SDinh Nguyen 	/* Read the current group and stage */
105*1273dd9eSMarek Vasut 	uint32_t cur_stage_group = readl(&sdr_reg_file->cur_stage);
1063da42859SDinh Nguyen 
1073da42859SDinh Nguyen 	/* Clear the group */
1083da42859SDinh Nguyen 	cur_stage_group &= 0x0000FFFF;
1093da42859SDinh Nguyen 
1103da42859SDinh Nguyen 	/* Set the group */
1113da42859SDinh Nguyen 	cur_stage_group |= (set_group << 16);
1123da42859SDinh Nguyen 
1133da42859SDinh Nguyen 	/* Write the data back */
114*1273dd9eSMarek Vasut 	writel(cur_stage_group, &sdr_reg_file->cur_stage);
1153da42859SDinh Nguyen }
1163da42859SDinh Nguyen 
1173da42859SDinh Nguyen static void reg_file_set_stage(uint32_t set_stage)
1183da42859SDinh Nguyen {
1193da42859SDinh Nguyen 	/* Read the current group and stage */
120*1273dd9eSMarek Vasut 	uint32_t cur_stage_group = readl(&sdr_reg_file->cur_stage);
1213da42859SDinh Nguyen 
1223da42859SDinh Nguyen 	/* Clear the stage and substage */
1233da42859SDinh Nguyen 	cur_stage_group &= 0xFFFF0000;
1243da42859SDinh Nguyen 
1253da42859SDinh Nguyen 	/* Set the stage */
1263da42859SDinh Nguyen 	cur_stage_group |= (set_stage & 0x000000FF);
1273da42859SDinh Nguyen 
1283da42859SDinh Nguyen 	/* Write the data back */
129*1273dd9eSMarek Vasut 	writel(cur_stage_group, &sdr_reg_file->cur_stage);
1303da42859SDinh Nguyen }
1313da42859SDinh Nguyen 
1323da42859SDinh Nguyen static void reg_file_set_sub_stage(uint32_t set_sub_stage)
1333da42859SDinh Nguyen {
1343da42859SDinh Nguyen 	/* Read the current group and stage */
135*1273dd9eSMarek Vasut 	uint32_t cur_stage_group = readl(&sdr_reg_file->cur_stage);
1363da42859SDinh Nguyen 
1373da42859SDinh Nguyen 	/* Clear the substage */
1383da42859SDinh Nguyen 	cur_stage_group &= 0xFFFF00FF;
1393da42859SDinh Nguyen 
1403da42859SDinh Nguyen 	/* Set the sub stage */
1413da42859SDinh Nguyen 	cur_stage_group |= ((set_sub_stage << 8) & 0x0000FF00);
1423da42859SDinh Nguyen 
1433da42859SDinh Nguyen 	/* Write the data back */
144*1273dd9eSMarek Vasut 	writel(cur_stage_group, &sdr_reg_file->cur_stage);
1453da42859SDinh Nguyen }
1463da42859SDinh Nguyen 
1473da42859SDinh Nguyen static void initialize(void)
1483da42859SDinh Nguyen {
1493da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
1503da42859SDinh Nguyen 	/* USER calibration has control over path to memory */
1513da42859SDinh Nguyen 	/*
1523da42859SDinh Nguyen 	 * In Hard PHY this is a 2-bit control:
1533da42859SDinh Nguyen 	 * 0: AFI Mux Select
1543da42859SDinh Nguyen 	 * 1: DDIO Mux Select
1553da42859SDinh Nguyen 	 */
156*1273dd9eSMarek Vasut 	writel(0x3, &phy_mgr_cfg->mux_sel);
1573da42859SDinh Nguyen 
1583da42859SDinh Nguyen 	/* USER memory clock is not stable we begin initialization  */
159*1273dd9eSMarek Vasut 	writel(0, &phy_mgr_cfg->reset_mem_stbl);
1603da42859SDinh Nguyen 
1613da42859SDinh Nguyen 	/* USER calibration status all set to zero */
162*1273dd9eSMarek Vasut 	writel(0, &phy_mgr_cfg->cal_status);
1633da42859SDinh Nguyen 
164*1273dd9eSMarek Vasut 	writel(0, &phy_mgr_cfg->cal_debug_info);
1653da42859SDinh Nguyen 
1663da42859SDinh Nguyen 	if ((dyn_calib_steps & CALIB_SKIP_ALL) != CALIB_SKIP_ALL) {
1673da42859SDinh Nguyen 		param->read_correct_mask_vg  = ((uint32_t)1 <<
1683da42859SDinh Nguyen 			(RW_MGR_MEM_DQ_PER_READ_DQS /
1693da42859SDinh Nguyen 			RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS)) - 1;
1703da42859SDinh Nguyen 		param->write_correct_mask_vg = ((uint32_t)1 <<
1713da42859SDinh Nguyen 			(RW_MGR_MEM_DQ_PER_READ_DQS /
1723da42859SDinh Nguyen 			RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS)) - 1;
1733da42859SDinh Nguyen 		param->read_correct_mask     = ((uint32_t)1 <<
1743da42859SDinh Nguyen 			RW_MGR_MEM_DQ_PER_READ_DQS) - 1;
1753da42859SDinh Nguyen 		param->write_correct_mask    = ((uint32_t)1 <<
1763da42859SDinh Nguyen 			RW_MGR_MEM_DQ_PER_WRITE_DQS) - 1;
1773da42859SDinh Nguyen 		param->dm_correct_mask       = ((uint32_t)1 <<
1783da42859SDinh Nguyen 			(RW_MGR_MEM_DATA_WIDTH / RW_MGR_MEM_DATA_MASK_WIDTH))
1793da42859SDinh Nguyen 			- 1;
1803da42859SDinh Nguyen 	}
1813da42859SDinh Nguyen }
1823da42859SDinh Nguyen 
1833da42859SDinh Nguyen static void set_rank_and_odt_mask(uint32_t rank, uint32_t odt_mode)
1843da42859SDinh Nguyen {
1853da42859SDinh Nguyen 	uint32_t odt_mask_0 = 0;
1863da42859SDinh Nguyen 	uint32_t odt_mask_1 = 0;
1873da42859SDinh Nguyen 	uint32_t cs_and_odt_mask;
1883da42859SDinh Nguyen 
1893da42859SDinh Nguyen 	if (odt_mode == RW_MGR_ODT_MODE_READ_WRITE) {
1903da42859SDinh Nguyen 		if (RW_MGR_MEM_NUMBER_OF_RANKS == 1) {
1913da42859SDinh Nguyen 			/*
1923da42859SDinh Nguyen 			 * 1 Rank
1933da42859SDinh Nguyen 			 * Read: ODT = 0
1943da42859SDinh Nguyen 			 * Write: ODT = 1
1953da42859SDinh Nguyen 			 */
1963da42859SDinh Nguyen 			odt_mask_0 = 0x0;
1973da42859SDinh Nguyen 			odt_mask_1 = 0x1;
1983da42859SDinh Nguyen 		} else if (RW_MGR_MEM_NUMBER_OF_RANKS == 2) {
1993da42859SDinh Nguyen 			/* 2 Ranks */
2003da42859SDinh Nguyen 			if (RW_MGR_MEM_NUMBER_OF_CS_PER_DIMM == 1) {
2013da42859SDinh Nguyen 				/* - Dual-Slot , Single-Rank
2023da42859SDinh Nguyen 				 * (1 chip-select per DIMM)
2033da42859SDinh Nguyen 				 * OR
2043da42859SDinh Nguyen 				 * - RDIMM, 4 total CS (2 CS per DIMM)
2053da42859SDinh Nguyen 				 * means 2 DIMM
2063da42859SDinh Nguyen 				 * Since MEM_NUMBER_OF_RANKS is 2 they are
2073da42859SDinh Nguyen 				 * both single rank
2083da42859SDinh Nguyen 				 * with 2 CS each (special for RDIMM)
2093da42859SDinh Nguyen 				 * Read: Turn on ODT on the opposite rank
2103da42859SDinh Nguyen 				 * Write: Turn on ODT on all ranks
2113da42859SDinh Nguyen 				 */
2123da42859SDinh Nguyen 				odt_mask_0 = 0x3 & ~(1 << rank);
2133da42859SDinh Nguyen 				odt_mask_1 = 0x3;
2143da42859SDinh Nguyen 			} else {
2153da42859SDinh Nguyen 				/*
2163da42859SDinh Nguyen 				 * USER - Single-Slot , Dual-rank DIMMs
2173da42859SDinh Nguyen 				 * (2 chip-selects per DIMM)
2183da42859SDinh Nguyen 				 * USER Read: Turn on ODT off on all ranks
2193da42859SDinh Nguyen 				 * USER Write: Turn on ODT on active rank
2203da42859SDinh Nguyen 				 */
2213da42859SDinh Nguyen 				odt_mask_0 = 0x0;
2223da42859SDinh Nguyen 				odt_mask_1 = 0x3 & (1 << rank);
2233da42859SDinh Nguyen 			}
2243da42859SDinh Nguyen 		} else {
2253da42859SDinh Nguyen 			/* 4 Ranks
2263da42859SDinh Nguyen 			 * Read:
2273da42859SDinh Nguyen 			 * ----------+-----------------------+
2283da42859SDinh Nguyen 			 *           |                       |
2293da42859SDinh Nguyen 			 *           |         ODT           |
2303da42859SDinh Nguyen 			 * Read From +-----------------------+
2313da42859SDinh Nguyen 			 *   Rank    |  3  |  2  |  1  |  0  |
2323da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2333da42859SDinh Nguyen 			 *     0     |  0  |  1  |  0  |  0  |
2343da42859SDinh Nguyen 			 *     1     |  1  |  0  |  0  |  0  |
2353da42859SDinh Nguyen 			 *     2     |  0  |  0  |  0  |  1  |
2363da42859SDinh Nguyen 			 *     3     |  0  |  0  |  1  |  0  |
2373da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2383da42859SDinh Nguyen 			 *
2393da42859SDinh Nguyen 			 * Write:
2403da42859SDinh Nguyen 			 * ----------+-----------------------+
2413da42859SDinh Nguyen 			 *           |                       |
2423da42859SDinh Nguyen 			 *           |         ODT           |
2433da42859SDinh Nguyen 			 * Write To  +-----------------------+
2443da42859SDinh Nguyen 			 *   Rank    |  3  |  2  |  1  |  0  |
2453da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2463da42859SDinh Nguyen 			 *     0     |  0  |  1  |  0  |  1  |
2473da42859SDinh Nguyen 			 *     1     |  1  |  0  |  1  |  0  |
2483da42859SDinh Nguyen 			 *     2     |  0  |  1  |  0  |  1  |
2493da42859SDinh Nguyen 			 *     3     |  1  |  0  |  1  |  0  |
2503da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2513da42859SDinh Nguyen 			 */
2523da42859SDinh Nguyen 			switch (rank) {
2533da42859SDinh Nguyen 			case 0:
2543da42859SDinh Nguyen 				odt_mask_0 = 0x4;
2553da42859SDinh Nguyen 				odt_mask_1 = 0x5;
2563da42859SDinh Nguyen 				break;
2573da42859SDinh Nguyen 			case 1:
2583da42859SDinh Nguyen 				odt_mask_0 = 0x8;
2593da42859SDinh Nguyen 				odt_mask_1 = 0xA;
2603da42859SDinh Nguyen 				break;
2613da42859SDinh Nguyen 			case 2:
2623da42859SDinh Nguyen 				odt_mask_0 = 0x1;
2633da42859SDinh Nguyen 				odt_mask_1 = 0x5;
2643da42859SDinh Nguyen 				break;
2653da42859SDinh Nguyen 			case 3:
2663da42859SDinh Nguyen 				odt_mask_0 = 0x2;
2673da42859SDinh Nguyen 				odt_mask_1 = 0xA;
2683da42859SDinh Nguyen 				break;
2693da42859SDinh Nguyen 			}
2703da42859SDinh Nguyen 		}
2713da42859SDinh Nguyen 	} else {
2723da42859SDinh Nguyen 		odt_mask_0 = 0x0;
2733da42859SDinh Nguyen 		odt_mask_1 = 0x0;
2743da42859SDinh Nguyen 	}
2753da42859SDinh Nguyen 
2763da42859SDinh Nguyen 	cs_and_odt_mask =
2773da42859SDinh Nguyen 		(0xFF & ~(1 << rank)) |
2783da42859SDinh Nguyen 		((0xFF & odt_mask_0) << 8) |
2793da42859SDinh Nguyen 		((0xFF & odt_mask_1) << 16);
280*1273dd9eSMarek Vasut 	writel(cs_and_odt_mask, SDR_PHYGRP_RWMGRGRP_ADDRESS |
281*1273dd9eSMarek Vasut 				RW_MGR_SET_CS_AND_ODT_MASK_OFFSET);
2823da42859SDinh Nguyen }
2833da42859SDinh Nguyen 
2843da42859SDinh Nguyen static void scc_mgr_initialize(void)
2853da42859SDinh Nguyen {
286c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_HHP_RFILE_OFFSET;
2873da42859SDinh Nguyen 
2883da42859SDinh Nguyen 	/*
2893da42859SDinh Nguyen 	 * Clear register file for HPS
2903da42859SDinh Nguyen 	 * 16 (2^4) is the size of the full register file in the scc mgr:
2913da42859SDinh Nguyen 	 *	RFILE_DEPTH = log2(MEM_DQ_PER_DQS + 1 + MEM_DM_PER_DQS +
2923da42859SDinh Nguyen 	 * MEM_IF_READ_DQS_WIDTH - 1) + 1;
2933da42859SDinh Nguyen 	 */
2943da42859SDinh Nguyen 	uint32_t i;
2953da42859SDinh Nguyen 	for (i = 0; i < 16; i++) {
2967ac40d25SMarek Vasut 		debug_cond(DLEVEL == 1, "%s:%d: Clearing SCC RFILE index %u\n",
2973da42859SDinh Nguyen 			   __func__, __LINE__, i);
29817fdc916SMarek Vasut 		writel(0, addr + (i << 2));
2993da42859SDinh Nguyen 	}
3003da42859SDinh Nguyen }
3013da42859SDinh Nguyen 
3023da42859SDinh Nguyen static void scc_mgr_set_dqs_bus_in_delay(uint32_t read_group,
3033da42859SDinh Nguyen 						uint32_t delay)
3043da42859SDinh Nguyen {
305c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQS_IN_DELAY_OFFSET;
3063da42859SDinh Nguyen 
3073da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
30817fdc916SMarek Vasut 	writel(delay, addr + (read_group << 2));
3093da42859SDinh Nguyen }
3103da42859SDinh Nguyen 
3113da42859SDinh Nguyen static void scc_mgr_set_dqs_io_in_delay(uint32_t write_group,
3123da42859SDinh Nguyen 	uint32_t delay)
3133da42859SDinh Nguyen {
314c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_IN_DELAY_OFFSET;
3153da42859SDinh Nguyen 
31617fdc916SMarek Vasut 	writel(delay, addr + (RW_MGR_MEM_DQ_PER_WRITE_DQS << 2));
3173da42859SDinh Nguyen }
3183da42859SDinh Nguyen 
3193da42859SDinh Nguyen static void scc_mgr_set_dqs_en_phase(uint32_t read_group, uint32_t phase)
3203da42859SDinh Nguyen {
321c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQS_EN_PHASE_OFFSET;
3223da42859SDinh Nguyen 
3233da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
32417fdc916SMarek Vasut 	writel(phase, addr + (read_group << 2));
3253da42859SDinh Nguyen }
3263da42859SDinh Nguyen 
3273da42859SDinh Nguyen static void scc_mgr_set_dqs_en_phase_all_ranks(uint32_t read_group,
3283da42859SDinh Nguyen 					       uint32_t phase)
3293da42859SDinh Nguyen {
3303da42859SDinh Nguyen 	uint32_t r;
3313da42859SDinh Nguyen 	uint32_t update_scan_chains;
3323da42859SDinh Nguyen 
3333da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
3343da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
3353da42859SDinh Nguyen 		/*
3363da42859SDinh Nguyen 		 * USER although the h/w doesn't support different phases per
3373da42859SDinh Nguyen 		 * shadow register, for simplicity our scc manager modeling
3383da42859SDinh Nguyen 		 * keeps different phase settings per shadow reg, and it's
3393da42859SDinh Nguyen 		 * important for us to keep them in sync to match h/w.
3403da42859SDinh Nguyen 		 * for efficiency, the scan chain update should occur only
3413da42859SDinh Nguyen 		 * once to sr0.
3423da42859SDinh Nguyen 		 */
3433da42859SDinh Nguyen 		update_scan_chains = (r == 0) ? 1 : 0;
3443da42859SDinh Nguyen 
3453da42859SDinh Nguyen 		scc_mgr_set_dqs_en_phase(read_group, phase);
3463da42859SDinh Nguyen 
3473da42859SDinh Nguyen 		if (update_scan_chains) {
348*1273dd9eSMarek Vasut 			writel(read_group, &sdr_scc_mgr->dqs_ena);
349*1273dd9eSMarek Vasut 			writel(0, &sdr_scc_mgr->update);
3503da42859SDinh Nguyen 		}
3513da42859SDinh Nguyen 	}
3523da42859SDinh Nguyen }
3533da42859SDinh Nguyen 
3543da42859SDinh Nguyen static void scc_mgr_set_dqdqs_output_phase(uint32_t write_group,
3553da42859SDinh Nguyen 						  uint32_t phase)
3563da42859SDinh Nguyen {
357c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQDQS_OUT_PHASE_OFFSET;
3583da42859SDinh Nguyen 
3593da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
36017fdc916SMarek Vasut 	writel(phase, addr + (write_group << 2));
3613da42859SDinh Nguyen }
3623da42859SDinh Nguyen 
3633da42859SDinh Nguyen static void scc_mgr_set_dqdqs_output_phase_all_ranks(uint32_t write_group,
3643da42859SDinh Nguyen 						     uint32_t phase)
3653da42859SDinh Nguyen {
3663da42859SDinh Nguyen 	uint32_t r;
3673da42859SDinh Nguyen 	uint32_t update_scan_chains;
3683da42859SDinh Nguyen 
3693da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
3703da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
3713da42859SDinh Nguyen 		/*
3723da42859SDinh Nguyen 		 * USER although the h/w doesn't support different phases per
3733da42859SDinh Nguyen 		 * shadow register, for simplicity our scc manager modeling
3743da42859SDinh Nguyen 		 * keeps different phase settings per shadow reg, and it's
3753da42859SDinh Nguyen 		 * important for us to keep them in sync to match h/w.
3763da42859SDinh Nguyen 		 * for efficiency, the scan chain update should occur only
3773da42859SDinh Nguyen 		 * once to sr0.
3783da42859SDinh Nguyen 		 */
3793da42859SDinh Nguyen 		update_scan_chains = (r == 0) ? 1 : 0;
3803da42859SDinh Nguyen 
3813da42859SDinh Nguyen 		scc_mgr_set_dqdqs_output_phase(write_group, phase);
3823da42859SDinh Nguyen 
3833da42859SDinh Nguyen 		if (update_scan_chains) {
384*1273dd9eSMarek Vasut 			writel(write_group, &sdr_scc_mgr->dqs_ena);
385*1273dd9eSMarek Vasut 			writel(0, &sdr_scc_mgr->update);
3863da42859SDinh Nguyen 		}
3873da42859SDinh Nguyen 	}
3883da42859SDinh Nguyen }
3893da42859SDinh Nguyen 
3903da42859SDinh Nguyen static void scc_mgr_set_dqs_en_delay(uint32_t read_group, uint32_t delay)
3913da42859SDinh Nguyen {
392c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQS_EN_DELAY_OFFSET;
3933da42859SDinh Nguyen 
3943da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
39517fdc916SMarek Vasut 	writel(delay + IO_DQS_EN_DELAY_OFFSET, addr +
3963da42859SDinh Nguyen 	       (read_group << 2));
3973da42859SDinh Nguyen }
3983da42859SDinh Nguyen 
3993da42859SDinh Nguyen static void scc_mgr_set_dqs_en_delay_all_ranks(uint32_t read_group,
4003da42859SDinh Nguyen 					       uint32_t delay)
4013da42859SDinh Nguyen {
4023da42859SDinh Nguyen 	uint32_t r;
4033da42859SDinh Nguyen 
4043da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
4053da42859SDinh Nguyen 		r += NUM_RANKS_PER_SHADOW_REG) {
4063da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay(read_group, delay);
4073da42859SDinh Nguyen 
408*1273dd9eSMarek Vasut 		writel(read_group, &sdr_scc_mgr->dqs_ena);
4093da42859SDinh Nguyen 		/*
4103da42859SDinh Nguyen 		 * In shadow register mode, the T11 settings are stored in
4113da42859SDinh Nguyen 		 * registers in the core, which are updated by the DQS_ENA
4123da42859SDinh Nguyen 		 * signals. Not issuing the SCC_MGR_UPD command allows us to
4133da42859SDinh Nguyen 		 * save lots of rank switching overhead, by calling
4143da42859SDinh Nguyen 		 * select_shadow_regs_for_update with update_scan_chains
4153da42859SDinh Nguyen 		 * set to 0.
4163da42859SDinh Nguyen 		 */
417*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
4183da42859SDinh Nguyen 	}
4193da42859SDinh Nguyen 	/*
4203da42859SDinh Nguyen 	 * In shadow register mode, the T11 settings are stored in
4213da42859SDinh Nguyen 	 * registers in the core, which are updated by the DQS_ENA
4223da42859SDinh Nguyen 	 * signals. Not issuing the SCC_MGR_UPD command allows us to
4233da42859SDinh Nguyen 	 * save lots of rank switching overhead, by calling
4243da42859SDinh Nguyen 	 * select_shadow_regs_for_update with update_scan_chains
4253da42859SDinh Nguyen 	 * set to 0.
4263da42859SDinh Nguyen 	 */
427*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
4283da42859SDinh Nguyen }
4293da42859SDinh Nguyen 
4303da42859SDinh Nguyen static void scc_mgr_set_oct_out1_delay(uint32_t write_group, uint32_t delay)
4313da42859SDinh Nguyen {
4323da42859SDinh Nguyen 	uint32_t read_group;
433c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_OCT_OUT1_DELAY_OFFSET;
4343da42859SDinh Nguyen 
4353da42859SDinh Nguyen 	/*
4363da42859SDinh Nguyen 	 * Load the setting in the SCC manager
4373da42859SDinh Nguyen 	 * Although OCT affects only write data, the OCT delay is controlled
4383da42859SDinh Nguyen 	 * by the DQS logic block which is instantiated once per read group.
4393da42859SDinh Nguyen 	 * For protocols where a write group consists of multiple read groups,
4403da42859SDinh Nguyen 	 * the setting must be set multiple times.
4413da42859SDinh Nguyen 	 */
4423da42859SDinh Nguyen 	for (read_group = write_group * RW_MGR_MEM_IF_READ_DQS_WIDTH /
4433da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH;
4443da42859SDinh Nguyen 	     read_group < (write_group + 1) * RW_MGR_MEM_IF_READ_DQS_WIDTH /
4453da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH; ++read_group)
44617fdc916SMarek Vasut 		writel(delay, addr + (read_group << 2));
4473da42859SDinh Nguyen }
4483da42859SDinh Nguyen 
4493da42859SDinh Nguyen static void scc_mgr_set_dq_out1_delay(uint32_t write_group,
4503da42859SDinh Nguyen 				      uint32_t dq_in_group, uint32_t delay)
4513da42859SDinh Nguyen {
452c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
4533da42859SDinh Nguyen 
4543da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
45517fdc916SMarek Vasut 	writel(delay, addr + (dq_in_group << 2));
4563da42859SDinh Nguyen }
4573da42859SDinh Nguyen 
4583da42859SDinh Nguyen static void scc_mgr_set_dq_in_delay(uint32_t write_group,
4593da42859SDinh Nguyen 	uint32_t dq_in_group, uint32_t delay)
4603da42859SDinh Nguyen {
461c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_IN_DELAY_OFFSET;
4623da42859SDinh Nguyen 
4633da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
46417fdc916SMarek Vasut 	writel(delay, addr + (dq_in_group << 2));
4653da42859SDinh Nguyen }
4663da42859SDinh Nguyen 
4673da42859SDinh Nguyen static void scc_mgr_set_hhp_extras(void)
4683da42859SDinh Nguyen {
4693da42859SDinh Nguyen 	/*
4703da42859SDinh Nguyen 	 * Load the fixed setting in the SCC manager
4713da42859SDinh Nguyen 	 * bits: 0:0 = 1'b1   - dqs bypass
4723da42859SDinh Nguyen 	 * bits: 1:1 = 1'b1   - dq bypass
4733da42859SDinh Nguyen 	 * bits: 4:2 = 3'b001   - rfifo_mode
4743da42859SDinh Nguyen 	 * bits: 6:5 = 2'b01  - rfifo clock_select
4753da42859SDinh Nguyen 	 * bits: 7:7 = 1'b0  - separate gating from ungating setting
4763da42859SDinh Nguyen 	 * bits: 8:8 = 1'b0  - separate OE from Output delay setting
4773da42859SDinh Nguyen 	 */
4783da42859SDinh Nguyen 	uint32_t value = (0<<8) | (0<<7) | (1<<5) | (1<<2) | (1<<1) | (1<<0);
479c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_HHP_GLOBALS_OFFSET;
4803da42859SDinh Nguyen 
48117fdc916SMarek Vasut 	writel(value, addr + SCC_MGR_HHP_EXTRAS_OFFSET);
4823da42859SDinh Nguyen }
4833da42859SDinh Nguyen 
4843da42859SDinh Nguyen static void scc_mgr_set_dqs_out1_delay(uint32_t write_group,
4853da42859SDinh Nguyen 					      uint32_t delay)
4863da42859SDinh Nguyen {
487c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
4883da42859SDinh Nguyen 
4893da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
49017fdc916SMarek Vasut 	writel(delay, addr + (RW_MGR_MEM_DQ_PER_WRITE_DQS << 2));
4913da42859SDinh Nguyen }
4923da42859SDinh Nguyen 
4933da42859SDinh Nguyen static void scc_mgr_set_dm_out1_delay(uint32_t write_group,
4943da42859SDinh Nguyen 					     uint32_t dm, uint32_t delay)
4953da42859SDinh Nguyen {
496c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
4973da42859SDinh Nguyen 
4983da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
49917fdc916SMarek Vasut 	writel(delay, addr +
5003da42859SDinh Nguyen 		((RW_MGR_MEM_DQ_PER_WRITE_DQS + 1 + dm) << 2));
5013da42859SDinh Nguyen }
5023da42859SDinh Nguyen 
5033da42859SDinh Nguyen /*
5043da42859SDinh Nguyen  * USER Zero all DQS config
5053da42859SDinh Nguyen  * TODO: maybe rename to scc_mgr_zero_dqs_config (or something)
5063da42859SDinh Nguyen  */
5073da42859SDinh Nguyen static void scc_mgr_zero_all(void)
5083da42859SDinh Nguyen {
5093da42859SDinh Nguyen 	uint32_t i, r;
5103da42859SDinh Nguyen 
5113da42859SDinh Nguyen 	/*
5123da42859SDinh Nguyen 	 * USER Zero all DQS config settings, across all groups and all
5133da42859SDinh Nguyen 	 * shadow registers
5143da42859SDinh Nguyen 	 */
5153da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r +=
5163da42859SDinh Nguyen 	     NUM_RANKS_PER_SHADOW_REG) {
5173da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
5183da42859SDinh Nguyen 			/*
5193da42859SDinh Nguyen 			 * The phases actually don't exist on a per-rank basis,
5203da42859SDinh Nguyen 			 * but there's no harm updating them several times, so
5213da42859SDinh Nguyen 			 * let's keep the code simple.
5223da42859SDinh Nguyen 			 */
5233da42859SDinh Nguyen 			scc_mgr_set_dqs_bus_in_delay(i, IO_DQS_IN_RESERVE);
5243da42859SDinh Nguyen 			scc_mgr_set_dqs_en_phase(i, 0);
5253da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay(i, 0);
5263da42859SDinh Nguyen 		}
5273da42859SDinh Nguyen 
5283da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_WRITE_DQS_WIDTH; i++) {
5293da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, 0);
5303da42859SDinh Nguyen 			/* av/cv don't have out2 */
5313da42859SDinh Nguyen 			scc_mgr_set_oct_out1_delay(i, IO_DQS_OUT_RESERVE);
5323da42859SDinh Nguyen 		}
5333da42859SDinh Nguyen 	}
5343da42859SDinh Nguyen 
5353da42859SDinh Nguyen 	/* multicast to all DQS group enables */
536*1273dd9eSMarek Vasut 	writel(0xff, &sdr_scc_mgr->dqs_ena);
537*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
5383da42859SDinh Nguyen }
5393da42859SDinh Nguyen 
5403da42859SDinh Nguyen static void scc_set_bypass_mode(uint32_t write_group, uint32_t mode)
5413da42859SDinh Nguyen {
5423da42859SDinh Nguyen 	/* mode = 0 : Do NOT bypass - Half Rate Mode */
5433da42859SDinh Nguyen 	/* mode = 1 : Bypass - Full Rate Mode */
5443da42859SDinh Nguyen 
5453da42859SDinh Nguyen 	/* only need to set once for all groups, pins, dq, dqs, dm */
5463da42859SDinh Nguyen 	if (write_group == 0) {
5473da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d Setting HHP Extras\n", __func__,
5483da42859SDinh Nguyen 			   __LINE__);
5493da42859SDinh Nguyen 		scc_mgr_set_hhp_extras();
5503da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d Done Setting HHP Extras\n",
5513da42859SDinh Nguyen 			  __func__, __LINE__);
5523da42859SDinh Nguyen 	}
5533da42859SDinh Nguyen 	/* multicast to all DQ enables */
554*1273dd9eSMarek Vasut 	writel(0xff, &sdr_scc_mgr->dq_ena);
555*1273dd9eSMarek Vasut 	writel(0xff, &sdr_scc_mgr->dm_ena);
5563da42859SDinh Nguyen 
5573da42859SDinh Nguyen 	/* update current DQS IO enable */
558*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->dqs_io_ena);
5593da42859SDinh Nguyen 
5603da42859SDinh Nguyen 	/* update the DQS logic */
561*1273dd9eSMarek Vasut 	writel(write_group, &sdr_scc_mgr->dqs_ena);
5623da42859SDinh Nguyen 
5633da42859SDinh Nguyen 	/* hit update */
564*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
5653da42859SDinh Nguyen }
5663da42859SDinh Nguyen 
5673da42859SDinh Nguyen static void scc_mgr_zero_group(uint32_t write_group, uint32_t test_begin,
5683da42859SDinh Nguyen 			       int32_t out_only)
5693da42859SDinh Nguyen {
5703da42859SDinh Nguyen 	uint32_t i, r;
5713da42859SDinh Nguyen 
5723da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r +=
5733da42859SDinh Nguyen 		NUM_RANKS_PER_SHADOW_REG) {
5743da42859SDinh Nguyen 		/* Zero all DQ config settings */
5753da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
5763da42859SDinh Nguyen 			scc_mgr_set_dq_out1_delay(write_group, i, 0);
5773da42859SDinh Nguyen 			if (!out_only)
5783da42859SDinh Nguyen 				scc_mgr_set_dq_in_delay(write_group, i, 0);
5793da42859SDinh Nguyen 		}
5803da42859SDinh Nguyen 
5813da42859SDinh Nguyen 		/* multicast to all DQ enables */
582*1273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dq_ena);
5833da42859SDinh Nguyen 
5843da42859SDinh Nguyen 		/* Zero all DM config settings */
5853da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_NUM_DM_PER_WRITE_GROUP; i++) {
5863da42859SDinh Nguyen 			scc_mgr_set_dm_out1_delay(write_group, i, 0);
5873da42859SDinh Nguyen 		}
5883da42859SDinh Nguyen 
5893da42859SDinh Nguyen 		/* multicast to all DM enables */
590*1273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dm_ena);
5913da42859SDinh Nguyen 
5923da42859SDinh Nguyen 		/* zero all DQS io settings */
5933da42859SDinh Nguyen 		if (!out_only)
5943da42859SDinh Nguyen 			scc_mgr_set_dqs_io_in_delay(write_group, 0);
5953da42859SDinh Nguyen 		/* av/cv don't have out2 */
5963da42859SDinh Nguyen 		scc_mgr_set_dqs_out1_delay(write_group, IO_DQS_OUT_RESERVE);
5973da42859SDinh Nguyen 		scc_mgr_set_oct_out1_delay(write_group, IO_DQS_OUT_RESERVE);
5983da42859SDinh Nguyen 		scc_mgr_load_dqs_for_write_group(write_group);
5993da42859SDinh Nguyen 
6003da42859SDinh Nguyen 		/* multicast to all DQS IO enables (only 1) */
601*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->dqs_io_ena);
6023da42859SDinh Nguyen 
6033da42859SDinh Nguyen 		/* hit update to zero everything */
604*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
6053da42859SDinh Nguyen 	}
6063da42859SDinh Nguyen }
6073da42859SDinh Nguyen 
6083da42859SDinh Nguyen /* load up dqs config settings */
6093da42859SDinh Nguyen static void scc_mgr_load_dqs(uint32_t dqs)
6103da42859SDinh Nguyen {
611*1273dd9eSMarek Vasut 	writel(dqs, &sdr_scc_mgr->dqs_ena);
6123da42859SDinh Nguyen }
6133da42859SDinh Nguyen 
6143da42859SDinh Nguyen static void scc_mgr_load_dqs_for_write_group(uint32_t write_group)
6153da42859SDinh Nguyen {
6163da42859SDinh Nguyen 	uint32_t read_group;
617e79025a7SMarek Vasut 	uint32_t addr = (u32)&sdr_scc_mgr->dqs_ena;
6183da42859SDinh Nguyen 	/*
6193da42859SDinh Nguyen 	 * Although OCT affects only write data, the OCT delay is controlled
6203da42859SDinh Nguyen 	 * by the DQS logic block which is instantiated once per read group.
6213da42859SDinh Nguyen 	 * For protocols where a write group consists of multiple read groups,
6223da42859SDinh Nguyen 	 * the setting must be scanned multiple times.
6233da42859SDinh Nguyen 	 */
6243da42859SDinh Nguyen 	for (read_group = write_group * RW_MGR_MEM_IF_READ_DQS_WIDTH /
6253da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH;
6263da42859SDinh Nguyen 	     read_group < (write_group + 1) * RW_MGR_MEM_IF_READ_DQS_WIDTH /
6273da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH; ++read_group)
62817fdc916SMarek Vasut 		writel(read_group, addr);
6293da42859SDinh Nguyen }
6303da42859SDinh Nguyen 
6313da42859SDinh Nguyen /* load up dqs io config settings */
6323da42859SDinh Nguyen static void scc_mgr_load_dqs_io(void)
6333da42859SDinh Nguyen {
634*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->dqs_io_ena);
6353da42859SDinh Nguyen }
6363da42859SDinh Nguyen 
6373da42859SDinh Nguyen /* load up dq config settings */
6383da42859SDinh Nguyen static void scc_mgr_load_dq(uint32_t dq_in_group)
6393da42859SDinh Nguyen {
640*1273dd9eSMarek Vasut 	writel(dq_in_group, &sdr_scc_mgr->dq_ena);
6413da42859SDinh Nguyen }
6423da42859SDinh Nguyen 
6433da42859SDinh Nguyen /* load up dm config settings */
6443da42859SDinh Nguyen static void scc_mgr_load_dm(uint32_t dm)
6453da42859SDinh Nguyen {
646*1273dd9eSMarek Vasut 	writel(dm, &sdr_scc_mgr->dm_ena);
6473da42859SDinh Nguyen }
6483da42859SDinh Nguyen 
6493da42859SDinh Nguyen /*
6503da42859SDinh Nguyen  * apply and load a particular input delay for the DQ pins in a group
6513da42859SDinh Nguyen  * group_bgn is the index of the first dq pin (in the write group)
6523da42859SDinh Nguyen  */
6533da42859SDinh Nguyen static void scc_mgr_apply_group_dq_in_delay(uint32_t write_group,
6543da42859SDinh Nguyen 					    uint32_t group_bgn, uint32_t delay)
6553da42859SDinh Nguyen {
6563da42859SDinh Nguyen 	uint32_t i, p;
6573da42859SDinh Nguyen 
6583da42859SDinh Nguyen 	for (i = 0, p = group_bgn; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++, p++) {
6593da42859SDinh Nguyen 		scc_mgr_set_dq_in_delay(write_group, p, delay);
6603da42859SDinh Nguyen 		scc_mgr_load_dq(p);
6613da42859SDinh Nguyen 	}
6623da42859SDinh Nguyen }
6633da42859SDinh Nguyen 
6643da42859SDinh Nguyen /* apply and load a particular output delay for the DQ pins in a group */
6653da42859SDinh Nguyen static void scc_mgr_apply_group_dq_out1_delay(uint32_t write_group,
6663da42859SDinh Nguyen 					      uint32_t group_bgn,
6673da42859SDinh Nguyen 					      uint32_t delay1)
6683da42859SDinh Nguyen {
6693da42859SDinh Nguyen 	uint32_t i, p;
6703da42859SDinh Nguyen 
6713da42859SDinh Nguyen 	for (i = 0, p = group_bgn; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++, p++) {
6723da42859SDinh Nguyen 		scc_mgr_set_dq_out1_delay(write_group, i, delay1);
6733da42859SDinh Nguyen 		scc_mgr_load_dq(i);
6743da42859SDinh Nguyen 	}
6753da42859SDinh Nguyen }
6763da42859SDinh Nguyen 
6773da42859SDinh Nguyen /* apply and load a particular output delay for the DM pins in a group */
6783da42859SDinh Nguyen static void scc_mgr_apply_group_dm_out1_delay(uint32_t write_group,
6793da42859SDinh Nguyen 					      uint32_t delay1)
6803da42859SDinh Nguyen {
6813da42859SDinh Nguyen 	uint32_t i;
6823da42859SDinh Nguyen 
6833da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_NUM_DM_PER_WRITE_GROUP; i++) {
6843da42859SDinh Nguyen 		scc_mgr_set_dm_out1_delay(write_group, i, delay1);
6853da42859SDinh Nguyen 		scc_mgr_load_dm(i);
6863da42859SDinh Nguyen 	}
6873da42859SDinh Nguyen }
6883da42859SDinh Nguyen 
6893da42859SDinh Nguyen 
6903da42859SDinh Nguyen /* apply and load delay on both DQS and OCT out1 */
6913da42859SDinh Nguyen static void scc_mgr_apply_group_dqs_io_and_oct_out1(uint32_t write_group,
6923da42859SDinh Nguyen 						    uint32_t delay)
6933da42859SDinh Nguyen {
6943da42859SDinh Nguyen 	scc_mgr_set_dqs_out1_delay(write_group, delay);
6953da42859SDinh Nguyen 	scc_mgr_load_dqs_io();
6963da42859SDinh Nguyen 
6973da42859SDinh Nguyen 	scc_mgr_set_oct_out1_delay(write_group, delay);
6983da42859SDinh Nguyen 	scc_mgr_load_dqs_for_write_group(write_group);
6993da42859SDinh Nguyen }
7003da42859SDinh Nguyen 
7013da42859SDinh Nguyen /* apply a delay to the entire output side: DQ, DM, DQS, OCT */
7023da42859SDinh Nguyen static void scc_mgr_apply_group_all_out_delay_add(uint32_t write_group,
7033da42859SDinh Nguyen 						  uint32_t group_bgn,
7043da42859SDinh Nguyen 						  uint32_t delay)
7053da42859SDinh Nguyen {
7063da42859SDinh Nguyen 	uint32_t i, p, new_delay;
7073da42859SDinh Nguyen 
7083da42859SDinh Nguyen 	/* dq shift */
7093da42859SDinh Nguyen 	for (i = 0, p = group_bgn; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++, p++) {
7103da42859SDinh Nguyen 		new_delay = READ_SCC_DQ_OUT2_DELAY;
7113da42859SDinh Nguyen 		new_delay += delay;
7123da42859SDinh Nguyen 
7133da42859SDinh Nguyen 		if (new_delay > IO_IO_OUT2_DELAY_MAX) {
7143da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DQ[%u,%u]:\
7153da42859SDinh Nguyen 				   %u > %lu => %lu", __func__, __LINE__,
7163da42859SDinh Nguyen 				   write_group, group_bgn, delay, i, p, new_delay,
7173da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX,
7183da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX);
7193da42859SDinh Nguyen 			new_delay = IO_IO_OUT2_DELAY_MAX;
7203da42859SDinh Nguyen 		}
7213da42859SDinh Nguyen 
7223da42859SDinh Nguyen 		scc_mgr_load_dq(i);
7233da42859SDinh Nguyen 	}
7243da42859SDinh Nguyen 
7253da42859SDinh Nguyen 	/* dm shift */
7263da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_NUM_DM_PER_WRITE_GROUP; i++) {
7273da42859SDinh Nguyen 		new_delay = READ_SCC_DM_IO_OUT2_DELAY;
7283da42859SDinh Nguyen 		new_delay += delay;
7293da42859SDinh Nguyen 
7303da42859SDinh Nguyen 		if (new_delay > IO_IO_OUT2_DELAY_MAX) {
7313da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DM[%u]:\
7323da42859SDinh Nguyen 				   %u > %lu => %lu\n",  __func__, __LINE__,
7333da42859SDinh Nguyen 				   write_group, group_bgn, delay, i, new_delay,
7343da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX,
7353da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX);
7363da42859SDinh Nguyen 			new_delay = IO_IO_OUT2_DELAY_MAX;
7373da42859SDinh Nguyen 		}
7383da42859SDinh Nguyen 
7393da42859SDinh Nguyen 		scc_mgr_load_dm(i);
7403da42859SDinh Nguyen 	}
7413da42859SDinh Nguyen 
7423da42859SDinh Nguyen 	/* dqs shift */
7433da42859SDinh Nguyen 	new_delay = READ_SCC_DQS_IO_OUT2_DELAY;
7443da42859SDinh Nguyen 	new_delay += delay;
7453da42859SDinh Nguyen 
7463da42859SDinh Nguyen 	if (new_delay > IO_IO_OUT2_DELAY_MAX) {
7473da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DQS: %u > %d => %d;"
7483da42859SDinh Nguyen 			   " adding %u to OUT1\n", __func__, __LINE__,
7493da42859SDinh Nguyen 			   write_group, group_bgn, delay, new_delay,
7503da42859SDinh Nguyen 			   IO_IO_OUT2_DELAY_MAX, IO_IO_OUT2_DELAY_MAX,
7513da42859SDinh Nguyen 			   new_delay - IO_IO_OUT2_DELAY_MAX);
7523da42859SDinh Nguyen 		scc_mgr_set_dqs_out1_delay(write_group, new_delay -
7533da42859SDinh Nguyen 					   IO_IO_OUT2_DELAY_MAX);
7543da42859SDinh Nguyen 		new_delay = IO_IO_OUT2_DELAY_MAX;
7553da42859SDinh Nguyen 	}
7563da42859SDinh Nguyen 
7573da42859SDinh Nguyen 	scc_mgr_load_dqs_io();
7583da42859SDinh Nguyen 
7593da42859SDinh Nguyen 	/* oct shift */
7603da42859SDinh Nguyen 	new_delay = READ_SCC_OCT_OUT2_DELAY;
7613da42859SDinh Nguyen 	new_delay += delay;
7623da42859SDinh Nguyen 
7633da42859SDinh Nguyen 	if (new_delay > IO_IO_OUT2_DELAY_MAX) {
7643da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DQS: %u > %d => %d;"
7653da42859SDinh Nguyen 			   " adding %u to OUT1\n", __func__, __LINE__,
7663da42859SDinh Nguyen 			   write_group, group_bgn, delay, new_delay,
7673da42859SDinh Nguyen 			   IO_IO_OUT2_DELAY_MAX, IO_IO_OUT2_DELAY_MAX,
7683da42859SDinh Nguyen 			   new_delay - IO_IO_OUT2_DELAY_MAX);
7693da42859SDinh Nguyen 		scc_mgr_set_oct_out1_delay(write_group, new_delay -
7703da42859SDinh Nguyen 					   IO_IO_OUT2_DELAY_MAX);
7713da42859SDinh Nguyen 		new_delay = IO_IO_OUT2_DELAY_MAX;
7723da42859SDinh Nguyen 	}
7733da42859SDinh Nguyen 
7743da42859SDinh Nguyen 	scc_mgr_load_dqs_for_write_group(write_group);
7753da42859SDinh Nguyen }
7763da42859SDinh Nguyen 
7773da42859SDinh Nguyen /*
7783da42859SDinh Nguyen  * USER apply a delay to the entire output side (DQ, DM, DQS, OCT)
7793da42859SDinh Nguyen  * and to all ranks
7803da42859SDinh Nguyen  */
7813da42859SDinh Nguyen static void scc_mgr_apply_group_all_out_delay_add_all_ranks(
7823da42859SDinh Nguyen 	uint32_t write_group, uint32_t group_bgn, uint32_t delay)
7833da42859SDinh Nguyen {
7843da42859SDinh Nguyen 	uint32_t r;
7853da42859SDinh Nguyen 
7863da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
7873da42859SDinh Nguyen 		r += NUM_RANKS_PER_SHADOW_REG) {
7883da42859SDinh Nguyen 		scc_mgr_apply_group_all_out_delay_add(write_group,
7893da42859SDinh Nguyen 						      group_bgn, delay);
790*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
7913da42859SDinh Nguyen 	}
7923da42859SDinh Nguyen }
7933da42859SDinh Nguyen 
7943da42859SDinh Nguyen /* optimization used to recover some slots in ddr3 inst_rom */
7953da42859SDinh Nguyen /* could be applied to other protocols if we wanted to */
7963da42859SDinh Nguyen static void set_jump_as_return(void)
7973da42859SDinh Nguyen {
7983da42859SDinh Nguyen 	/*
7993da42859SDinh Nguyen 	 * to save space, we replace return with jump to special shared
8003da42859SDinh Nguyen 	 * RETURN instruction so we set the counter to large value so that
8013da42859SDinh Nguyen 	 * we always jump
8023da42859SDinh Nguyen 	 */
803*1273dd9eSMarek Vasut 	writel(0xff, &sdr_rw_load_mgr_regs->load_cntr0);
804*1273dd9eSMarek Vasut 	writel(RW_MGR_RETURN, &sdr_rw_load_jump_mgr_regs->load_jump_add0);
8053da42859SDinh Nguyen }
8063da42859SDinh Nguyen 
8073da42859SDinh Nguyen /*
8083da42859SDinh Nguyen  * should always use constants as argument to ensure all computations are
8093da42859SDinh Nguyen  * performed at compile time
8103da42859SDinh Nguyen  */
8113da42859SDinh Nguyen static void delay_for_n_mem_clocks(const uint32_t clocks)
8123da42859SDinh Nguyen {
8133da42859SDinh Nguyen 	uint32_t afi_clocks;
8143da42859SDinh Nguyen 	uint8_t inner = 0;
8153da42859SDinh Nguyen 	uint8_t outer = 0;
8163da42859SDinh Nguyen 	uint16_t c_loop = 0;
8173da42859SDinh Nguyen 
8183da42859SDinh Nguyen 	debug("%s:%d: clocks=%u ... start\n", __func__, __LINE__, clocks);
8193da42859SDinh Nguyen 
8203da42859SDinh Nguyen 
8213da42859SDinh Nguyen 	afi_clocks = (clocks + AFI_RATE_RATIO-1) / AFI_RATE_RATIO;
8223da42859SDinh Nguyen 	/* scale (rounding up) to get afi clocks */
8233da42859SDinh Nguyen 
8243da42859SDinh Nguyen 	/*
8253da42859SDinh Nguyen 	 * Note, we don't bother accounting for being off a little bit
8263da42859SDinh Nguyen 	 * because of a few extra instructions in outer loops
8273da42859SDinh Nguyen 	 * Note, the loops have a test at the end, and do the test before
8283da42859SDinh Nguyen 	 * the decrement, and so always perform the loop
8293da42859SDinh Nguyen 	 * 1 time more than the counter value
8303da42859SDinh Nguyen 	 */
8313da42859SDinh Nguyen 	if (afi_clocks == 0) {
8323da42859SDinh Nguyen 		;
8333da42859SDinh Nguyen 	} else if (afi_clocks <= 0x100) {
8343da42859SDinh Nguyen 		inner = afi_clocks-1;
8353da42859SDinh Nguyen 		outer = 0;
8363da42859SDinh Nguyen 		c_loop = 0;
8373da42859SDinh Nguyen 	} else if (afi_clocks <= 0x10000) {
8383da42859SDinh Nguyen 		inner = 0xff;
8393da42859SDinh Nguyen 		outer = (afi_clocks-1) >> 8;
8403da42859SDinh Nguyen 		c_loop = 0;
8413da42859SDinh Nguyen 	} else {
8423da42859SDinh Nguyen 		inner = 0xff;
8433da42859SDinh Nguyen 		outer = 0xff;
8443da42859SDinh Nguyen 		c_loop = (afi_clocks-1) >> 16;
8453da42859SDinh Nguyen 	}
8463da42859SDinh Nguyen 
8473da42859SDinh Nguyen 	/*
8483da42859SDinh Nguyen 	 * rom instructions are structured as follows:
8493da42859SDinh Nguyen 	 *
8503da42859SDinh Nguyen 	 *    IDLE_LOOP2: jnz cntr0, TARGET_A
8513da42859SDinh Nguyen 	 *    IDLE_LOOP1: jnz cntr1, TARGET_B
8523da42859SDinh Nguyen 	 *                return
8533da42859SDinh Nguyen 	 *
8543da42859SDinh Nguyen 	 * so, when doing nested loops, TARGET_A is set to IDLE_LOOP2, and
8553da42859SDinh Nguyen 	 * TARGET_B is set to IDLE_LOOP2 as well
8563da42859SDinh Nguyen 	 *
8573da42859SDinh Nguyen 	 * if we have no outer loop, though, then we can use IDLE_LOOP1 only,
8583da42859SDinh Nguyen 	 * and set TARGET_B to IDLE_LOOP1 and we skip IDLE_LOOP2 entirely
8593da42859SDinh Nguyen 	 *
8603da42859SDinh Nguyen 	 * a little confusing, but it helps save precious space in the inst_rom
8613da42859SDinh Nguyen 	 * and sequencer rom and keeps the delays more accurate and reduces
8623da42859SDinh Nguyen 	 * overhead
8633da42859SDinh Nguyen 	 */
8643da42859SDinh Nguyen 	if (afi_clocks <= 0x100) {
865*1273dd9eSMarek Vasut 		writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(inner),
866*1273dd9eSMarek Vasut 			&sdr_rw_load_mgr_regs->load_cntr1);
8673da42859SDinh Nguyen 
868*1273dd9eSMarek Vasut 		writel(RW_MGR_IDLE_LOOP1,
869*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
8703da42859SDinh Nguyen 
871*1273dd9eSMarek Vasut 		writel(RW_MGR_IDLE_LOOP1, SDR_PHYGRP_RWMGRGRP_ADDRESS |
872*1273dd9eSMarek Vasut 					  RW_MGR_RUN_SINGLE_GROUP_OFFSET);
8733da42859SDinh Nguyen 	} else {
874*1273dd9eSMarek Vasut 		writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(inner),
875*1273dd9eSMarek Vasut 			&sdr_rw_load_mgr_regs->load_cntr0);
8763da42859SDinh Nguyen 
877*1273dd9eSMarek Vasut 		writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(outer),
878*1273dd9eSMarek Vasut 			&sdr_rw_load_mgr_regs->load_cntr1);
8793da42859SDinh Nguyen 
880*1273dd9eSMarek Vasut 		writel(RW_MGR_IDLE_LOOP2,
881*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
8823da42859SDinh Nguyen 
883*1273dd9eSMarek Vasut 		writel(RW_MGR_IDLE_LOOP2,
884*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
8853da42859SDinh Nguyen 
8863da42859SDinh Nguyen 		/* hack to get around compiler not being smart enough */
8873da42859SDinh Nguyen 		if (afi_clocks <= 0x10000) {
8883da42859SDinh Nguyen 			/* only need to run once */
889*1273dd9eSMarek Vasut 			writel(RW_MGR_IDLE_LOOP2, SDR_PHYGRP_RWMGRGRP_ADDRESS |
890*1273dd9eSMarek Vasut 						  RW_MGR_RUN_SINGLE_GROUP_OFFSET);
8913da42859SDinh Nguyen 		} else {
8923da42859SDinh Nguyen 			do {
893*1273dd9eSMarek Vasut 				writel(RW_MGR_IDLE_LOOP2,
894*1273dd9eSMarek Vasut 					SDR_PHYGRP_RWMGRGRP_ADDRESS |
895*1273dd9eSMarek Vasut 					RW_MGR_RUN_SINGLE_GROUP_OFFSET);
8963da42859SDinh Nguyen 			} while (c_loop-- != 0);
8973da42859SDinh Nguyen 		}
8983da42859SDinh Nguyen 	}
8993da42859SDinh Nguyen 	debug("%s:%d clocks=%u ... end\n", __func__, __LINE__, clocks);
9003da42859SDinh Nguyen }
9013da42859SDinh Nguyen 
9023da42859SDinh Nguyen static void rw_mgr_mem_initialize(void)
9033da42859SDinh Nguyen {
9043da42859SDinh Nguyen 	uint32_t r;
905*1273dd9eSMarek Vasut 	uint32_t grpaddr = SDR_PHYGRP_RWMGRGRP_ADDRESS |
906*1273dd9eSMarek Vasut 			   RW_MGR_RUN_SINGLE_GROUP_OFFSET;
9073da42859SDinh Nguyen 
9083da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
9093da42859SDinh Nguyen 
9103da42859SDinh Nguyen 	/* The reset / cke part of initialization is broadcasted to all ranks */
911*1273dd9eSMarek Vasut 	writel(RW_MGR_RANK_ALL, SDR_PHYGRP_RWMGRGRP_ADDRESS |
912*1273dd9eSMarek Vasut 				RW_MGR_SET_CS_AND_ODT_MASK_OFFSET);
9133da42859SDinh Nguyen 
9143da42859SDinh Nguyen 	/*
9153da42859SDinh Nguyen 	 * Here's how you load register for a loop
9163da42859SDinh Nguyen 	 * Counters are located @ 0x800
9173da42859SDinh Nguyen 	 * Jump address are located @ 0xC00
9183da42859SDinh Nguyen 	 * For both, registers 0 to 3 are selected using bits 3 and 2, like
9193da42859SDinh Nguyen 	 * in 0x800, 0x804, 0x808, 0x80C and 0xC00, 0xC04, 0xC08, 0xC0C
9203da42859SDinh Nguyen 	 * I know this ain't pretty, but Avalon bus throws away the 2 least
9213da42859SDinh Nguyen 	 * significant bits
9223da42859SDinh Nguyen 	 */
9233da42859SDinh Nguyen 
9243da42859SDinh Nguyen 	/* start with memory RESET activated */
9253da42859SDinh Nguyen 
9263da42859SDinh Nguyen 	/* tINIT = 200us */
9273da42859SDinh Nguyen 
9283da42859SDinh Nguyen 	/*
9293da42859SDinh Nguyen 	 * 200us @ 266MHz (3.75 ns) ~ 54000 clock cycles
9303da42859SDinh Nguyen 	 * If a and b are the number of iteration in 2 nested loops
9313da42859SDinh Nguyen 	 * it takes the following number of cycles to complete the operation:
9323da42859SDinh Nguyen 	 * number_of_cycles = ((2 + n) * a + 2) * b
9333da42859SDinh Nguyen 	 * where n is the number of instruction in the inner loop
9343da42859SDinh Nguyen 	 * One possible solution is n = 0 , a = 256 , b = 106 => a = FF,
9353da42859SDinh Nguyen 	 * b = 6A
9363da42859SDinh Nguyen 	 */
9373da42859SDinh Nguyen 
9383da42859SDinh Nguyen 	/* Load counters */
9393da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TINIT_CNTR0_VAL),
940*1273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr0);
9413da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TINIT_CNTR1_VAL),
942*1273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr1);
9433da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TINIT_CNTR2_VAL),
944*1273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr2);
9453da42859SDinh Nguyen 
9463da42859SDinh Nguyen 	/* Load jump address */
947*1273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_0_CKE_0,
948*1273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add0);
949*1273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_0_CKE_0,
950*1273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add1);
951*1273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_0_CKE_0,
952*1273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add2);
9533da42859SDinh Nguyen 
9543da42859SDinh Nguyen 	/* Execute count instruction */
955*1273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_0_CKE_0, grpaddr);
9563da42859SDinh Nguyen 
9573da42859SDinh Nguyen 	/* indicate that memory is stable */
958*1273dd9eSMarek Vasut 	writel(1, &phy_mgr_cfg->reset_mem_stbl);
9593da42859SDinh Nguyen 
9603da42859SDinh Nguyen 	/*
9613da42859SDinh Nguyen 	 * transition the RESET to high
9623da42859SDinh Nguyen 	 * Wait for 500us
9633da42859SDinh Nguyen 	 */
9643da42859SDinh Nguyen 
9653da42859SDinh Nguyen 	/*
9663da42859SDinh Nguyen 	 * 500us @ 266MHz (3.75 ns) ~ 134000 clock cycles
9673da42859SDinh Nguyen 	 * If a and b are the number of iteration in 2 nested loops
9683da42859SDinh Nguyen 	 * it takes the following number of cycles to complete the operation
9693da42859SDinh Nguyen 	 * number_of_cycles = ((2 + n) * a + 2) * b
9703da42859SDinh Nguyen 	 * where n is the number of instruction in the inner loop
9713da42859SDinh Nguyen 	 * One possible solution is n = 2 , a = 131 , b = 256 => a = 83,
9723da42859SDinh Nguyen 	 * b = FF
9733da42859SDinh Nguyen 	 */
9743da42859SDinh Nguyen 
9753da42859SDinh Nguyen 	/* Load counters */
9763da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TRESET_CNTR0_VAL),
977*1273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr0);
9783da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TRESET_CNTR1_VAL),
979*1273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr1);
9803da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TRESET_CNTR2_VAL),
981*1273dd9eSMarek Vasut 	       &sdr_rw_load_mgr_regs->load_cntr2);
9823da42859SDinh Nguyen 
9833da42859SDinh Nguyen 	/* Load jump address */
984*1273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_1_CKE_0,
985*1273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add0);
986*1273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_1_CKE_0,
987*1273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add1);
988*1273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_1_CKE_0,
989*1273dd9eSMarek Vasut 		&sdr_rw_load_jump_mgr_regs->load_jump_add2);
9903da42859SDinh Nguyen 
991*1273dd9eSMarek Vasut 	writel(RW_MGR_INIT_RESET_1_CKE_0, grpaddr);
9923da42859SDinh Nguyen 
9933da42859SDinh Nguyen 	/* bring up clock enable */
9943da42859SDinh Nguyen 
9953da42859SDinh Nguyen 	/* tXRP < 250 ck cycles */
9963da42859SDinh Nguyen 	delay_for_n_mem_clocks(250);
9973da42859SDinh Nguyen 
9983da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r++) {
9993da42859SDinh Nguyen 		if (param->skip_ranks[r]) {
10003da42859SDinh Nguyen 			/* request to skip the rank */
10013da42859SDinh Nguyen 			continue;
10023da42859SDinh Nguyen 		}
10033da42859SDinh Nguyen 
10043da42859SDinh Nguyen 		/* set rank */
10053da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_OFF);
10063da42859SDinh Nguyen 
10073da42859SDinh Nguyen 		/*
10083da42859SDinh Nguyen 		 * USER Use Mirror-ed commands for odd ranks if address
10093da42859SDinh Nguyen 		 * mirrorring is on
10103da42859SDinh Nguyen 		 */
10113da42859SDinh Nguyen 		if ((RW_MGR_MEM_ADDRESS_MIRRORING >> r) & 0x1) {
10123da42859SDinh Nguyen 			set_jump_as_return();
1013*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS2_MIRR, grpaddr);
10143da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10153da42859SDinh Nguyen 			set_jump_as_return();
1016*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS3_MIRR, grpaddr);
10173da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10183da42859SDinh Nguyen 			set_jump_as_return();
1019*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS1_MIRR, grpaddr);
10203da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10213da42859SDinh Nguyen 			set_jump_as_return();
1022*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS0_DLL_RESET_MIRR, grpaddr);
10233da42859SDinh Nguyen 		} else {
10243da42859SDinh Nguyen 			set_jump_as_return();
1025*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS2, grpaddr);
10263da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10273da42859SDinh Nguyen 			set_jump_as_return();
1028*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS3, grpaddr);
10293da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10303da42859SDinh Nguyen 			set_jump_as_return();
1031*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS1, grpaddr);
10323da42859SDinh Nguyen 			set_jump_as_return();
1033*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS0_DLL_RESET, grpaddr);
10343da42859SDinh Nguyen 		}
10353da42859SDinh Nguyen 		set_jump_as_return();
1036*1273dd9eSMarek Vasut 		writel(RW_MGR_ZQCL, grpaddr);
10373da42859SDinh Nguyen 
10383da42859SDinh Nguyen 		/* tZQinit = tDLLK = 512 ck cycles */
10393da42859SDinh Nguyen 		delay_for_n_mem_clocks(512);
10403da42859SDinh Nguyen 	}
10413da42859SDinh Nguyen }
10423da42859SDinh Nguyen 
10433da42859SDinh Nguyen /*
10443da42859SDinh Nguyen  * At the end of calibration we have to program the user settings in, and
10453da42859SDinh Nguyen  * USER  hand off the memory to the user.
10463da42859SDinh Nguyen  */
10473da42859SDinh Nguyen static void rw_mgr_mem_handoff(void)
10483da42859SDinh Nguyen {
10493da42859SDinh Nguyen 	uint32_t r;
1050*1273dd9eSMarek Vasut 	uint32_t grpaddr = SDR_PHYGRP_RWMGRGRP_ADDRESS |
1051*1273dd9eSMarek Vasut 			   RW_MGR_RUN_SINGLE_GROUP_OFFSET;
10523da42859SDinh Nguyen 
10533da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
10543da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r++) {
10553da42859SDinh Nguyen 		if (param->skip_ranks[r])
10563da42859SDinh Nguyen 			/* request to skip the rank */
10573da42859SDinh Nguyen 			continue;
10583da42859SDinh Nguyen 		/* set rank */
10593da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_OFF);
10603da42859SDinh Nguyen 
10613da42859SDinh Nguyen 		/* precharge all banks ... */
1062*1273dd9eSMarek Vasut 		writel(RW_MGR_PRECHARGE_ALL, grpaddr);
10633da42859SDinh Nguyen 
10643da42859SDinh Nguyen 		/* load up MR settings specified by user */
10653da42859SDinh Nguyen 
10663da42859SDinh Nguyen 		/*
10673da42859SDinh Nguyen 		 * Use Mirror-ed commands for odd ranks if address
10683da42859SDinh Nguyen 		 * mirrorring is on
10693da42859SDinh Nguyen 		 */
10703da42859SDinh Nguyen 		if ((RW_MGR_MEM_ADDRESS_MIRRORING >> r) & 0x1) {
10713da42859SDinh Nguyen 			set_jump_as_return();
1072*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS2_MIRR, grpaddr);
10733da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10743da42859SDinh Nguyen 			set_jump_as_return();
1075*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS3_MIRR, grpaddr);
10763da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10773da42859SDinh Nguyen 			set_jump_as_return();
1078*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS1_MIRR, grpaddr);
10793da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10803da42859SDinh Nguyen 			set_jump_as_return();
1081*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS0_USER_MIRR, grpaddr);
10823da42859SDinh Nguyen 		} else {
10833da42859SDinh Nguyen 			set_jump_as_return();
1084*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS2, grpaddr);
10853da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10863da42859SDinh Nguyen 			set_jump_as_return();
1087*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS3, grpaddr);
10883da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10893da42859SDinh Nguyen 			set_jump_as_return();
1090*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS1, grpaddr);
10913da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10923da42859SDinh Nguyen 			set_jump_as_return();
1093*1273dd9eSMarek Vasut 			writel(RW_MGR_MRS0_USER, grpaddr);
10943da42859SDinh Nguyen 		}
10953da42859SDinh Nguyen 		/*
10963da42859SDinh Nguyen 		 * USER  need to wait tMOD (12CK or 15ns) time before issuing
10973da42859SDinh Nguyen 		 * other commands, but we will have plenty of NIOS cycles before
10983da42859SDinh Nguyen 		 * actual handoff so its okay.
10993da42859SDinh Nguyen 		 */
11003da42859SDinh Nguyen 	}
11013da42859SDinh Nguyen }
11023da42859SDinh Nguyen 
11033da42859SDinh Nguyen /*
11043da42859SDinh Nguyen  * performs a guaranteed read on the patterns we are going to use during a
11053da42859SDinh Nguyen  * read test to ensure memory works
11063da42859SDinh Nguyen  */
11073da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test_patterns(uint32_t rank_bgn,
11083da42859SDinh Nguyen 	uint32_t group, uint32_t num_tries, uint32_t *bit_chk,
11093da42859SDinh Nguyen 	uint32_t all_ranks)
11103da42859SDinh Nguyen {
11113da42859SDinh Nguyen 	uint32_t r, vg;
11123da42859SDinh Nguyen 	uint32_t correct_mask_vg;
11133da42859SDinh Nguyen 	uint32_t tmp_bit_chk;
11143da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
11153da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
11163da42859SDinh Nguyen 	uint32_t addr;
11173da42859SDinh Nguyen 	uint32_t base_rw_mgr;
11183da42859SDinh Nguyen 
11193da42859SDinh Nguyen 	*bit_chk = param->read_correct_mask;
11203da42859SDinh Nguyen 	correct_mask_vg = param->read_correct_mask_vg;
11213da42859SDinh Nguyen 
11223da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
11233da42859SDinh Nguyen 		if (param->skip_ranks[r])
11243da42859SDinh Nguyen 			/* request to skip the rank */
11253da42859SDinh Nguyen 			continue;
11263da42859SDinh Nguyen 
11273da42859SDinh Nguyen 		/* set rank */
11283da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
11293da42859SDinh Nguyen 
11303da42859SDinh Nguyen 		/* Load up a constant bursts of read commands */
1131*1273dd9eSMarek Vasut 		writel(0x20, &sdr_rw_load_mgr_regs->load_cntr0);
1132*1273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_READ,
1133*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
11343da42859SDinh Nguyen 
1135*1273dd9eSMarek Vasut 		writel(0x20, &sdr_rw_load_mgr_regs->load_cntr1);
1136*1273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_READ_CONT,
1137*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
11383da42859SDinh Nguyen 
11393da42859SDinh Nguyen 		tmp_bit_chk = 0;
11403da42859SDinh Nguyen 		for (vg = RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS-1; ; vg--) {
11413da42859SDinh Nguyen 			/* reset the fifos to get pointers to known state */
11423da42859SDinh Nguyen 
1143*1273dd9eSMarek Vasut 			writel(0, &phy_mgr_cmd->fifo_reset);
1144*1273dd9eSMarek Vasut 			writel(0, SDR_PHYGRP_RWMGRGRP_ADDRESS |
1145*1273dd9eSMarek Vasut 				  RW_MGR_RESET_READ_DATAPATH_OFFSET);
11463da42859SDinh Nguyen 
11473da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk << (RW_MGR_MEM_DQ_PER_READ_DQS
11483da42859SDinh Nguyen 				/ RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS);
11493da42859SDinh Nguyen 
1150c4815f76SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
115117fdc916SMarek Vasut 			writel(RW_MGR_GUARANTEED_READ, addr +
11523da42859SDinh Nguyen 			       ((group * RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS +
11533da42859SDinh Nguyen 				vg) << 2));
11543da42859SDinh Nguyen 
1155*1273dd9eSMarek Vasut 			base_rw_mgr = readl(SDR_PHYGRP_RWMGRGRP_ADDRESS);
11563da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk | (correct_mask_vg & (~base_rw_mgr));
11573da42859SDinh Nguyen 
11583da42859SDinh Nguyen 			if (vg == 0)
11593da42859SDinh Nguyen 				break;
11603da42859SDinh Nguyen 		}
11613da42859SDinh Nguyen 		*bit_chk &= tmp_bit_chk;
11623da42859SDinh Nguyen 	}
11633da42859SDinh Nguyen 
1164c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
116517fdc916SMarek Vasut 	writel(RW_MGR_CLEAR_DQS_ENABLE, addr + (group << 2));
11663da42859SDinh Nguyen 
11673da42859SDinh Nguyen 	set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
11683da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d test_load_patterns(%u,ALL) => (%u == %u) =>\
11693da42859SDinh Nguyen 		   %lu\n", __func__, __LINE__, group, *bit_chk, param->read_correct_mask,
11703da42859SDinh Nguyen 		   (long unsigned int)(*bit_chk == param->read_correct_mask));
11713da42859SDinh Nguyen 	return *bit_chk == param->read_correct_mask;
11723da42859SDinh Nguyen }
11733da42859SDinh Nguyen 
11743da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test_patterns_all_ranks
11753da42859SDinh Nguyen 	(uint32_t group, uint32_t num_tries, uint32_t *bit_chk)
11763da42859SDinh Nguyen {
11773da42859SDinh Nguyen 	return rw_mgr_mem_calibrate_read_test_patterns(0, group,
11783da42859SDinh Nguyen 		num_tries, bit_chk, 1);
11793da42859SDinh Nguyen }
11803da42859SDinh Nguyen 
11813da42859SDinh Nguyen /* load up the patterns we are going to use during a read test */
11823da42859SDinh Nguyen static void rw_mgr_mem_calibrate_read_load_patterns(uint32_t rank_bgn,
11833da42859SDinh Nguyen 	uint32_t all_ranks)
11843da42859SDinh Nguyen {
11853da42859SDinh Nguyen 	uint32_t r;
11863da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
11873da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
11883da42859SDinh Nguyen 
11893da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
11903da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
11913da42859SDinh Nguyen 		if (param->skip_ranks[r])
11923da42859SDinh Nguyen 			/* request to skip the rank */
11933da42859SDinh Nguyen 			continue;
11943da42859SDinh Nguyen 
11953da42859SDinh Nguyen 		/* set rank */
11963da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
11973da42859SDinh Nguyen 
11983da42859SDinh Nguyen 		/* Load up a constant bursts */
1199*1273dd9eSMarek Vasut 		writel(0x20, &sdr_rw_load_mgr_regs->load_cntr0);
12003da42859SDinh Nguyen 
1201*1273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE_WAIT0,
1202*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
12033da42859SDinh Nguyen 
1204*1273dd9eSMarek Vasut 		writel(0x20, &sdr_rw_load_mgr_regs->load_cntr1);
12053da42859SDinh Nguyen 
1206*1273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE_WAIT1,
1207*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
12083da42859SDinh Nguyen 
1209*1273dd9eSMarek Vasut 		writel(0x04, &sdr_rw_load_mgr_regs->load_cntr2);
12103da42859SDinh Nguyen 
1211*1273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE_WAIT2,
1212*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add2);
12133da42859SDinh Nguyen 
1214*1273dd9eSMarek Vasut 		writel(0x04, &sdr_rw_load_mgr_regs->load_cntr3);
12153da42859SDinh Nguyen 
1216*1273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE_WAIT3,
1217*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add3);
12183da42859SDinh Nguyen 
1219*1273dd9eSMarek Vasut 		writel(RW_MGR_GUARANTEED_WRITE, SDR_PHYGRP_RWMGRGRP_ADDRESS |
1220*1273dd9eSMarek Vasut 						RW_MGR_RUN_SINGLE_GROUP_OFFSET);
12213da42859SDinh Nguyen 	}
12223da42859SDinh Nguyen 
12233da42859SDinh Nguyen 	set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
12243da42859SDinh Nguyen }
12253da42859SDinh Nguyen 
12263da42859SDinh Nguyen /*
12273da42859SDinh Nguyen  * try a read and see if it returns correct data back. has dummy reads
12283da42859SDinh Nguyen  * inserted into the mix used to align dqs enable. has more thorough checks
12293da42859SDinh Nguyen  * than the regular read test.
12303da42859SDinh Nguyen  */
12313da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test(uint32_t rank_bgn, uint32_t group,
12323da42859SDinh Nguyen 	uint32_t num_tries, uint32_t all_correct, uint32_t *bit_chk,
12333da42859SDinh Nguyen 	uint32_t all_groups, uint32_t all_ranks)
12343da42859SDinh Nguyen {
12353da42859SDinh Nguyen 	uint32_t r, vg;
12363da42859SDinh Nguyen 	uint32_t correct_mask_vg;
12373da42859SDinh Nguyen 	uint32_t tmp_bit_chk;
12383da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
12393da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
12403da42859SDinh Nguyen 	uint32_t addr;
12413da42859SDinh Nguyen 	uint32_t base_rw_mgr;
12423da42859SDinh Nguyen 
12433da42859SDinh Nguyen 	*bit_chk = param->read_correct_mask;
12443da42859SDinh Nguyen 	correct_mask_vg = param->read_correct_mask_vg;
12453da42859SDinh Nguyen 
12463da42859SDinh Nguyen 	uint32_t quick_read_mode = (((STATIC_CALIB_STEPS) &
12473da42859SDinh Nguyen 		CALIB_SKIP_DELAY_SWEEPS) && ENABLE_SUPER_QUICK_CALIBRATION);
12483da42859SDinh Nguyen 
12493da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
12503da42859SDinh Nguyen 		if (param->skip_ranks[r])
12513da42859SDinh Nguyen 			/* request to skip the rank */
12523da42859SDinh Nguyen 			continue;
12533da42859SDinh Nguyen 
12543da42859SDinh Nguyen 		/* set rank */
12553da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
12563da42859SDinh Nguyen 
1257*1273dd9eSMarek Vasut 		writel(0x10, &sdr_rw_load_mgr_regs->load_cntr1);
12583da42859SDinh Nguyen 
1259*1273dd9eSMarek Vasut 		writel(RW_MGR_READ_B2B_WAIT1,
1260*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
12613da42859SDinh Nguyen 
1262*1273dd9eSMarek Vasut 		writel(0x10, &sdr_rw_load_mgr_regs->load_cntr2);
1263*1273dd9eSMarek Vasut 		writel(RW_MGR_READ_B2B_WAIT2,
1264*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add2);
12653da42859SDinh Nguyen 
12663da42859SDinh Nguyen 		if (quick_read_mode)
1267*1273dd9eSMarek Vasut 			writel(0x1, &sdr_rw_load_mgr_regs->load_cntr0);
12683da42859SDinh Nguyen 			/* need at least two (1+1) reads to capture failures */
12693da42859SDinh Nguyen 		else if (all_groups)
1270*1273dd9eSMarek Vasut 			writel(0x06, &sdr_rw_load_mgr_regs->load_cntr0);
12713da42859SDinh Nguyen 		else
1272*1273dd9eSMarek Vasut 			writel(0x32, &sdr_rw_load_mgr_regs->load_cntr0);
12733da42859SDinh Nguyen 
1274*1273dd9eSMarek Vasut 		writel(RW_MGR_READ_B2B,
1275*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
12763da42859SDinh Nguyen 		if (all_groups)
12773da42859SDinh Nguyen 			writel(RW_MGR_MEM_IF_READ_DQS_WIDTH *
12783da42859SDinh Nguyen 			       RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS - 1,
1279*1273dd9eSMarek Vasut 			       &sdr_rw_load_mgr_regs->load_cntr3);
12803da42859SDinh Nguyen 		else
1281*1273dd9eSMarek Vasut 			writel(0x0, &sdr_rw_load_mgr_regs->load_cntr3);
12823da42859SDinh Nguyen 
1283*1273dd9eSMarek Vasut 		writel(RW_MGR_READ_B2B,
1284*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add3);
12853da42859SDinh Nguyen 
12863da42859SDinh Nguyen 		tmp_bit_chk = 0;
12873da42859SDinh Nguyen 		for (vg = RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS-1; ; vg--) {
12883da42859SDinh Nguyen 			/* reset the fifos to get pointers to known state */
1289*1273dd9eSMarek Vasut 			writel(0, &phy_mgr_cmd->fifo_reset);
1290*1273dd9eSMarek Vasut 			writel(0, SDR_PHYGRP_RWMGRGRP_ADDRESS |
1291*1273dd9eSMarek Vasut 				  RW_MGR_RESET_READ_DATAPATH_OFFSET);
12923da42859SDinh Nguyen 
12933da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk << (RW_MGR_MEM_DQ_PER_READ_DQS
12943da42859SDinh Nguyen 				/ RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS);
12953da42859SDinh Nguyen 
1296c4815f76SMarek Vasut 			if (all_groups)
1297c4815f76SMarek Vasut 				addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_ALL_GROUPS_OFFSET;
1298c4815f76SMarek Vasut 			else
1299c4815f76SMarek Vasut 				addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
1300c4815f76SMarek Vasut 
130117fdc916SMarek Vasut 			writel(RW_MGR_READ_B2B, addr +
13023da42859SDinh Nguyen 			       ((group * RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS +
13033da42859SDinh Nguyen 			       vg) << 2));
13043da42859SDinh Nguyen 
1305*1273dd9eSMarek Vasut 			base_rw_mgr = readl(SDR_PHYGRP_RWMGRGRP_ADDRESS);
13063da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk | (correct_mask_vg & ~(base_rw_mgr));
13073da42859SDinh Nguyen 
13083da42859SDinh Nguyen 			if (vg == 0)
13093da42859SDinh Nguyen 				break;
13103da42859SDinh Nguyen 		}
13113da42859SDinh Nguyen 		*bit_chk &= tmp_bit_chk;
13123da42859SDinh Nguyen 	}
13133da42859SDinh Nguyen 
1314c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
131517fdc916SMarek Vasut 	writel(RW_MGR_CLEAR_DQS_ENABLE, addr + (group << 2));
13163da42859SDinh Nguyen 
13173da42859SDinh Nguyen 	if (all_correct) {
13183da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
13193da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d read_test(%u,ALL,%u) =>\
13203da42859SDinh Nguyen 			   (%u == %u) => %lu", __func__, __LINE__, group,
13213da42859SDinh Nguyen 			   all_groups, *bit_chk, param->read_correct_mask,
13223da42859SDinh Nguyen 			   (long unsigned int)(*bit_chk ==
13233da42859SDinh Nguyen 			   param->read_correct_mask));
13243da42859SDinh Nguyen 		return *bit_chk == param->read_correct_mask;
13253da42859SDinh Nguyen 	} else	{
13263da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
13273da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d read_test(%u,ONE,%u) =>\
13283da42859SDinh Nguyen 			   (%u != %lu) => %lu\n", __func__, __LINE__,
13293da42859SDinh Nguyen 			   group, all_groups, *bit_chk, (long unsigned int)0,
13303da42859SDinh Nguyen 			   (long unsigned int)(*bit_chk != 0x00));
13313da42859SDinh Nguyen 		return *bit_chk != 0x00;
13323da42859SDinh Nguyen 	}
13333da42859SDinh Nguyen }
13343da42859SDinh Nguyen 
13353da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test_all_ranks(uint32_t group,
13363da42859SDinh Nguyen 	uint32_t num_tries, uint32_t all_correct, uint32_t *bit_chk,
13373da42859SDinh Nguyen 	uint32_t all_groups)
13383da42859SDinh Nguyen {
13393da42859SDinh Nguyen 	return rw_mgr_mem_calibrate_read_test(0, group, num_tries, all_correct,
13403da42859SDinh Nguyen 					      bit_chk, all_groups, 1);
13413da42859SDinh Nguyen }
13423da42859SDinh Nguyen 
13433da42859SDinh Nguyen static void rw_mgr_incr_vfifo(uint32_t grp, uint32_t *v)
13443da42859SDinh Nguyen {
1345*1273dd9eSMarek Vasut 	writel(grp, &phy_mgr_cmd->inc_vfifo_hard_phy);
13463da42859SDinh Nguyen 	(*v)++;
13473da42859SDinh Nguyen }
13483da42859SDinh Nguyen 
13493da42859SDinh Nguyen static void rw_mgr_decr_vfifo(uint32_t grp, uint32_t *v)
13503da42859SDinh Nguyen {
13513da42859SDinh Nguyen 	uint32_t i;
13523da42859SDinh Nguyen 
13533da42859SDinh Nguyen 	for (i = 0; i < VFIFO_SIZE-1; i++)
13543da42859SDinh Nguyen 		rw_mgr_incr_vfifo(grp, v);
13553da42859SDinh Nguyen }
13563da42859SDinh Nguyen 
13573da42859SDinh Nguyen static int find_vfifo_read(uint32_t grp, uint32_t *bit_chk)
13583da42859SDinh Nguyen {
13593da42859SDinh Nguyen 	uint32_t  v;
13603da42859SDinh Nguyen 	uint32_t fail_cnt = 0;
13613da42859SDinh Nguyen 	uint32_t test_status;
13623da42859SDinh Nguyen 
13633da42859SDinh Nguyen 	for (v = 0; v < VFIFO_SIZE; ) {
13643da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: vfifo %u\n",
13653da42859SDinh Nguyen 			   __func__, __LINE__, v);
13663da42859SDinh Nguyen 		test_status = rw_mgr_mem_calibrate_read_test_all_ranks
13673da42859SDinh Nguyen 			(grp, 1, PASS_ONE_BIT, bit_chk, 0);
13683da42859SDinh Nguyen 		if (!test_status) {
13693da42859SDinh Nguyen 			fail_cnt++;
13703da42859SDinh Nguyen 
13713da42859SDinh Nguyen 			if (fail_cnt == 2)
13723da42859SDinh Nguyen 				break;
13733da42859SDinh Nguyen 		}
13743da42859SDinh Nguyen 
13753da42859SDinh Nguyen 		/* fiddle with FIFO */
13763da42859SDinh Nguyen 		rw_mgr_incr_vfifo(grp, &v);
13773da42859SDinh Nguyen 	}
13783da42859SDinh Nguyen 
13793da42859SDinh Nguyen 	if (v >= VFIFO_SIZE) {
13803da42859SDinh Nguyen 		/* no failing read found!! Something must have gone wrong */
13813da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: vfifo failed\n",
13823da42859SDinh Nguyen 			   __func__, __LINE__);
13833da42859SDinh Nguyen 		return 0;
13843da42859SDinh Nguyen 	} else {
13853da42859SDinh Nguyen 		return v;
13863da42859SDinh Nguyen 	}
13873da42859SDinh Nguyen }
13883da42859SDinh Nguyen 
13893da42859SDinh Nguyen static int find_working_phase(uint32_t *grp, uint32_t *bit_chk,
13903da42859SDinh Nguyen 			      uint32_t dtaps_per_ptap, uint32_t *work_bgn,
13913da42859SDinh Nguyen 			      uint32_t *v, uint32_t *d, uint32_t *p,
13923da42859SDinh Nguyen 			      uint32_t *i, uint32_t *max_working_cnt)
13933da42859SDinh Nguyen {
13943da42859SDinh Nguyen 	uint32_t found_begin = 0;
13953da42859SDinh Nguyen 	uint32_t tmp_delay = 0;
13963da42859SDinh Nguyen 	uint32_t test_status;
13973da42859SDinh Nguyen 
13983da42859SDinh Nguyen 	for (*d = 0; *d <= dtaps_per_ptap; (*d)++, tmp_delay +=
13993da42859SDinh Nguyen 		IO_DELAY_PER_DQS_EN_DCHAIN_TAP) {
14003da42859SDinh Nguyen 		*work_bgn = tmp_delay;
14013da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay_all_ranks(*grp, *d);
14023da42859SDinh Nguyen 
14033da42859SDinh Nguyen 		for (*i = 0; *i < VFIFO_SIZE; (*i)++) {
14043da42859SDinh Nguyen 			for (*p = 0; *p <= IO_DQS_EN_PHASE_MAX; (*p)++, *work_bgn +=
14053da42859SDinh Nguyen 				IO_DELAY_PER_OPA_TAP) {
14063da42859SDinh Nguyen 				scc_mgr_set_dqs_en_phase_all_ranks(*grp, *p);
14073da42859SDinh Nguyen 
14083da42859SDinh Nguyen 				test_status =
14093da42859SDinh Nguyen 				rw_mgr_mem_calibrate_read_test_all_ranks
14103da42859SDinh Nguyen 				(*grp, 1, PASS_ONE_BIT, bit_chk, 0);
14113da42859SDinh Nguyen 
14123da42859SDinh Nguyen 				if (test_status) {
14133da42859SDinh Nguyen 					*max_working_cnt = 1;
14143da42859SDinh Nguyen 					found_begin = 1;
14153da42859SDinh Nguyen 					break;
14163da42859SDinh Nguyen 				}
14173da42859SDinh Nguyen 			}
14183da42859SDinh Nguyen 
14193da42859SDinh Nguyen 			if (found_begin)
14203da42859SDinh Nguyen 				break;
14213da42859SDinh Nguyen 
14223da42859SDinh Nguyen 			if (*p > IO_DQS_EN_PHASE_MAX)
14233da42859SDinh Nguyen 				/* fiddle with FIFO */
14243da42859SDinh Nguyen 				rw_mgr_incr_vfifo(*grp, v);
14253da42859SDinh Nguyen 		}
14263da42859SDinh Nguyen 
14273da42859SDinh Nguyen 		if (found_begin)
14283da42859SDinh Nguyen 			break;
14293da42859SDinh Nguyen 	}
14303da42859SDinh Nguyen 
14313da42859SDinh Nguyen 	if (*i >= VFIFO_SIZE) {
14323da42859SDinh Nguyen 		/* cannot find working solution */
14333da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: no vfifo/\
14343da42859SDinh Nguyen 			   ptap/dtap\n", __func__, __LINE__);
14353da42859SDinh Nguyen 		return 0;
14363da42859SDinh Nguyen 	} else {
14373da42859SDinh Nguyen 		return 1;
14383da42859SDinh Nguyen 	}
14393da42859SDinh Nguyen }
14403da42859SDinh Nguyen 
14413da42859SDinh Nguyen static void sdr_backup_phase(uint32_t *grp, uint32_t *bit_chk,
14423da42859SDinh Nguyen 			     uint32_t *work_bgn, uint32_t *v, uint32_t *d,
14433da42859SDinh Nguyen 			     uint32_t *p, uint32_t *max_working_cnt)
14443da42859SDinh Nguyen {
14453da42859SDinh Nguyen 	uint32_t found_begin = 0;
14463da42859SDinh Nguyen 	uint32_t tmp_delay;
14473da42859SDinh Nguyen 
14483da42859SDinh Nguyen 	/* Special case code for backing up a phase */
14493da42859SDinh Nguyen 	if (*p == 0) {
14503da42859SDinh Nguyen 		*p = IO_DQS_EN_PHASE_MAX;
14513da42859SDinh Nguyen 		rw_mgr_decr_vfifo(*grp, v);
14523da42859SDinh Nguyen 	} else {
14533da42859SDinh Nguyen 		(*p)--;
14543da42859SDinh Nguyen 	}
14553da42859SDinh Nguyen 	tmp_delay = *work_bgn - IO_DELAY_PER_OPA_TAP;
14563da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(*grp, *p);
14573da42859SDinh Nguyen 
14583da42859SDinh Nguyen 	for (*d = 0; *d <= IO_DQS_EN_DELAY_MAX && tmp_delay < *work_bgn;
14593da42859SDinh Nguyen 		(*d)++, tmp_delay += IO_DELAY_PER_DQS_EN_DCHAIN_TAP) {
14603da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay_all_ranks(*grp, *d);
14613da42859SDinh Nguyen 
14623da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_read_test_all_ranks(*grp, 1,
14633da42859SDinh Nguyen 							     PASS_ONE_BIT,
14643da42859SDinh Nguyen 							     bit_chk, 0)) {
14653da42859SDinh Nguyen 			found_begin = 1;
14663da42859SDinh Nguyen 			*work_bgn = tmp_delay;
14673da42859SDinh Nguyen 			break;
14683da42859SDinh Nguyen 		}
14693da42859SDinh Nguyen 	}
14703da42859SDinh Nguyen 
14713da42859SDinh Nguyen 	/* We have found a working dtap before the ptap found above */
14723da42859SDinh Nguyen 	if (found_begin == 1)
14733da42859SDinh Nguyen 		(*max_working_cnt)++;
14743da42859SDinh Nguyen 
14753da42859SDinh Nguyen 	/*
14763da42859SDinh Nguyen 	 * Restore VFIFO to old state before we decremented it
14773da42859SDinh Nguyen 	 * (if needed).
14783da42859SDinh Nguyen 	 */
14793da42859SDinh Nguyen 	(*p)++;
14803da42859SDinh Nguyen 	if (*p > IO_DQS_EN_PHASE_MAX) {
14813da42859SDinh Nguyen 		*p = 0;
14823da42859SDinh Nguyen 		rw_mgr_incr_vfifo(*grp, v);
14833da42859SDinh Nguyen 	}
14843da42859SDinh Nguyen 
14853da42859SDinh Nguyen 	scc_mgr_set_dqs_en_delay_all_ranks(*grp, 0);
14863da42859SDinh Nguyen }
14873da42859SDinh Nguyen 
14883da42859SDinh Nguyen static int sdr_nonworking_phase(uint32_t *grp, uint32_t *bit_chk,
14893da42859SDinh Nguyen 			     uint32_t *work_bgn, uint32_t *v, uint32_t *d,
14903da42859SDinh Nguyen 			     uint32_t *p, uint32_t *i, uint32_t *max_working_cnt,
14913da42859SDinh Nguyen 			     uint32_t *work_end)
14923da42859SDinh Nguyen {
14933da42859SDinh Nguyen 	uint32_t found_end = 0;
14943da42859SDinh Nguyen 
14953da42859SDinh Nguyen 	(*p)++;
14963da42859SDinh Nguyen 	*work_end += IO_DELAY_PER_OPA_TAP;
14973da42859SDinh Nguyen 	if (*p > IO_DQS_EN_PHASE_MAX) {
14983da42859SDinh Nguyen 		/* fiddle with FIFO */
14993da42859SDinh Nguyen 		*p = 0;
15003da42859SDinh Nguyen 		rw_mgr_incr_vfifo(*grp, v);
15013da42859SDinh Nguyen 	}
15023da42859SDinh Nguyen 
15033da42859SDinh Nguyen 	for (; *i < VFIFO_SIZE + 1; (*i)++) {
15043da42859SDinh Nguyen 		for (; *p <= IO_DQS_EN_PHASE_MAX; (*p)++, *work_end
15053da42859SDinh Nguyen 			+= IO_DELAY_PER_OPA_TAP) {
15063da42859SDinh Nguyen 			scc_mgr_set_dqs_en_phase_all_ranks(*grp, *p);
15073da42859SDinh Nguyen 
15083da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_read_test_all_ranks
15093da42859SDinh Nguyen 				(*grp, 1, PASS_ONE_BIT, bit_chk, 0)) {
15103da42859SDinh Nguyen 				found_end = 1;
15113da42859SDinh Nguyen 				break;
15123da42859SDinh Nguyen 			} else {
15133da42859SDinh Nguyen 				(*max_working_cnt)++;
15143da42859SDinh Nguyen 			}
15153da42859SDinh Nguyen 		}
15163da42859SDinh Nguyen 
15173da42859SDinh Nguyen 		if (found_end)
15183da42859SDinh Nguyen 			break;
15193da42859SDinh Nguyen 
15203da42859SDinh Nguyen 		if (*p > IO_DQS_EN_PHASE_MAX) {
15213da42859SDinh Nguyen 			/* fiddle with FIFO */
15223da42859SDinh Nguyen 			rw_mgr_incr_vfifo(*grp, v);
15233da42859SDinh Nguyen 			*p = 0;
15243da42859SDinh Nguyen 		}
15253da42859SDinh Nguyen 	}
15263da42859SDinh Nguyen 
15273da42859SDinh Nguyen 	if (*i >= VFIFO_SIZE + 1) {
15283da42859SDinh Nguyen 		/* cannot see edge of failing read */
15293da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d sdr_nonworking_phase: end:\
15303da42859SDinh Nguyen 			   failed\n", __func__, __LINE__);
15313da42859SDinh Nguyen 		return 0;
15323da42859SDinh Nguyen 	} else {
15333da42859SDinh Nguyen 		return 1;
15343da42859SDinh Nguyen 	}
15353da42859SDinh Nguyen }
15363da42859SDinh Nguyen 
15373da42859SDinh Nguyen static int sdr_find_window_centre(uint32_t *grp, uint32_t *bit_chk,
15383da42859SDinh Nguyen 				  uint32_t *work_bgn, uint32_t *v, uint32_t *d,
15393da42859SDinh Nguyen 				  uint32_t *p, uint32_t *work_mid,
15403da42859SDinh Nguyen 				  uint32_t *work_end)
15413da42859SDinh Nguyen {
15423da42859SDinh Nguyen 	int i;
15433da42859SDinh Nguyen 	int tmp_delay = 0;
15443da42859SDinh Nguyen 
15453da42859SDinh Nguyen 	*work_mid = (*work_bgn + *work_end) / 2;
15463da42859SDinh Nguyen 
15473da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "work_bgn=%d work_end=%d work_mid=%d\n",
15483da42859SDinh Nguyen 		   *work_bgn, *work_end, *work_mid);
15493da42859SDinh Nguyen 	/* Get the middle delay to be less than a VFIFO delay */
15503da42859SDinh Nguyen 	for (*p = 0; *p <= IO_DQS_EN_PHASE_MAX;
15513da42859SDinh Nguyen 		(*p)++, tmp_delay += IO_DELAY_PER_OPA_TAP)
15523da42859SDinh Nguyen 		;
15533da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "vfifo ptap delay %d\n", tmp_delay);
15543da42859SDinh Nguyen 	while (*work_mid > tmp_delay)
15553da42859SDinh Nguyen 		*work_mid -= tmp_delay;
15563da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "new work_mid %d\n", *work_mid);
15573da42859SDinh Nguyen 
15583da42859SDinh Nguyen 	tmp_delay = 0;
15593da42859SDinh Nguyen 	for (*p = 0; *p <= IO_DQS_EN_PHASE_MAX && tmp_delay < *work_mid;
15603da42859SDinh Nguyen 		(*p)++, tmp_delay += IO_DELAY_PER_OPA_TAP)
15613da42859SDinh Nguyen 		;
15623da42859SDinh Nguyen 	tmp_delay -= IO_DELAY_PER_OPA_TAP;
15633da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "new p %d, tmp_delay=%d\n", (*p) - 1, tmp_delay);
15643da42859SDinh Nguyen 	for (*d = 0; *d <= IO_DQS_EN_DELAY_MAX && tmp_delay < *work_mid; (*d)++,
15653da42859SDinh Nguyen 		tmp_delay += IO_DELAY_PER_DQS_EN_DCHAIN_TAP)
15663da42859SDinh Nguyen 		;
15673da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "new d %d, tmp_delay=%d\n", *d, tmp_delay);
15683da42859SDinh Nguyen 
15693da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(*grp, (*p) - 1);
15703da42859SDinh Nguyen 	scc_mgr_set_dqs_en_delay_all_ranks(*grp, *d);
15713da42859SDinh Nguyen 
15723da42859SDinh Nguyen 	/*
15733da42859SDinh Nguyen 	 * push vfifo until we can successfully calibrate. We can do this
15743da42859SDinh Nguyen 	 * because the largest possible margin in 1 VFIFO cycle.
15753da42859SDinh Nguyen 	 */
15763da42859SDinh Nguyen 	for (i = 0; i < VFIFO_SIZE; i++) {
15773da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "find_dqs_en_phase: center: vfifo=%u\n",
15783da42859SDinh Nguyen 			   *v);
15793da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_read_test_all_ranks(*grp, 1,
15803da42859SDinh Nguyen 							     PASS_ONE_BIT,
15813da42859SDinh Nguyen 							     bit_chk, 0)) {
15823da42859SDinh Nguyen 			break;
15833da42859SDinh Nguyen 		}
15843da42859SDinh Nguyen 
15853da42859SDinh Nguyen 		/* fiddle with FIFO */
15863da42859SDinh Nguyen 		rw_mgr_incr_vfifo(*grp, v);
15873da42859SDinh Nguyen 	}
15883da42859SDinh Nguyen 
15893da42859SDinh Nguyen 	if (i >= VFIFO_SIZE) {
15903da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: center: \
15913da42859SDinh Nguyen 			   failed\n", __func__, __LINE__);
15923da42859SDinh Nguyen 		return 0;
15933da42859SDinh Nguyen 	} else {
15943da42859SDinh Nguyen 		return 1;
15953da42859SDinh Nguyen 	}
15963da42859SDinh Nguyen }
15973da42859SDinh Nguyen 
15983da42859SDinh Nguyen /* find a good dqs enable to use */
15993da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase(uint32_t grp)
16003da42859SDinh Nguyen {
16013da42859SDinh Nguyen 	uint32_t v, d, p, i;
16023da42859SDinh Nguyen 	uint32_t max_working_cnt;
16033da42859SDinh Nguyen 	uint32_t bit_chk;
16043da42859SDinh Nguyen 	uint32_t dtaps_per_ptap;
16053da42859SDinh Nguyen 	uint32_t work_bgn, work_mid, work_end;
16063da42859SDinh Nguyen 	uint32_t found_passing_read, found_failing_read, initial_failing_dtap;
16073da42859SDinh Nguyen 
16083da42859SDinh Nguyen 	debug("%s:%d %u\n", __func__, __LINE__, grp);
16093da42859SDinh Nguyen 
16103da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_VFIFO_CENTER);
16113da42859SDinh Nguyen 
16123da42859SDinh Nguyen 	scc_mgr_set_dqs_en_delay_all_ranks(grp, 0);
16133da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(grp, 0);
16143da42859SDinh Nguyen 
16153da42859SDinh Nguyen 	/* ************************************************************** */
16163da42859SDinh Nguyen 	/* * Step 0 : Determine number of delay taps for each phase tap * */
16173da42859SDinh Nguyen 	dtaps_per_ptap = IO_DELAY_PER_OPA_TAP/IO_DELAY_PER_DQS_EN_DCHAIN_TAP;
16183da42859SDinh Nguyen 
16193da42859SDinh Nguyen 	/* ********************************************************* */
16203da42859SDinh Nguyen 	/* * Step 1 : First push vfifo until we get a failing read * */
16213da42859SDinh Nguyen 	v = find_vfifo_read(grp, &bit_chk);
16223da42859SDinh Nguyen 
16233da42859SDinh Nguyen 	max_working_cnt = 0;
16243da42859SDinh Nguyen 
16253da42859SDinh Nguyen 	/* ******************************************************** */
16263da42859SDinh Nguyen 	/* * step 2: find first working phase, increment in ptaps * */
16273da42859SDinh Nguyen 	work_bgn = 0;
16283da42859SDinh Nguyen 	if (find_working_phase(&grp, &bit_chk, dtaps_per_ptap, &work_bgn, &v, &d,
16293da42859SDinh Nguyen 				&p, &i, &max_working_cnt) == 0)
16303da42859SDinh Nguyen 		return 0;
16313da42859SDinh Nguyen 
16323da42859SDinh Nguyen 	work_end = work_bgn;
16333da42859SDinh Nguyen 
16343da42859SDinh Nguyen 	/*
16353da42859SDinh Nguyen 	 * If d is 0 then the working window covers a phase tap and
16363da42859SDinh Nguyen 	 * we can follow the old procedure otherwise, we've found the beginning,
16373da42859SDinh Nguyen 	 * and we need to increment the dtaps until we find the end.
16383da42859SDinh Nguyen 	 */
16393da42859SDinh Nguyen 	if (d == 0) {
16403da42859SDinh Nguyen 		/* ********************************************************* */
16413da42859SDinh Nguyen 		/* * step 3a: if we have room, back off by one and
16423da42859SDinh Nguyen 		increment in dtaps * */
16433da42859SDinh Nguyen 
16443da42859SDinh Nguyen 		sdr_backup_phase(&grp, &bit_chk, &work_bgn, &v, &d, &p,
16453da42859SDinh Nguyen 				 &max_working_cnt);
16463da42859SDinh Nguyen 
16473da42859SDinh Nguyen 		/* ********************************************************* */
16483da42859SDinh Nguyen 		/* * step 4a: go forward from working phase to non working
16493da42859SDinh Nguyen 		phase, increment in ptaps * */
16503da42859SDinh Nguyen 		if (sdr_nonworking_phase(&grp, &bit_chk, &work_bgn, &v, &d, &p,
16513da42859SDinh Nguyen 					 &i, &max_working_cnt, &work_end) == 0)
16523da42859SDinh Nguyen 			return 0;
16533da42859SDinh Nguyen 
16543da42859SDinh Nguyen 		/* ********************************************************* */
16553da42859SDinh Nguyen 		/* * step 5a:  back off one from last, increment in dtaps  * */
16563da42859SDinh Nguyen 
16573da42859SDinh Nguyen 		/* Special case code for backing up a phase */
16583da42859SDinh Nguyen 		if (p == 0) {
16593da42859SDinh Nguyen 			p = IO_DQS_EN_PHASE_MAX;
16603da42859SDinh Nguyen 			rw_mgr_decr_vfifo(grp, &v);
16613da42859SDinh Nguyen 		} else {
16623da42859SDinh Nguyen 			p = p - 1;
16633da42859SDinh Nguyen 		}
16643da42859SDinh Nguyen 
16653da42859SDinh Nguyen 		work_end -= IO_DELAY_PER_OPA_TAP;
16663da42859SDinh Nguyen 		scc_mgr_set_dqs_en_phase_all_ranks(grp, p);
16673da42859SDinh Nguyen 
16683da42859SDinh Nguyen 		/* * The actual increment of dtaps is done outside of
16693da42859SDinh Nguyen 		the if/else loop to share code */
16703da42859SDinh Nguyen 		d = 0;
16713da42859SDinh Nguyen 
16723da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: v/p: \
16733da42859SDinh Nguyen 			   vfifo=%u ptap=%u\n", __func__, __LINE__,
16743da42859SDinh Nguyen 			   v, p);
16753da42859SDinh Nguyen 	} else {
16763da42859SDinh Nguyen 		/* ******************************************************* */
16773da42859SDinh Nguyen 		/* * step 3-5b:  Find the right edge of the window using
16783da42859SDinh Nguyen 		delay taps   * */
16793da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase:vfifo=%u \
16803da42859SDinh Nguyen 			   ptap=%u dtap=%u bgn=%u\n", __func__, __LINE__,
16813da42859SDinh Nguyen 			   v, p, d, work_bgn);
16823da42859SDinh Nguyen 
16833da42859SDinh Nguyen 		work_end = work_bgn;
16843da42859SDinh Nguyen 
16853da42859SDinh Nguyen 		/* * The actual increment of dtaps is done outside of the
16863da42859SDinh Nguyen 		if/else loop to share code */
16873da42859SDinh Nguyen 
16883da42859SDinh Nguyen 		/* Only here to counterbalance a subtract later on which is
16893da42859SDinh Nguyen 		not needed if this branch of the algorithm is taken */
16903da42859SDinh Nguyen 		max_working_cnt++;
16913da42859SDinh Nguyen 	}
16923da42859SDinh Nguyen 
16933da42859SDinh Nguyen 	/* The dtap increment to find the failing edge is done here */
16943da42859SDinh Nguyen 	for (; d <= IO_DQS_EN_DELAY_MAX; d++, work_end +=
16953da42859SDinh Nguyen 		IO_DELAY_PER_DQS_EN_DCHAIN_TAP) {
16963da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: \
16973da42859SDinh Nguyen 				   end-2: dtap=%u\n", __func__, __LINE__, d);
16983da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay_all_ranks(grp, d);
16993da42859SDinh Nguyen 
17003da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_read_test_all_ranks(grp, 1,
17013da42859SDinh Nguyen 								      PASS_ONE_BIT,
17023da42859SDinh Nguyen 								      &bit_chk, 0)) {
17033da42859SDinh Nguyen 				break;
17043da42859SDinh Nguyen 			}
17053da42859SDinh Nguyen 	}
17063da42859SDinh Nguyen 
17073da42859SDinh Nguyen 	/* Go back to working dtap */
17083da42859SDinh Nguyen 	if (d != 0)
17093da42859SDinh Nguyen 		work_end -= IO_DELAY_PER_DQS_EN_DCHAIN_TAP;
17103da42859SDinh Nguyen 
17113da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: v/p/d: vfifo=%u \
17123da42859SDinh Nguyen 		   ptap=%u dtap=%u end=%u\n", __func__, __LINE__,
17133da42859SDinh Nguyen 		   v, p, d-1, work_end);
17143da42859SDinh Nguyen 
17153da42859SDinh Nguyen 	if (work_end < work_bgn) {
17163da42859SDinh Nguyen 		/* nil range */
17173da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: end-2: \
17183da42859SDinh Nguyen 			   failed\n", __func__, __LINE__);
17193da42859SDinh Nguyen 		return 0;
17203da42859SDinh Nguyen 	}
17213da42859SDinh Nguyen 
17223da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: found range [%u,%u]\n",
17233da42859SDinh Nguyen 		   __func__, __LINE__, work_bgn, work_end);
17243da42859SDinh Nguyen 
17253da42859SDinh Nguyen 	/* *************************************************************** */
17263da42859SDinh Nguyen 	/*
17273da42859SDinh Nguyen 	 * * We need to calculate the number of dtaps that equal a ptap
17283da42859SDinh Nguyen 	 * * To do that we'll back up a ptap and re-find the edge of the
17293da42859SDinh Nguyen 	 * * window using dtaps
17303da42859SDinh Nguyen 	 */
17313da42859SDinh Nguyen 
17323da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: calculate dtaps_per_ptap \
17333da42859SDinh Nguyen 		   for tracking\n", __func__, __LINE__);
17343da42859SDinh Nguyen 
17353da42859SDinh Nguyen 	/* Special case code for backing up a phase */
17363da42859SDinh Nguyen 	if (p == 0) {
17373da42859SDinh Nguyen 		p = IO_DQS_EN_PHASE_MAX;
17383da42859SDinh Nguyen 		rw_mgr_decr_vfifo(grp, &v);
17393da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: backedup \
17403da42859SDinh Nguyen 			   cycle/phase: v=%u p=%u\n", __func__, __LINE__,
17413da42859SDinh Nguyen 			   v, p);
17423da42859SDinh Nguyen 	} else {
17433da42859SDinh Nguyen 		p = p - 1;
17443da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: backedup \
17453da42859SDinh Nguyen 			   phase only: v=%u p=%u", __func__, __LINE__,
17463da42859SDinh Nguyen 			   v, p);
17473da42859SDinh Nguyen 	}
17483da42859SDinh Nguyen 
17493da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(grp, p);
17503da42859SDinh Nguyen 
17513da42859SDinh Nguyen 	/*
17523da42859SDinh Nguyen 	 * Increase dtap until we first see a passing read (in case the
17533da42859SDinh Nguyen 	 * window is smaller than a ptap),
17543da42859SDinh Nguyen 	 * and then a failing read to mark the edge of the window again
17553da42859SDinh Nguyen 	 */
17563da42859SDinh Nguyen 
17573da42859SDinh Nguyen 	/* Find a passing read */
17583da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: find passing read\n",
17593da42859SDinh Nguyen 		   __func__, __LINE__);
17603da42859SDinh Nguyen 	found_passing_read = 0;
17613da42859SDinh Nguyen 	found_failing_read = 0;
17623da42859SDinh Nguyen 	initial_failing_dtap = d;
17633da42859SDinh Nguyen 	for (; d <= IO_DQS_EN_DELAY_MAX; d++) {
17643da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: testing \
17653da42859SDinh Nguyen 			   read d=%u\n", __func__, __LINE__, d);
17663da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay_all_ranks(grp, d);
17673da42859SDinh Nguyen 
17683da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_read_test_all_ranks(grp, 1,
17693da42859SDinh Nguyen 							     PASS_ONE_BIT,
17703da42859SDinh Nguyen 							     &bit_chk, 0)) {
17713da42859SDinh Nguyen 			found_passing_read = 1;
17723da42859SDinh Nguyen 			break;
17733da42859SDinh Nguyen 		}
17743da42859SDinh Nguyen 	}
17753da42859SDinh Nguyen 
17763da42859SDinh Nguyen 	if (found_passing_read) {
17773da42859SDinh Nguyen 		/* Find a failing read */
17783da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: find failing \
17793da42859SDinh Nguyen 			   read\n", __func__, __LINE__);
17803da42859SDinh Nguyen 		for (d = d + 1; d <= IO_DQS_EN_DELAY_MAX; d++) {
17813da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: \
17823da42859SDinh Nguyen 				   testing read d=%u\n", __func__, __LINE__, d);
17833da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay_all_ranks(grp, d);
17843da42859SDinh Nguyen 
17853da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_read_test_all_ranks
17863da42859SDinh Nguyen 				(grp, 1, PASS_ONE_BIT, &bit_chk, 0)) {
17873da42859SDinh Nguyen 				found_failing_read = 1;
17883da42859SDinh Nguyen 				break;
17893da42859SDinh Nguyen 			}
17903da42859SDinh Nguyen 		}
17913da42859SDinh Nguyen 	} else {
17923da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d find_dqs_en_phase: failed to \
17933da42859SDinh Nguyen 			   calculate dtaps", __func__, __LINE__);
17943da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "per ptap. Fall back on static value\n");
17953da42859SDinh Nguyen 	}
17963da42859SDinh Nguyen 
17973da42859SDinh Nguyen 	/*
17983da42859SDinh Nguyen 	 * The dynamically calculated dtaps_per_ptap is only valid if we
17993da42859SDinh Nguyen 	 * found a passing/failing read. If we didn't, it means d hit the max
18003da42859SDinh Nguyen 	 * (IO_DQS_EN_DELAY_MAX). Otherwise, dtaps_per_ptap retains its
18013da42859SDinh Nguyen 	 * statically calculated value.
18023da42859SDinh Nguyen 	 */
18033da42859SDinh Nguyen 	if (found_passing_read && found_failing_read)
18043da42859SDinh Nguyen 		dtaps_per_ptap = d - initial_failing_dtap;
18053da42859SDinh Nguyen 
1806*1273dd9eSMarek Vasut 	writel(dtaps_per_ptap, &sdr_reg_file->dtaps_per_ptap);
18073da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: dtaps_per_ptap=%u \
18083da42859SDinh Nguyen 		   - %u = %u",  __func__, __LINE__, d,
18093da42859SDinh Nguyen 		   initial_failing_dtap, dtaps_per_ptap);
18103da42859SDinh Nguyen 
18113da42859SDinh Nguyen 	/* ******************************************** */
18123da42859SDinh Nguyen 	/* * step 6:  Find the centre of the window   * */
18133da42859SDinh Nguyen 	if (sdr_find_window_centre(&grp, &bit_chk, &work_bgn, &v, &d, &p,
18143da42859SDinh Nguyen 				   &work_mid, &work_end) == 0)
18153da42859SDinh Nguyen 		return 0;
18163da42859SDinh Nguyen 
18173da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: center found: \
18183da42859SDinh Nguyen 		   vfifo=%u ptap=%u dtap=%u\n", __func__, __LINE__,
18193da42859SDinh Nguyen 		   v, p-1, d);
18203da42859SDinh Nguyen 	return 1;
18213da42859SDinh Nguyen }
18223da42859SDinh Nguyen 
18233da42859SDinh Nguyen /*
18243da42859SDinh Nguyen  * Try rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase across different
18253da42859SDinh Nguyen  * dq_in_delay values
18263da42859SDinh Nguyen  */
18273da42859SDinh Nguyen static uint32_t
18283da42859SDinh Nguyen rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase_sweep_dq_in_delay
18293da42859SDinh Nguyen (uint32_t write_group, uint32_t read_group, uint32_t test_bgn)
18303da42859SDinh Nguyen {
18313da42859SDinh Nguyen 	uint32_t found;
18323da42859SDinh Nguyen 	uint32_t i;
18333da42859SDinh Nguyen 	uint32_t p;
18343da42859SDinh Nguyen 	uint32_t d;
18353da42859SDinh Nguyen 	uint32_t r;
18363da42859SDinh Nguyen 
18373da42859SDinh Nguyen 	const uint32_t delay_step = IO_IO_IN_DELAY_MAX /
18383da42859SDinh Nguyen 		(RW_MGR_MEM_DQ_PER_READ_DQS-1);
18393da42859SDinh Nguyen 		/* we start at zero, so have one less dq to devide among */
18403da42859SDinh Nguyen 
18413da42859SDinh Nguyen 	debug("%s:%d (%u,%u,%u)", __func__, __LINE__, write_group, read_group,
18423da42859SDinh Nguyen 	      test_bgn);
18433da42859SDinh Nguyen 
18443da42859SDinh Nguyen 	/* try different dq_in_delays since the dq path is shorter than dqs */
18453da42859SDinh Nguyen 
18463da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
18473da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
18483da42859SDinh Nguyen 		for (i = 0, p = test_bgn, d = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS;
18493da42859SDinh Nguyen 			i++, p++, d += delay_step) {
18503da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d rw_mgr_mem_calibrate_\
18513da42859SDinh Nguyen 				   vfifo_find_dqs_", __func__, __LINE__);
18523da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "en_phase_sweep_dq_in_delay: g=%u/%u ",
18533da42859SDinh Nguyen 			       write_group, read_group);
18543da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "r=%u, i=%u p=%u d=%u\n", r, i , p, d);
18553da42859SDinh Nguyen 			scc_mgr_set_dq_in_delay(write_group, p, d);
18563da42859SDinh Nguyen 			scc_mgr_load_dq(p);
18573da42859SDinh Nguyen 		}
1858*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
18593da42859SDinh Nguyen 	}
18603da42859SDinh Nguyen 
18613da42859SDinh Nguyen 	found = rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase(read_group);
18623da42859SDinh Nguyen 
18633da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d rw_mgr_mem_calibrate_vfifo_find_dqs_\
18643da42859SDinh Nguyen 		   en_phase_sweep_dq", __func__, __LINE__);
18653da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "_in_delay: g=%u/%u found=%u; Reseting delay \
18663da42859SDinh Nguyen 		   chain to zero\n", write_group, read_group, found);
18673da42859SDinh Nguyen 
18683da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
18693da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
18703da42859SDinh Nguyen 		for (i = 0, p = test_bgn; i < RW_MGR_MEM_DQ_PER_READ_DQS;
18713da42859SDinh Nguyen 			i++, p++) {
18723da42859SDinh Nguyen 			scc_mgr_set_dq_in_delay(write_group, p, 0);
18733da42859SDinh Nguyen 			scc_mgr_load_dq(p);
18743da42859SDinh Nguyen 		}
1875*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
18763da42859SDinh Nguyen 	}
18773da42859SDinh Nguyen 
18783da42859SDinh Nguyen 	return found;
18793da42859SDinh Nguyen }
18803da42859SDinh Nguyen 
18813da42859SDinh Nguyen /* per-bit deskew DQ and center */
18823da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo_center(uint32_t rank_bgn,
18833da42859SDinh Nguyen 	uint32_t write_group, uint32_t read_group, uint32_t test_bgn,
18843da42859SDinh Nguyen 	uint32_t use_read_test, uint32_t update_fom)
18853da42859SDinh Nguyen {
18863da42859SDinh Nguyen 	uint32_t i, p, d, min_index;
18873da42859SDinh Nguyen 	/*
18883da42859SDinh Nguyen 	 * Store these as signed since there are comparisons with
18893da42859SDinh Nguyen 	 * signed numbers.
18903da42859SDinh Nguyen 	 */
18913da42859SDinh Nguyen 	uint32_t bit_chk;
18923da42859SDinh Nguyen 	uint32_t sticky_bit_chk;
18933da42859SDinh Nguyen 	int32_t left_edge[RW_MGR_MEM_DQ_PER_READ_DQS];
18943da42859SDinh Nguyen 	int32_t right_edge[RW_MGR_MEM_DQ_PER_READ_DQS];
18953da42859SDinh Nguyen 	int32_t final_dq[RW_MGR_MEM_DQ_PER_READ_DQS];
18963da42859SDinh Nguyen 	int32_t mid;
18973da42859SDinh Nguyen 	int32_t orig_mid_min, mid_min;
18983da42859SDinh Nguyen 	int32_t new_dqs, start_dqs, start_dqs_en, shift_dq, final_dqs,
18993da42859SDinh Nguyen 		final_dqs_en;
19003da42859SDinh Nguyen 	int32_t dq_margin, dqs_margin;
19013da42859SDinh Nguyen 	uint32_t stop;
19023da42859SDinh Nguyen 	uint32_t temp_dq_in_delay1, temp_dq_in_delay2;
19033da42859SDinh Nguyen 	uint32_t addr;
19043da42859SDinh Nguyen 
19053da42859SDinh Nguyen 	debug("%s:%d: %u %u", __func__, __LINE__, read_group, test_bgn);
19063da42859SDinh Nguyen 
1907c4815f76SMarek Vasut 	addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQS_IN_DELAY_OFFSET;
190817fdc916SMarek Vasut 	start_dqs = readl(addr + (read_group << 2));
19093da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS)
191017fdc916SMarek Vasut 		start_dqs_en = readl(addr + ((read_group << 2)
19113da42859SDinh Nguyen 				     - IO_DQS_EN_DELAY_OFFSET));
19123da42859SDinh Nguyen 
19133da42859SDinh Nguyen 	/* set the left and right edge of each bit to an illegal value */
19143da42859SDinh Nguyen 	/* use (IO_IO_IN_DELAY_MAX + 1) as an illegal value */
19153da42859SDinh Nguyen 	sticky_bit_chk = 0;
19163da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
19173da42859SDinh Nguyen 		left_edge[i]  = IO_IO_IN_DELAY_MAX + 1;
19183da42859SDinh Nguyen 		right_edge[i] = IO_IO_IN_DELAY_MAX + 1;
19193da42859SDinh Nguyen 	}
19203da42859SDinh Nguyen 
19213da42859SDinh Nguyen 	/* Search for the left edge of the window for each bit */
19223da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_IN_DELAY_MAX; d++) {
19233da42859SDinh Nguyen 		scc_mgr_apply_group_dq_in_delay(write_group, test_bgn, d);
19243da42859SDinh Nguyen 
1925*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
19263da42859SDinh Nguyen 
19273da42859SDinh Nguyen 		/*
19283da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
19293da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
19303da42859SDinh Nguyen 		 */
19313da42859SDinh Nguyen 		if (use_read_test) {
19323da42859SDinh Nguyen 			stop = !rw_mgr_mem_calibrate_read_test(rank_bgn,
19333da42859SDinh Nguyen 				read_group, NUM_READ_PB_TESTS, PASS_ONE_BIT,
19343da42859SDinh Nguyen 				&bit_chk, 0, 0);
19353da42859SDinh Nguyen 		} else {
19363da42859SDinh Nguyen 			rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
19373da42859SDinh Nguyen 							0, PASS_ONE_BIT,
19383da42859SDinh Nguyen 							&bit_chk, 0);
19393da42859SDinh Nguyen 			bit_chk = bit_chk >> (RW_MGR_MEM_DQ_PER_READ_DQS *
19403da42859SDinh Nguyen 				(read_group - (write_group *
19413da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
19423da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH)));
19433da42859SDinh Nguyen 			stop = (bit_chk == 0);
19443da42859SDinh Nguyen 		}
19453da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
19463da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->read_correct_mask);
19473da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center(left): dtap=%u => %u == %u \
19483da42859SDinh Nguyen 			   && %u", __func__, __LINE__, d,
19493da42859SDinh Nguyen 			   sticky_bit_chk,
19503da42859SDinh Nguyen 			param->read_correct_mask, stop);
19513da42859SDinh Nguyen 
19523da42859SDinh Nguyen 		if (stop == 1) {
19533da42859SDinh Nguyen 			break;
19543da42859SDinh Nguyen 		} else {
19553da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
19563da42859SDinh Nguyen 				if (bit_chk & 1) {
19573da42859SDinh Nguyen 					/* Remember a passing test as the
19583da42859SDinh Nguyen 					left_edge */
19593da42859SDinh Nguyen 					left_edge[i] = d;
19603da42859SDinh Nguyen 				} else {
19613da42859SDinh Nguyen 					/* If a left edge has not been seen yet,
19623da42859SDinh Nguyen 					then a future passing test will mark
19633da42859SDinh Nguyen 					this edge as the right edge */
19643da42859SDinh Nguyen 					if (left_edge[i] ==
19653da42859SDinh Nguyen 						IO_IO_IN_DELAY_MAX + 1) {
19663da42859SDinh Nguyen 						right_edge[i] = -(d + 1);
19673da42859SDinh Nguyen 					}
19683da42859SDinh Nguyen 				}
19693da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
19703da42859SDinh Nguyen 			}
19713da42859SDinh Nguyen 		}
19723da42859SDinh Nguyen 	}
19733da42859SDinh Nguyen 
19743da42859SDinh Nguyen 	/* Reset DQ delay chains to 0 */
19753da42859SDinh Nguyen 	scc_mgr_apply_group_dq_in_delay(write_group, test_bgn, 0);
19763da42859SDinh Nguyen 	sticky_bit_chk = 0;
19773da42859SDinh Nguyen 	for (i = RW_MGR_MEM_DQ_PER_READ_DQS - 1;; i--) {
19783da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center: left_edge[%u]: \
19793da42859SDinh Nguyen 			   %d right_edge[%u]: %d\n", __func__, __LINE__,
19803da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
19813da42859SDinh Nguyen 
19823da42859SDinh Nguyen 		/*
19833da42859SDinh Nguyen 		 * Check for cases where we haven't found the left edge,
19843da42859SDinh Nguyen 		 * which makes our assignment of the the right edge invalid.
19853da42859SDinh Nguyen 		 * Reset it to the illegal value.
19863da42859SDinh Nguyen 		 */
19873da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_IN_DELAY_MAX + 1) && (
19883da42859SDinh Nguyen 			right_edge[i] != IO_IO_IN_DELAY_MAX + 1)) {
19893da42859SDinh Nguyen 			right_edge[i] = IO_IO_IN_DELAY_MAX + 1;
19903da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d vfifo_center: reset \
19913da42859SDinh Nguyen 				   right_edge[%u]: %d\n", __func__, __LINE__,
19923da42859SDinh Nguyen 				   i, right_edge[i]);
19933da42859SDinh Nguyen 		}
19943da42859SDinh Nguyen 
19953da42859SDinh Nguyen 		/*
19963da42859SDinh Nguyen 		 * Reset sticky bit (except for bits where we have seen
19973da42859SDinh Nguyen 		 * both the left and right edge).
19983da42859SDinh Nguyen 		 */
19993da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk << 1;
20003da42859SDinh Nguyen 		if ((left_edge[i] != IO_IO_IN_DELAY_MAX + 1) &&
20013da42859SDinh Nguyen 		    (right_edge[i] != IO_IO_IN_DELAY_MAX + 1)) {
20023da42859SDinh Nguyen 			sticky_bit_chk = sticky_bit_chk | 1;
20033da42859SDinh Nguyen 		}
20043da42859SDinh Nguyen 
20053da42859SDinh Nguyen 		if (i == 0)
20063da42859SDinh Nguyen 			break;
20073da42859SDinh Nguyen 	}
20083da42859SDinh Nguyen 
20093da42859SDinh Nguyen 	/* Search for the right edge of the window for each bit */
20103da42859SDinh Nguyen 	for (d = 0; d <= IO_DQS_IN_DELAY_MAX - start_dqs; d++) {
20113da42859SDinh Nguyen 		scc_mgr_set_dqs_bus_in_delay(read_group, d + start_dqs);
20123da42859SDinh Nguyen 		if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
20133da42859SDinh Nguyen 			uint32_t delay = d + start_dqs_en;
20143da42859SDinh Nguyen 			if (delay > IO_DQS_EN_DELAY_MAX)
20153da42859SDinh Nguyen 				delay = IO_DQS_EN_DELAY_MAX;
20163da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay(read_group, delay);
20173da42859SDinh Nguyen 		}
20183da42859SDinh Nguyen 		scc_mgr_load_dqs(read_group);
20193da42859SDinh Nguyen 
2020*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
20213da42859SDinh Nguyen 
20223da42859SDinh Nguyen 		/*
20233da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
20243da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
20253da42859SDinh Nguyen 		 */
20263da42859SDinh Nguyen 		if (use_read_test) {
20273da42859SDinh Nguyen 			stop = !rw_mgr_mem_calibrate_read_test(rank_bgn,
20283da42859SDinh Nguyen 				read_group, NUM_READ_PB_TESTS, PASS_ONE_BIT,
20293da42859SDinh Nguyen 				&bit_chk, 0, 0);
20303da42859SDinh Nguyen 		} else {
20313da42859SDinh Nguyen 			rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
20323da42859SDinh Nguyen 							0, PASS_ONE_BIT,
20333da42859SDinh Nguyen 							&bit_chk, 0);
20343da42859SDinh Nguyen 			bit_chk = bit_chk >> (RW_MGR_MEM_DQ_PER_READ_DQS *
20353da42859SDinh Nguyen 				(read_group - (write_group *
20363da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
20373da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH)));
20383da42859SDinh Nguyen 			stop = (bit_chk == 0);
20393da42859SDinh Nguyen 		}
20403da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
20413da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->read_correct_mask);
20423da42859SDinh Nguyen 
20433da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center(right): dtap=%u => %u == \
20443da42859SDinh Nguyen 			   %u && %u", __func__, __LINE__, d,
20453da42859SDinh Nguyen 			   sticky_bit_chk, param->read_correct_mask, stop);
20463da42859SDinh Nguyen 
20473da42859SDinh Nguyen 		if (stop == 1) {
20483da42859SDinh Nguyen 			break;
20493da42859SDinh Nguyen 		} else {
20503da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
20513da42859SDinh Nguyen 				if (bit_chk & 1) {
20523da42859SDinh Nguyen 					/* Remember a passing test as
20533da42859SDinh Nguyen 					the right_edge */
20543da42859SDinh Nguyen 					right_edge[i] = d;
20553da42859SDinh Nguyen 				} else {
20563da42859SDinh Nguyen 					if (d != 0) {
20573da42859SDinh Nguyen 						/* If a right edge has not been
20583da42859SDinh Nguyen 						seen yet, then a future passing
20593da42859SDinh Nguyen 						test will mark this edge as the
20603da42859SDinh Nguyen 						left edge */
20613da42859SDinh Nguyen 						if (right_edge[i] ==
20623da42859SDinh Nguyen 						IO_IO_IN_DELAY_MAX + 1) {
20633da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
20643da42859SDinh Nguyen 						}
20653da42859SDinh Nguyen 					} else {
20663da42859SDinh Nguyen 						/* d = 0 failed, but it passed
20673da42859SDinh Nguyen 						when testing the left edge,
20683da42859SDinh Nguyen 						so it must be marginal,
20693da42859SDinh Nguyen 						set it to -1 */
20703da42859SDinh Nguyen 						if (right_edge[i] ==
20713da42859SDinh Nguyen 							IO_IO_IN_DELAY_MAX + 1 &&
20723da42859SDinh Nguyen 							left_edge[i] !=
20733da42859SDinh Nguyen 							IO_IO_IN_DELAY_MAX
20743da42859SDinh Nguyen 							+ 1) {
20753da42859SDinh Nguyen 							right_edge[i] = -1;
20763da42859SDinh Nguyen 						}
20773da42859SDinh Nguyen 						/* If a right edge has not been
20783da42859SDinh Nguyen 						seen yet, then a future passing
20793da42859SDinh Nguyen 						test will mark this edge as the
20803da42859SDinh Nguyen 						left edge */
20813da42859SDinh Nguyen 						else if (right_edge[i] ==
20823da42859SDinh Nguyen 							IO_IO_IN_DELAY_MAX +
20833da42859SDinh Nguyen 							1) {
20843da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
20853da42859SDinh Nguyen 						}
20863da42859SDinh Nguyen 					}
20873da42859SDinh Nguyen 				}
20883da42859SDinh Nguyen 
20893da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "%s:%d vfifo_center[r,\
20903da42859SDinh Nguyen 					   d=%u]: ", __func__, __LINE__, d);
20913da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "bit_chk_test=%d left_edge[%u]: %d ",
20923da42859SDinh Nguyen 					   (int)(bit_chk & 1), i, left_edge[i]);
20933da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "right_edge[%u]: %d\n", i,
20943da42859SDinh Nguyen 					   right_edge[i]);
20953da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
20963da42859SDinh Nguyen 			}
20973da42859SDinh Nguyen 		}
20983da42859SDinh Nguyen 	}
20993da42859SDinh Nguyen 
21003da42859SDinh Nguyen 	/* Check that all bits have a window */
21013da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
21023da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center: left_edge[%u]: \
21033da42859SDinh Nguyen 			   %d right_edge[%u]: %d", __func__, __LINE__,
21043da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
21053da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_IN_DELAY_MAX + 1) || (right_edge[i]
21063da42859SDinh Nguyen 			== IO_IO_IN_DELAY_MAX + 1)) {
21073da42859SDinh Nguyen 			/*
21083da42859SDinh Nguyen 			 * Restore delay chain settings before letting the loop
21093da42859SDinh Nguyen 			 * in rw_mgr_mem_calibrate_vfifo to retry different
21103da42859SDinh Nguyen 			 * dqs/ck relationships.
21113da42859SDinh Nguyen 			 */
21123da42859SDinh Nguyen 			scc_mgr_set_dqs_bus_in_delay(read_group, start_dqs);
21133da42859SDinh Nguyen 			if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
21143da42859SDinh Nguyen 				scc_mgr_set_dqs_en_delay(read_group,
21153da42859SDinh Nguyen 							 start_dqs_en);
21163da42859SDinh Nguyen 			}
21173da42859SDinh Nguyen 			scc_mgr_load_dqs(read_group);
2118*1273dd9eSMarek Vasut 			writel(0, &sdr_scc_mgr->update);
21193da42859SDinh Nguyen 
21203da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d vfifo_center: failed to \
21213da42859SDinh Nguyen 				   find edge [%u]: %d %d", __func__, __LINE__,
21223da42859SDinh Nguyen 				   i, left_edge[i], right_edge[i]);
21233da42859SDinh Nguyen 			if (use_read_test) {
21243da42859SDinh Nguyen 				set_failing_group_stage(read_group *
21253da42859SDinh Nguyen 					RW_MGR_MEM_DQ_PER_READ_DQS + i,
21263da42859SDinh Nguyen 					CAL_STAGE_VFIFO,
21273da42859SDinh Nguyen 					CAL_SUBSTAGE_VFIFO_CENTER);
21283da42859SDinh Nguyen 			} else {
21293da42859SDinh Nguyen 				set_failing_group_stage(read_group *
21303da42859SDinh Nguyen 					RW_MGR_MEM_DQ_PER_READ_DQS + i,
21313da42859SDinh Nguyen 					CAL_STAGE_VFIFO_AFTER_WRITES,
21323da42859SDinh Nguyen 					CAL_SUBSTAGE_VFIFO_CENTER);
21333da42859SDinh Nguyen 			}
21343da42859SDinh Nguyen 			return 0;
21353da42859SDinh Nguyen 		}
21363da42859SDinh Nguyen 	}
21373da42859SDinh Nguyen 
21383da42859SDinh Nguyen 	/* Find middle of window for each DQ bit */
21393da42859SDinh Nguyen 	mid_min = left_edge[0] - right_edge[0];
21403da42859SDinh Nguyen 	min_index = 0;
21413da42859SDinh Nguyen 	for (i = 1; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
21423da42859SDinh Nguyen 		mid = left_edge[i] - right_edge[i];
21433da42859SDinh Nguyen 		if (mid < mid_min) {
21443da42859SDinh Nguyen 			mid_min = mid;
21453da42859SDinh Nguyen 			min_index = i;
21463da42859SDinh Nguyen 		}
21473da42859SDinh Nguyen 	}
21483da42859SDinh Nguyen 
21493da42859SDinh Nguyen 	/*
21503da42859SDinh Nguyen 	 * -mid_min/2 represents the amount that we need to move DQS.
21513da42859SDinh Nguyen 	 * If mid_min is odd and positive we'll need to add one to
21523da42859SDinh Nguyen 	 * make sure the rounding in further calculations is correct
21533da42859SDinh Nguyen 	 * (always bias to the right), so just add 1 for all positive values.
21543da42859SDinh Nguyen 	 */
21553da42859SDinh Nguyen 	if (mid_min > 0)
21563da42859SDinh Nguyen 		mid_min++;
21573da42859SDinh Nguyen 
21583da42859SDinh Nguyen 	mid_min = mid_min / 2;
21593da42859SDinh Nguyen 
21603da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d vfifo_center: mid_min=%d (index=%u)\n",
21613da42859SDinh Nguyen 		   __func__, __LINE__, mid_min, min_index);
21623da42859SDinh Nguyen 
21633da42859SDinh Nguyen 	/* Determine the amount we can change DQS (which is -mid_min) */
21643da42859SDinh Nguyen 	orig_mid_min = mid_min;
21653da42859SDinh Nguyen 	new_dqs = start_dqs - mid_min;
21663da42859SDinh Nguyen 	if (new_dqs > IO_DQS_IN_DELAY_MAX)
21673da42859SDinh Nguyen 		new_dqs = IO_DQS_IN_DELAY_MAX;
21683da42859SDinh Nguyen 	else if (new_dqs < 0)
21693da42859SDinh Nguyen 		new_dqs = 0;
21703da42859SDinh Nguyen 
21713da42859SDinh Nguyen 	mid_min = start_dqs - new_dqs;
21723da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "vfifo_center: new mid_min=%d new_dqs=%d\n",
21733da42859SDinh Nguyen 		   mid_min, new_dqs);
21743da42859SDinh Nguyen 
21753da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
21763da42859SDinh Nguyen 		if (start_dqs_en - mid_min > IO_DQS_EN_DELAY_MAX)
21773da42859SDinh Nguyen 			mid_min += start_dqs_en - mid_min - IO_DQS_EN_DELAY_MAX;
21783da42859SDinh Nguyen 		else if (start_dqs_en - mid_min < 0)
21793da42859SDinh Nguyen 			mid_min += start_dqs_en - mid_min;
21803da42859SDinh Nguyen 	}
21813da42859SDinh Nguyen 	new_dqs = start_dqs - mid_min;
21823da42859SDinh Nguyen 
21833da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "vfifo_center: start_dqs=%d start_dqs_en=%d \
21843da42859SDinh Nguyen 		   new_dqs=%d mid_min=%d\n", start_dqs,
21853da42859SDinh Nguyen 		   IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS ? start_dqs_en : -1,
21863da42859SDinh Nguyen 		   new_dqs, mid_min);
21873da42859SDinh Nguyen 
21883da42859SDinh Nguyen 	/* Initialize data for export structures */
21893da42859SDinh Nguyen 	dqs_margin = IO_IO_IN_DELAY_MAX + 1;
21903da42859SDinh Nguyen 	dq_margin  = IO_IO_IN_DELAY_MAX + 1;
21913da42859SDinh Nguyen 
21923da42859SDinh Nguyen 	/* add delay to bring centre of all DQ windows to the same "level" */
21933da42859SDinh Nguyen 	for (i = 0, p = test_bgn; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++, p++) {
21943da42859SDinh Nguyen 		/* Use values before divide by 2 to reduce round off error */
21953da42859SDinh Nguyen 		shift_dq = (left_edge[i] - right_edge[i] -
21963da42859SDinh Nguyen 			(left_edge[min_index] - right_edge[min_index]))/2  +
21973da42859SDinh Nguyen 			(orig_mid_min - mid_min);
21983da42859SDinh Nguyen 
21993da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "vfifo_center: before: \
22003da42859SDinh Nguyen 			   shift_dq[%u]=%d\n", i, shift_dq);
22013da42859SDinh Nguyen 
2202*1273dd9eSMarek Vasut 		addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_IN_DELAY_OFFSET;
220317fdc916SMarek Vasut 		temp_dq_in_delay1 = readl(addr + (p << 2));
220417fdc916SMarek Vasut 		temp_dq_in_delay2 = readl(addr + (i << 2));
22053da42859SDinh Nguyen 
22063da42859SDinh Nguyen 		if (shift_dq + (int32_t)temp_dq_in_delay1 >
22073da42859SDinh Nguyen 			(int32_t)IO_IO_IN_DELAY_MAX) {
22083da42859SDinh Nguyen 			shift_dq = (int32_t)IO_IO_IN_DELAY_MAX - temp_dq_in_delay2;
22093da42859SDinh Nguyen 		} else if (shift_dq + (int32_t)temp_dq_in_delay1 < 0) {
22103da42859SDinh Nguyen 			shift_dq = -(int32_t)temp_dq_in_delay1;
22113da42859SDinh Nguyen 		}
22123da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "vfifo_center: after: \
22133da42859SDinh Nguyen 			   shift_dq[%u]=%d\n", i, shift_dq);
22143da42859SDinh Nguyen 		final_dq[i] = temp_dq_in_delay1 + shift_dq;
22153da42859SDinh Nguyen 		scc_mgr_set_dq_in_delay(write_group, p, final_dq[i]);
22163da42859SDinh Nguyen 		scc_mgr_load_dq(p);
22173da42859SDinh Nguyen 
22183da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "vfifo_center: margin[%u]=[%d,%d]\n", i,
22193da42859SDinh Nguyen 			   left_edge[i] - shift_dq + (-mid_min),
22203da42859SDinh Nguyen 			   right_edge[i] + shift_dq - (-mid_min));
22213da42859SDinh Nguyen 		/* To determine values for export structures */
22223da42859SDinh Nguyen 		if (left_edge[i] - shift_dq + (-mid_min) < dq_margin)
22233da42859SDinh Nguyen 			dq_margin = left_edge[i] - shift_dq + (-mid_min);
22243da42859SDinh Nguyen 
22253da42859SDinh Nguyen 		if (right_edge[i] + shift_dq - (-mid_min) < dqs_margin)
22263da42859SDinh Nguyen 			dqs_margin = right_edge[i] + shift_dq - (-mid_min);
22273da42859SDinh Nguyen 	}
22283da42859SDinh Nguyen 
22293da42859SDinh Nguyen 	final_dqs = new_dqs;
22303da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS)
22313da42859SDinh Nguyen 		final_dqs_en = start_dqs_en - mid_min;
22323da42859SDinh Nguyen 
22333da42859SDinh Nguyen 	/* Move DQS-en */
22343da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
22353da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay(read_group, final_dqs_en);
22363da42859SDinh Nguyen 		scc_mgr_load_dqs(read_group);
22373da42859SDinh Nguyen 	}
22383da42859SDinh Nguyen 
22393da42859SDinh Nguyen 	/* Move DQS */
22403da42859SDinh Nguyen 	scc_mgr_set_dqs_bus_in_delay(read_group, final_dqs);
22413da42859SDinh Nguyen 	scc_mgr_load_dqs(read_group);
22423da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d vfifo_center: dq_margin=%d \
22433da42859SDinh Nguyen 		   dqs_margin=%d", __func__, __LINE__,
22443da42859SDinh Nguyen 		   dq_margin, dqs_margin);
22453da42859SDinh Nguyen 
22463da42859SDinh Nguyen 	/*
22473da42859SDinh Nguyen 	 * Do not remove this line as it makes sure all of our decisions
22483da42859SDinh Nguyen 	 * have been applied. Apply the update bit.
22493da42859SDinh Nguyen 	 */
2250*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
22513da42859SDinh Nguyen 
22523da42859SDinh Nguyen 	return (dq_margin >= 0) && (dqs_margin >= 0);
22533da42859SDinh Nguyen }
22543da42859SDinh Nguyen 
22553da42859SDinh Nguyen /*
22563da42859SDinh Nguyen  * calibrate the read valid prediction FIFO.
22573da42859SDinh Nguyen  *
22583da42859SDinh Nguyen  *  - read valid prediction will consist of finding a good DQS enable phase,
22593da42859SDinh Nguyen  * DQS enable delay, DQS input phase, and DQS input delay.
22603da42859SDinh Nguyen  *  - we also do a per-bit deskew on the DQ lines.
22613da42859SDinh Nguyen  */
22623da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo(uint32_t read_group,
22633da42859SDinh Nguyen 					   uint32_t test_bgn)
22643da42859SDinh Nguyen {
22653da42859SDinh Nguyen 	uint32_t p, d, rank_bgn, sr;
22663da42859SDinh Nguyen 	uint32_t dtaps_per_ptap;
22673da42859SDinh Nguyen 	uint32_t tmp_delay;
22683da42859SDinh Nguyen 	uint32_t bit_chk;
22693da42859SDinh Nguyen 	uint32_t grp_calibrated;
22703da42859SDinh Nguyen 	uint32_t write_group, write_test_bgn;
22713da42859SDinh Nguyen 	uint32_t failed_substage;
22723da42859SDinh Nguyen 
22737ac40d25SMarek Vasut 	debug("%s:%d: %u %u\n", __func__, __LINE__, read_group, test_bgn);
22743da42859SDinh Nguyen 
22753da42859SDinh Nguyen 	/* update info for sims */
22763da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_VFIFO);
22773da42859SDinh Nguyen 
22783da42859SDinh Nguyen 	write_group = read_group;
22793da42859SDinh Nguyen 	write_test_bgn = test_bgn;
22803da42859SDinh Nguyen 
22813da42859SDinh Nguyen 	/* USER Determine number of delay taps for each phase tap */
22823da42859SDinh Nguyen 	dtaps_per_ptap = 0;
22833da42859SDinh Nguyen 	tmp_delay = 0;
22843da42859SDinh Nguyen 	while (tmp_delay < IO_DELAY_PER_OPA_TAP) {
22853da42859SDinh Nguyen 		dtaps_per_ptap++;
22863da42859SDinh Nguyen 		tmp_delay += IO_DELAY_PER_DQS_EN_DCHAIN_TAP;
22873da42859SDinh Nguyen 	}
22883da42859SDinh Nguyen 	dtaps_per_ptap--;
22893da42859SDinh Nguyen 	tmp_delay = 0;
22903da42859SDinh Nguyen 
22913da42859SDinh Nguyen 	/* update info for sims */
22923da42859SDinh Nguyen 	reg_file_set_group(read_group);
22933da42859SDinh Nguyen 
22943da42859SDinh Nguyen 	grp_calibrated = 0;
22953da42859SDinh Nguyen 
22963da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_GUARANTEED_READ);
22973da42859SDinh Nguyen 	failed_substage = CAL_SUBSTAGE_GUARANTEED_READ;
22983da42859SDinh Nguyen 
22993da42859SDinh Nguyen 	for (d = 0; d <= dtaps_per_ptap && grp_calibrated == 0; d += 2) {
23003da42859SDinh Nguyen 		/*
23013da42859SDinh Nguyen 		 * In RLDRAMX we may be messing the delay of pins in
23023da42859SDinh Nguyen 		 * the same write group but outside of the current read
23033da42859SDinh Nguyen 		 * the group, but that's ok because we haven't
23043da42859SDinh Nguyen 		 * calibrated output side yet.
23053da42859SDinh Nguyen 		 */
23063da42859SDinh Nguyen 		if (d > 0) {
23073da42859SDinh Nguyen 			scc_mgr_apply_group_all_out_delay_add_all_ranks
23083da42859SDinh Nguyen 			(write_group, write_test_bgn, d);
23093da42859SDinh Nguyen 		}
23103da42859SDinh Nguyen 
23113da42859SDinh Nguyen 		for (p = 0; p <= IO_DQDQS_OUT_PHASE_MAX && grp_calibrated == 0;
23123da42859SDinh Nguyen 			p++) {
23133da42859SDinh Nguyen 			/* set a particular dqdqs phase */
23143da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase_all_ranks(read_group, p);
23153da42859SDinh Nguyen 
23163da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d calibrate_vfifo: g=%u \
23173da42859SDinh Nguyen 				   p=%u d=%u\n", __func__, __LINE__,
23183da42859SDinh Nguyen 				   read_group, p, d);
23193da42859SDinh Nguyen 
23203da42859SDinh Nguyen 			/*
23213da42859SDinh Nguyen 			 * Load up the patterns used by read calibration
23223da42859SDinh Nguyen 			 * using current DQDQS phase.
23233da42859SDinh Nguyen 			 */
23243da42859SDinh Nguyen 			rw_mgr_mem_calibrate_read_load_patterns(0, 1);
23253da42859SDinh Nguyen 			if (!(gbl->phy_debug_mode_flags &
23263da42859SDinh Nguyen 				PHY_DEBUG_DISABLE_GUARANTEED_READ)) {
23273da42859SDinh Nguyen 				if (!rw_mgr_mem_calibrate_read_test_patterns_all_ranks
23283da42859SDinh Nguyen 				    (read_group, 1, &bit_chk)) {
23293da42859SDinh Nguyen 					debug_cond(DLEVEL == 1, "%s:%d Guaranteed read test failed:",
23303da42859SDinh Nguyen 						   __func__, __LINE__);
23313da42859SDinh Nguyen 					debug_cond(DLEVEL == 1, " g=%u p=%u d=%u\n",
23323da42859SDinh Nguyen 						   read_group, p, d);
23333da42859SDinh Nguyen 					break;
23343da42859SDinh Nguyen 				}
23353da42859SDinh Nguyen 			}
23363da42859SDinh Nguyen 
23373da42859SDinh Nguyen /* case:56390 */
23383da42859SDinh Nguyen 			grp_calibrated = 1;
23393da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase_sweep_dq_in_delay
23403da42859SDinh Nguyen 		    (write_group, read_group, test_bgn)) {
23413da42859SDinh Nguyen 				/*
23423da42859SDinh Nguyen 				 * USER Read per-bit deskew can be done on a
23433da42859SDinh Nguyen 				 * per shadow register basis.
23443da42859SDinh Nguyen 				 */
23453da42859SDinh Nguyen 				for (rank_bgn = 0, sr = 0;
23463da42859SDinh Nguyen 					rank_bgn < RW_MGR_MEM_NUMBER_OF_RANKS;
23473da42859SDinh Nguyen 					rank_bgn += NUM_RANKS_PER_SHADOW_REG,
23483da42859SDinh Nguyen 					++sr) {
23493da42859SDinh Nguyen 					/*
23503da42859SDinh Nguyen 					 * Determine if this set of ranks
23513da42859SDinh Nguyen 					 * should be skipped entirely.
23523da42859SDinh Nguyen 					 */
23533da42859SDinh Nguyen 					if (!param->skip_shadow_regs[sr]) {
23543da42859SDinh Nguyen 						/*
23553da42859SDinh Nguyen 						 * If doing read after write
23563da42859SDinh Nguyen 						 * calibration, do not update
23573da42859SDinh Nguyen 						 * FOM, now - do it then.
23583da42859SDinh Nguyen 						 */
23593da42859SDinh Nguyen 					if (!rw_mgr_mem_calibrate_vfifo_center
23603da42859SDinh Nguyen 						(rank_bgn, write_group,
23613da42859SDinh Nguyen 						read_group, test_bgn, 1, 0)) {
23623da42859SDinh Nguyen 							grp_calibrated = 0;
23633da42859SDinh Nguyen 							failed_substage =
23643da42859SDinh Nguyen 						CAL_SUBSTAGE_VFIFO_CENTER;
23653da42859SDinh Nguyen 						}
23663da42859SDinh Nguyen 					}
23673da42859SDinh Nguyen 				}
23683da42859SDinh Nguyen 			} else {
23693da42859SDinh Nguyen 				grp_calibrated = 0;
23703da42859SDinh Nguyen 				failed_substage = CAL_SUBSTAGE_DQS_EN_PHASE;
23713da42859SDinh Nguyen 			}
23723da42859SDinh Nguyen 		}
23733da42859SDinh Nguyen 	}
23743da42859SDinh Nguyen 
23753da42859SDinh Nguyen 	if (grp_calibrated == 0) {
23763da42859SDinh Nguyen 		set_failing_group_stage(write_group, CAL_STAGE_VFIFO,
23773da42859SDinh Nguyen 					failed_substage);
23783da42859SDinh Nguyen 		return 0;
23793da42859SDinh Nguyen 	}
23803da42859SDinh Nguyen 
23813da42859SDinh Nguyen 	/*
23823da42859SDinh Nguyen 	 * Reset the delay chains back to zero if they have moved > 1
23833da42859SDinh Nguyen 	 * (check for > 1 because loop will increase d even when pass in
23843da42859SDinh Nguyen 	 * first case).
23853da42859SDinh Nguyen 	 */
23863da42859SDinh Nguyen 	if (d > 2)
23873da42859SDinh Nguyen 		scc_mgr_zero_group(write_group, write_test_bgn, 1);
23883da42859SDinh Nguyen 
23893da42859SDinh Nguyen 	return 1;
23903da42859SDinh Nguyen }
23913da42859SDinh Nguyen 
23923da42859SDinh Nguyen /* VFIFO Calibration -- Read Deskew Calibration after write deskew */
23933da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo_end(uint32_t read_group,
23943da42859SDinh Nguyen 					       uint32_t test_bgn)
23953da42859SDinh Nguyen {
23963da42859SDinh Nguyen 	uint32_t rank_bgn, sr;
23973da42859SDinh Nguyen 	uint32_t grp_calibrated;
23983da42859SDinh Nguyen 	uint32_t write_group;
23993da42859SDinh Nguyen 
24003da42859SDinh Nguyen 	debug("%s:%d %u %u", __func__, __LINE__, read_group, test_bgn);
24013da42859SDinh Nguyen 
24023da42859SDinh Nguyen 	/* update info for sims */
24033da42859SDinh Nguyen 
24043da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_VFIFO_AFTER_WRITES);
24053da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_VFIFO_CENTER);
24063da42859SDinh Nguyen 
24073da42859SDinh Nguyen 	write_group = read_group;
24083da42859SDinh Nguyen 
24093da42859SDinh Nguyen 	/* update info for sims */
24103da42859SDinh Nguyen 	reg_file_set_group(read_group);
24113da42859SDinh Nguyen 
24123da42859SDinh Nguyen 	grp_calibrated = 1;
24133da42859SDinh Nguyen 	/* Read per-bit deskew can be done on a per shadow register basis */
24143da42859SDinh Nguyen 	for (rank_bgn = 0, sr = 0; rank_bgn < RW_MGR_MEM_NUMBER_OF_RANKS;
24153da42859SDinh Nguyen 		rank_bgn += NUM_RANKS_PER_SHADOW_REG, ++sr) {
24163da42859SDinh Nguyen 		/* Determine if this set of ranks should be skipped entirely */
24173da42859SDinh Nguyen 		if (!param->skip_shadow_regs[sr]) {
24183da42859SDinh Nguyen 		/* This is the last calibration round, update FOM here */
24193da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_vfifo_center(rank_bgn,
24203da42859SDinh Nguyen 								write_group,
24213da42859SDinh Nguyen 								read_group,
24223da42859SDinh Nguyen 								test_bgn, 0,
24233da42859SDinh Nguyen 								1)) {
24243da42859SDinh Nguyen 				grp_calibrated = 0;
24253da42859SDinh Nguyen 			}
24263da42859SDinh Nguyen 		}
24273da42859SDinh Nguyen 	}
24283da42859SDinh Nguyen 
24293da42859SDinh Nguyen 
24303da42859SDinh Nguyen 	if (grp_calibrated == 0) {
24313da42859SDinh Nguyen 		set_failing_group_stage(write_group,
24323da42859SDinh Nguyen 					CAL_STAGE_VFIFO_AFTER_WRITES,
24333da42859SDinh Nguyen 					CAL_SUBSTAGE_VFIFO_CENTER);
24343da42859SDinh Nguyen 		return 0;
24353da42859SDinh Nguyen 	}
24363da42859SDinh Nguyen 
24373da42859SDinh Nguyen 	return 1;
24383da42859SDinh Nguyen }
24393da42859SDinh Nguyen 
24403da42859SDinh Nguyen /* Calibrate LFIFO to find smallest read latency */
24413da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_lfifo(void)
24423da42859SDinh Nguyen {
24433da42859SDinh Nguyen 	uint32_t found_one;
24443da42859SDinh Nguyen 	uint32_t bit_chk;
24453da42859SDinh Nguyen 
24463da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
24473da42859SDinh Nguyen 
24483da42859SDinh Nguyen 	/* update info for sims */
24493da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_LFIFO);
24503da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_READ_LATENCY);
24513da42859SDinh Nguyen 
24523da42859SDinh Nguyen 	/* Load up the patterns used by read calibration for all ranks */
24533da42859SDinh Nguyen 	rw_mgr_mem_calibrate_read_load_patterns(0, 1);
24543da42859SDinh Nguyen 	found_one = 0;
24553da42859SDinh Nguyen 
24563da42859SDinh Nguyen 	do {
2457*1273dd9eSMarek Vasut 		writel(gbl->curr_read_lat, &phy_mgr_cfg->phy_rlat);
24583da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d lfifo: read_lat=%u",
24593da42859SDinh Nguyen 			   __func__, __LINE__, gbl->curr_read_lat);
24603da42859SDinh Nguyen 
24613da42859SDinh Nguyen 		if (!rw_mgr_mem_calibrate_read_test_all_ranks(0,
24623da42859SDinh Nguyen 							      NUM_READ_TESTS,
24633da42859SDinh Nguyen 							      PASS_ALL_BITS,
24643da42859SDinh Nguyen 							      &bit_chk, 1)) {
24653da42859SDinh Nguyen 			break;
24663da42859SDinh Nguyen 		}
24673da42859SDinh Nguyen 
24683da42859SDinh Nguyen 		found_one = 1;
24693da42859SDinh Nguyen 		/* reduce read latency and see if things are working */
24703da42859SDinh Nguyen 		/* correctly */
24713da42859SDinh Nguyen 		gbl->curr_read_lat--;
24723da42859SDinh Nguyen 	} while (gbl->curr_read_lat > 0);
24733da42859SDinh Nguyen 
24743da42859SDinh Nguyen 	/* reset the fifos to get pointers to known state */
24753da42859SDinh Nguyen 
2476*1273dd9eSMarek Vasut 	writel(0, &phy_mgr_cmd->fifo_reset);
24773da42859SDinh Nguyen 
24783da42859SDinh Nguyen 	if (found_one) {
24793da42859SDinh Nguyen 		/* add a fudge factor to the read latency that was determined */
24803da42859SDinh Nguyen 		gbl->curr_read_lat += 2;
2481*1273dd9eSMarek Vasut 		writel(gbl->curr_read_lat, &phy_mgr_cfg->phy_rlat);
24823da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d lfifo: success: using \
24833da42859SDinh Nguyen 			   read_lat=%u\n", __func__, __LINE__,
24843da42859SDinh Nguyen 			   gbl->curr_read_lat);
24853da42859SDinh Nguyen 		return 1;
24863da42859SDinh Nguyen 	} else {
24873da42859SDinh Nguyen 		set_failing_group_stage(0xff, CAL_STAGE_LFIFO,
24883da42859SDinh Nguyen 					CAL_SUBSTAGE_READ_LATENCY);
24893da42859SDinh Nguyen 
24903da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d lfifo: failed at initial \
24913da42859SDinh Nguyen 			   read_lat=%u\n", __func__, __LINE__,
24923da42859SDinh Nguyen 			   gbl->curr_read_lat);
24933da42859SDinh Nguyen 		return 0;
24943da42859SDinh Nguyen 	}
24953da42859SDinh Nguyen }
24963da42859SDinh Nguyen 
24973da42859SDinh Nguyen /*
24983da42859SDinh Nguyen  * issue write test command.
24993da42859SDinh Nguyen  * two variants are provided. one that just tests a write pattern and
25003da42859SDinh Nguyen  * another that tests datamask functionality.
25013da42859SDinh Nguyen  */
25023da42859SDinh Nguyen static void rw_mgr_mem_calibrate_write_test_issue(uint32_t group,
25033da42859SDinh Nguyen 						  uint32_t test_dm)
25043da42859SDinh Nguyen {
25053da42859SDinh Nguyen 	uint32_t mcc_instruction;
25063da42859SDinh Nguyen 	uint32_t quick_write_mode = (((STATIC_CALIB_STEPS) & CALIB_SKIP_WRITES) &&
25073da42859SDinh Nguyen 		ENABLE_SUPER_QUICK_CALIBRATION);
25083da42859SDinh Nguyen 	uint32_t rw_wl_nop_cycles;
25093da42859SDinh Nguyen 	uint32_t addr;
25103da42859SDinh Nguyen 
25113da42859SDinh Nguyen 	/*
25123da42859SDinh Nguyen 	 * Set counter and jump addresses for the right
25133da42859SDinh Nguyen 	 * number of NOP cycles.
25143da42859SDinh Nguyen 	 * The number of supported NOP cycles can range from -1 to infinity
25153da42859SDinh Nguyen 	 * Three different cases are handled:
25163da42859SDinh Nguyen 	 *
25173da42859SDinh Nguyen 	 * 1. For a number of NOP cycles greater than 0, the RW Mgr looping
25183da42859SDinh Nguyen 	 *    mechanism will be used to insert the right number of NOPs
25193da42859SDinh Nguyen 	 *
25203da42859SDinh Nguyen 	 * 2. For a number of NOP cycles equals to 0, the micro-instruction
25213da42859SDinh Nguyen 	 *    issuing the write command will jump straight to the
25223da42859SDinh Nguyen 	 *    micro-instruction that turns on DQS (for DDRx), or outputs write
25233da42859SDinh Nguyen 	 *    data (for RLD), skipping
25243da42859SDinh Nguyen 	 *    the NOP micro-instruction all together
25253da42859SDinh Nguyen 	 *
25263da42859SDinh Nguyen 	 * 3. A number of NOP cycles equal to -1 indicates that DQS must be
25273da42859SDinh Nguyen 	 *    turned on in the same micro-instruction that issues the write
25283da42859SDinh Nguyen 	 *    command. Then we need
25293da42859SDinh Nguyen 	 *    to directly jump to the micro-instruction that sends out the data
25303da42859SDinh Nguyen 	 *
25313da42859SDinh Nguyen 	 * NOTE: Implementing this mechanism uses 2 RW Mgr jump-counters
25323da42859SDinh Nguyen 	 *       (2 and 3). One jump-counter (0) is used to perform multiple
25333da42859SDinh Nguyen 	 *       write-read operations.
25343da42859SDinh Nguyen 	 *       one counter left to issue this command in "multiple-group" mode
25353da42859SDinh Nguyen 	 */
25363da42859SDinh Nguyen 
25373da42859SDinh Nguyen 	rw_wl_nop_cycles = gbl->rw_wl_nop_cycles;
25383da42859SDinh Nguyen 
25393da42859SDinh Nguyen 	if (rw_wl_nop_cycles == -1) {
25403da42859SDinh Nguyen 		/*
25413da42859SDinh Nguyen 		 * CNTR 2 - We want to execute the special write operation that
25423da42859SDinh Nguyen 		 * turns on DQS right away and then skip directly to the
25433da42859SDinh Nguyen 		 * instruction that sends out the data. We set the counter to a
25443da42859SDinh Nguyen 		 * large number so that the jump is always taken.
25453da42859SDinh Nguyen 		 */
2546*1273dd9eSMarek Vasut 		writel(0xFF, &sdr_rw_load_mgr_regs->load_cntr2);
25473da42859SDinh Nguyen 
25483da42859SDinh Nguyen 		/* CNTR 3 - Not used */
25493da42859SDinh Nguyen 		if (test_dm) {
25503da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_DM_BANK_0_WL_1;
25513da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_DATA,
2552*1273dd9eSMarek Vasut 			       &sdr_rw_load_jump_mgr_regs->load_jump_add2);
25533da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_NOP,
2554*1273dd9eSMarek Vasut 			       &sdr_rw_load_jump_mgr_regs->load_jump_add3);
25553da42859SDinh Nguyen 		} else {
25563da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_BANK_0_WL_1;
2557*1273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_BANK_0_DATA,
2558*1273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add2);
2559*1273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_BANK_0_NOP,
2560*1273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add3);
25613da42859SDinh Nguyen 		}
25623da42859SDinh Nguyen 	} else if (rw_wl_nop_cycles == 0) {
25633da42859SDinh Nguyen 		/*
25643da42859SDinh Nguyen 		 * CNTR 2 - We want to skip the NOP operation and go straight
25653da42859SDinh Nguyen 		 * to the DQS enable instruction. We set the counter to a large
25663da42859SDinh Nguyen 		 * number so that the jump is always taken.
25673da42859SDinh Nguyen 		 */
2568*1273dd9eSMarek Vasut 		writel(0xFF, &sdr_rw_load_mgr_regs->load_cntr2);
25693da42859SDinh Nguyen 
25703da42859SDinh Nguyen 		/* CNTR 3 - Not used */
25713da42859SDinh Nguyen 		if (test_dm) {
25723da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_DM_BANK_0;
25733da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_DQS,
2574*1273dd9eSMarek Vasut 			       &sdr_rw_load_jump_mgr_regs->load_jump_add2);
25753da42859SDinh Nguyen 		} else {
25763da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_BANK_0;
2577*1273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_BANK_0_DQS,
2578*1273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add2);
25793da42859SDinh Nguyen 		}
25803da42859SDinh Nguyen 	} else {
25813da42859SDinh Nguyen 		/*
25823da42859SDinh Nguyen 		 * CNTR 2 - In this case we want to execute the next instruction
25833da42859SDinh Nguyen 		 * and NOT take the jump. So we set the counter to 0. The jump
25843da42859SDinh Nguyen 		 * address doesn't count.
25853da42859SDinh Nguyen 		 */
2586*1273dd9eSMarek Vasut 		writel(0x0, &sdr_rw_load_mgr_regs->load_cntr2);
2587*1273dd9eSMarek Vasut 		writel(0x0, &sdr_rw_load_jump_mgr_regs->load_jump_add2);
25883da42859SDinh Nguyen 
25893da42859SDinh Nguyen 		/*
25903da42859SDinh Nguyen 		 * CNTR 3 - Set the nop counter to the number of cycles we
25913da42859SDinh Nguyen 		 * need to loop for, minus 1.
25923da42859SDinh Nguyen 		 */
2593*1273dd9eSMarek Vasut 		writel(rw_wl_nop_cycles - 1, &sdr_rw_load_mgr_regs->load_cntr3);
25943da42859SDinh Nguyen 		if (test_dm) {
25953da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_DM_BANK_0;
2596*1273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_NOP,
2597*1273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add3);
25983da42859SDinh Nguyen 		} else {
25993da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_BANK_0;
2600*1273dd9eSMarek Vasut 			writel(RW_MGR_LFSR_WR_RD_BANK_0_NOP,
2601*1273dd9eSMarek Vasut 				&sdr_rw_load_jump_mgr_regs->load_jump_add3);
26023da42859SDinh Nguyen 		}
26033da42859SDinh Nguyen 	}
26043da42859SDinh Nguyen 
2605*1273dd9eSMarek Vasut 	writel(0, SDR_PHYGRP_RWMGRGRP_ADDRESS |
2606*1273dd9eSMarek Vasut 		  RW_MGR_RESET_READ_DATAPATH_OFFSET);
26073da42859SDinh Nguyen 
26083da42859SDinh Nguyen 	if (quick_write_mode)
2609*1273dd9eSMarek Vasut 		writel(0x08, &sdr_rw_load_mgr_regs->load_cntr0);
26103da42859SDinh Nguyen 	else
2611*1273dd9eSMarek Vasut 		writel(0x40, &sdr_rw_load_mgr_regs->load_cntr0);
26123da42859SDinh Nguyen 
2613*1273dd9eSMarek Vasut 	writel(mcc_instruction, &sdr_rw_load_jump_mgr_regs->load_jump_add0);
26143da42859SDinh Nguyen 
26153da42859SDinh Nguyen 	/*
26163da42859SDinh Nguyen 	 * CNTR 1 - This is used to ensure enough time elapses
26173da42859SDinh Nguyen 	 * for read data to come back.
26183da42859SDinh Nguyen 	 */
2619*1273dd9eSMarek Vasut 	writel(0x30, &sdr_rw_load_mgr_regs->load_cntr1);
26203da42859SDinh Nguyen 
26213da42859SDinh Nguyen 	if (test_dm) {
2622*1273dd9eSMarek Vasut 		writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_WAIT,
2623*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
26243da42859SDinh Nguyen 	} else {
2625*1273dd9eSMarek Vasut 		writel(RW_MGR_LFSR_WR_RD_BANK_0_WAIT,
2626*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
26273da42859SDinh Nguyen 	}
26283da42859SDinh Nguyen 
2629c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
263017fdc916SMarek Vasut 	writel(mcc_instruction, addr + (group << 2));
26313da42859SDinh Nguyen }
26323da42859SDinh Nguyen 
26333da42859SDinh Nguyen /* Test writes, can check for a single bit pass or multiple bit pass */
26343da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_write_test(uint32_t rank_bgn,
26353da42859SDinh Nguyen 	uint32_t write_group, uint32_t use_dm, uint32_t all_correct,
26363da42859SDinh Nguyen 	uint32_t *bit_chk, uint32_t all_ranks)
26373da42859SDinh Nguyen {
26383da42859SDinh Nguyen 	uint32_t r;
26393da42859SDinh Nguyen 	uint32_t correct_mask_vg;
26403da42859SDinh Nguyen 	uint32_t tmp_bit_chk;
26413da42859SDinh Nguyen 	uint32_t vg;
26423da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
26433da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
26443da42859SDinh Nguyen 	uint32_t addr_rw_mgr;
26453da42859SDinh Nguyen 	uint32_t base_rw_mgr;
26463da42859SDinh Nguyen 
26473da42859SDinh Nguyen 	*bit_chk = param->write_correct_mask;
26483da42859SDinh Nguyen 	correct_mask_vg = param->write_correct_mask_vg;
26493da42859SDinh Nguyen 
26503da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
26513da42859SDinh Nguyen 		if (param->skip_ranks[r]) {
26523da42859SDinh Nguyen 			/* request to skip the rank */
26533da42859SDinh Nguyen 			continue;
26543da42859SDinh Nguyen 		}
26553da42859SDinh Nguyen 
26563da42859SDinh Nguyen 		/* set rank */
26573da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
26583da42859SDinh Nguyen 
26593da42859SDinh Nguyen 		tmp_bit_chk = 0;
2660a4bfa463SMarek Vasut 		addr_rw_mgr = SDR_PHYGRP_RWMGRGRP_ADDRESS;
26613da42859SDinh Nguyen 		for (vg = RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS-1; ; vg--) {
26623da42859SDinh Nguyen 			/* reset the fifos to get pointers to known state */
2663*1273dd9eSMarek Vasut 			writel(0, &phy_mgr_cmd->fifo_reset);
26643da42859SDinh Nguyen 
26653da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk <<
26663da42859SDinh Nguyen 				(RW_MGR_MEM_DQ_PER_WRITE_DQS /
26673da42859SDinh Nguyen 				RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS);
26683da42859SDinh Nguyen 			rw_mgr_mem_calibrate_write_test_issue(write_group *
26693da42859SDinh Nguyen 				RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS+vg,
26703da42859SDinh Nguyen 				use_dm);
26713da42859SDinh Nguyen 
267217fdc916SMarek Vasut 			base_rw_mgr = readl(addr_rw_mgr);
26733da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk | (correct_mask_vg & ~(base_rw_mgr));
26743da42859SDinh Nguyen 			if (vg == 0)
26753da42859SDinh Nguyen 				break;
26763da42859SDinh Nguyen 		}
26773da42859SDinh Nguyen 		*bit_chk &= tmp_bit_chk;
26783da42859SDinh Nguyen 	}
26793da42859SDinh Nguyen 
26803da42859SDinh Nguyen 	if (all_correct) {
26813da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
26823da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_test(%u,%u,ALL) : %u == \
26833da42859SDinh Nguyen 			   %u => %lu", write_group, use_dm,
26843da42859SDinh Nguyen 			   *bit_chk, param->write_correct_mask,
26853da42859SDinh Nguyen 			   (long unsigned int)(*bit_chk ==
26863da42859SDinh Nguyen 			   param->write_correct_mask));
26873da42859SDinh Nguyen 		return *bit_chk == param->write_correct_mask;
26883da42859SDinh Nguyen 	} else {
26893da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
26903da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_test(%u,%u,ONE) : %u != ",
26913da42859SDinh Nguyen 		       write_group, use_dm, *bit_chk);
26923da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%lu" " => %lu", (long unsigned int)0,
26933da42859SDinh Nguyen 			(long unsigned int)(*bit_chk != 0));
26943da42859SDinh Nguyen 		return *bit_chk != 0x00;
26953da42859SDinh Nguyen 	}
26963da42859SDinh Nguyen }
26973da42859SDinh Nguyen 
26983da42859SDinh Nguyen /*
26993da42859SDinh Nguyen  * center all windows. do per-bit-deskew to possibly increase size of
27003da42859SDinh Nguyen  * certain windows.
27013da42859SDinh Nguyen  */
27023da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_writes_center(uint32_t rank_bgn,
27033da42859SDinh Nguyen 	uint32_t write_group, uint32_t test_bgn)
27043da42859SDinh Nguyen {
27053da42859SDinh Nguyen 	uint32_t i, p, min_index;
27063da42859SDinh Nguyen 	int32_t d;
27073da42859SDinh Nguyen 	/*
27083da42859SDinh Nguyen 	 * Store these as signed since there are comparisons with
27093da42859SDinh Nguyen 	 * signed numbers.
27103da42859SDinh Nguyen 	 */
27113da42859SDinh Nguyen 	uint32_t bit_chk;
27123da42859SDinh Nguyen 	uint32_t sticky_bit_chk;
27133da42859SDinh Nguyen 	int32_t left_edge[RW_MGR_MEM_DQ_PER_WRITE_DQS];
27143da42859SDinh Nguyen 	int32_t right_edge[RW_MGR_MEM_DQ_PER_WRITE_DQS];
27153da42859SDinh Nguyen 	int32_t mid;
27163da42859SDinh Nguyen 	int32_t mid_min, orig_mid_min;
27173da42859SDinh Nguyen 	int32_t new_dqs, start_dqs, shift_dq;
27183da42859SDinh Nguyen 	int32_t dq_margin, dqs_margin, dm_margin;
27193da42859SDinh Nguyen 	uint32_t stop;
27203da42859SDinh Nguyen 	uint32_t temp_dq_out1_delay;
27213da42859SDinh Nguyen 	uint32_t addr;
27223da42859SDinh Nguyen 
27233da42859SDinh Nguyen 	debug("%s:%d %u %u", __func__, __LINE__, write_group, test_bgn);
27243da42859SDinh Nguyen 
27253da42859SDinh Nguyen 	dm_margin = 0;
27263da42859SDinh Nguyen 
2727c4815f76SMarek Vasut 	addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
272817fdc916SMarek Vasut 	start_dqs = readl(addr +
27293da42859SDinh Nguyen 			  (RW_MGR_MEM_DQ_PER_WRITE_DQS << 2));
27303da42859SDinh Nguyen 
27313da42859SDinh Nguyen 	/* per-bit deskew */
27323da42859SDinh Nguyen 
27333da42859SDinh Nguyen 	/*
27343da42859SDinh Nguyen 	 * set the left and right edge of each bit to an illegal value
27353da42859SDinh Nguyen 	 * use (IO_IO_OUT1_DELAY_MAX + 1) as an illegal value.
27363da42859SDinh Nguyen 	 */
27373da42859SDinh Nguyen 	sticky_bit_chk = 0;
27383da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
27393da42859SDinh Nguyen 		left_edge[i]  = IO_IO_OUT1_DELAY_MAX + 1;
27403da42859SDinh Nguyen 		right_edge[i] = IO_IO_OUT1_DELAY_MAX + 1;
27413da42859SDinh Nguyen 	}
27423da42859SDinh Nguyen 
27433da42859SDinh Nguyen 	/* Search for the left edge of the window for each bit */
27443da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_OUT1_DELAY_MAX; d++) {
27453da42859SDinh Nguyen 		scc_mgr_apply_group_dq_out1_delay(write_group, test_bgn, d);
27463da42859SDinh Nguyen 
2747*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
27483da42859SDinh Nguyen 
27493da42859SDinh Nguyen 		/*
27503da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
27513da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
27523da42859SDinh Nguyen 		 */
27533da42859SDinh Nguyen 		stop = !rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
27543da42859SDinh Nguyen 			0, PASS_ONE_BIT, &bit_chk, 0);
27553da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
27563da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->write_correct_mask);
27573da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center(left): dtap=%d => %u \
27583da42859SDinh Nguyen 			   == %u && %u [bit_chk= %u ]\n",
27593da42859SDinh Nguyen 			d, sticky_bit_chk, param->write_correct_mask,
27603da42859SDinh Nguyen 			stop, bit_chk);
27613da42859SDinh Nguyen 
27623da42859SDinh Nguyen 		if (stop == 1) {
27633da42859SDinh Nguyen 			break;
27643da42859SDinh Nguyen 		} else {
27653da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
27663da42859SDinh Nguyen 				if (bit_chk & 1) {
27673da42859SDinh Nguyen 					/*
27683da42859SDinh Nguyen 					 * Remember a passing test as the
27693da42859SDinh Nguyen 					 * left_edge.
27703da42859SDinh Nguyen 					 */
27713da42859SDinh Nguyen 					left_edge[i] = d;
27723da42859SDinh Nguyen 				} else {
27733da42859SDinh Nguyen 					/*
27743da42859SDinh Nguyen 					 * If a left edge has not been seen
27753da42859SDinh Nguyen 					 * yet, then a future passing test will
27763da42859SDinh Nguyen 					 * mark this edge as the right edge.
27773da42859SDinh Nguyen 					 */
27783da42859SDinh Nguyen 					if (left_edge[i] ==
27793da42859SDinh Nguyen 						IO_IO_OUT1_DELAY_MAX + 1) {
27803da42859SDinh Nguyen 						right_edge[i] = -(d + 1);
27813da42859SDinh Nguyen 					}
27823da42859SDinh Nguyen 				}
27833da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "write_center[l,d=%d):", d);
27843da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "bit_chk_test=%d left_edge[%u]: %d",
27853da42859SDinh Nguyen 					   (int)(bit_chk & 1), i, left_edge[i]);
27863da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "right_edge[%u]: %d\n", i,
27873da42859SDinh Nguyen 				       right_edge[i]);
27883da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
27893da42859SDinh Nguyen 			}
27903da42859SDinh Nguyen 		}
27913da42859SDinh Nguyen 	}
27923da42859SDinh Nguyen 
27933da42859SDinh Nguyen 	/* Reset DQ delay chains to 0 */
27943da42859SDinh Nguyen 	scc_mgr_apply_group_dq_out1_delay(write_group, test_bgn, 0);
27953da42859SDinh Nguyen 	sticky_bit_chk = 0;
27963da42859SDinh Nguyen 	for (i = RW_MGR_MEM_DQ_PER_WRITE_DQS - 1;; i--) {
27973da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d write_center: left_edge[%u]: \
27983da42859SDinh Nguyen 			   %d right_edge[%u]: %d\n", __func__, __LINE__,
27993da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
28003da42859SDinh Nguyen 
28013da42859SDinh Nguyen 		/*
28023da42859SDinh Nguyen 		 * Check for cases where we haven't found the left edge,
28033da42859SDinh Nguyen 		 * which makes our assignment of the the right edge invalid.
28043da42859SDinh Nguyen 		 * Reset it to the illegal value.
28053da42859SDinh Nguyen 		 */
28063da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_OUT1_DELAY_MAX + 1) &&
28073da42859SDinh Nguyen 		    (right_edge[i] != IO_IO_OUT1_DELAY_MAX + 1)) {
28083da42859SDinh Nguyen 			right_edge[i] = IO_IO_OUT1_DELAY_MAX + 1;
28093da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d write_center: reset \
28103da42859SDinh Nguyen 				   right_edge[%u]: %d\n", __func__, __LINE__,
28113da42859SDinh Nguyen 				   i, right_edge[i]);
28123da42859SDinh Nguyen 		}
28133da42859SDinh Nguyen 
28143da42859SDinh Nguyen 		/*
28153da42859SDinh Nguyen 		 * Reset sticky bit (except for bits where we have
28163da42859SDinh Nguyen 		 * seen the left edge).
28173da42859SDinh Nguyen 		 */
28183da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk << 1;
28193da42859SDinh Nguyen 		if ((left_edge[i] != IO_IO_OUT1_DELAY_MAX + 1))
28203da42859SDinh Nguyen 			sticky_bit_chk = sticky_bit_chk | 1;
28213da42859SDinh Nguyen 
28223da42859SDinh Nguyen 		if (i == 0)
28233da42859SDinh Nguyen 			break;
28243da42859SDinh Nguyen 	}
28253da42859SDinh Nguyen 
28263da42859SDinh Nguyen 	/* Search for the right edge of the window for each bit */
28273da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_OUT1_DELAY_MAX - start_dqs; d++) {
28283da42859SDinh Nguyen 		scc_mgr_apply_group_dqs_io_and_oct_out1(write_group,
28293da42859SDinh Nguyen 							d + start_dqs);
28303da42859SDinh Nguyen 
2831*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
28323da42859SDinh Nguyen 
28333da42859SDinh Nguyen 		/*
28343da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
28353da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
28363da42859SDinh Nguyen 		 */
28373da42859SDinh Nguyen 		stop = !rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
28383da42859SDinh Nguyen 			0, PASS_ONE_BIT, &bit_chk, 0);
28393da42859SDinh Nguyen 
28403da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
28413da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->write_correct_mask);
28423da42859SDinh Nguyen 
28433da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center (right): dtap=%u => %u == \
28443da42859SDinh Nguyen 			   %u && %u\n", d, sticky_bit_chk,
28453da42859SDinh Nguyen 			   param->write_correct_mask, stop);
28463da42859SDinh Nguyen 
28473da42859SDinh Nguyen 		if (stop == 1) {
28483da42859SDinh Nguyen 			if (d == 0) {
28493da42859SDinh Nguyen 				for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS;
28503da42859SDinh Nguyen 					i++) {
28513da42859SDinh Nguyen 					/* d = 0 failed, but it passed when
28523da42859SDinh Nguyen 					testing the left edge, so it must be
28533da42859SDinh Nguyen 					marginal, set it to -1 */
28543da42859SDinh Nguyen 					if (right_edge[i] ==
28553da42859SDinh Nguyen 						IO_IO_OUT1_DELAY_MAX + 1 &&
28563da42859SDinh Nguyen 						left_edge[i] !=
28573da42859SDinh Nguyen 						IO_IO_OUT1_DELAY_MAX + 1) {
28583da42859SDinh Nguyen 						right_edge[i] = -1;
28593da42859SDinh Nguyen 					}
28603da42859SDinh Nguyen 				}
28613da42859SDinh Nguyen 			}
28623da42859SDinh Nguyen 			break;
28633da42859SDinh Nguyen 		} else {
28643da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
28653da42859SDinh Nguyen 				if (bit_chk & 1) {
28663da42859SDinh Nguyen 					/*
28673da42859SDinh Nguyen 					 * Remember a passing test as
28683da42859SDinh Nguyen 					 * the right_edge.
28693da42859SDinh Nguyen 					 */
28703da42859SDinh Nguyen 					right_edge[i] = d;
28713da42859SDinh Nguyen 				} else {
28723da42859SDinh Nguyen 					if (d != 0) {
28733da42859SDinh Nguyen 						/*
28743da42859SDinh Nguyen 						 * If a right edge has not
28753da42859SDinh Nguyen 						 * been seen yet, then a future
28763da42859SDinh Nguyen 						 * passing test will mark this
28773da42859SDinh Nguyen 						 * edge as the left edge.
28783da42859SDinh Nguyen 						 */
28793da42859SDinh Nguyen 						if (right_edge[i] ==
28803da42859SDinh Nguyen 						    IO_IO_OUT1_DELAY_MAX + 1)
28813da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
28823da42859SDinh Nguyen 					} else {
28833da42859SDinh Nguyen 						/*
28843da42859SDinh Nguyen 						 * d = 0 failed, but it passed
28853da42859SDinh Nguyen 						 * when testing the left edge,
28863da42859SDinh Nguyen 						 * so it must be marginal, set
28873da42859SDinh Nguyen 						 * it to -1.
28883da42859SDinh Nguyen 						 */
28893da42859SDinh Nguyen 						if (right_edge[i] ==
28903da42859SDinh Nguyen 						    IO_IO_OUT1_DELAY_MAX + 1 &&
28913da42859SDinh Nguyen 						    left_edge[i] !=
28923da42859SDinh Nguyen 						    IO_IO_OUT1_DELAY_MAX + 1)
28933da42859SDinh Nguyen 							right_edge[i] = -1;
28943da42859SDinh Nguyen 						/*
28953da42859SDinh Nguyen 						 * If a right edge has not been
28963da42859SDinh Nguyen 						 * seen yet, then a future
28973da42859SDinh Nguyen 						 * passing test will mark this
28983da42859SDinh Nguyen 						 * edge as the left edge.
28993da42859SDinh Nguyen 						 */
29003da42859SDinh Nguyen 						else if (right_edge[i] ==
29013da42859SDinh Nguyen 							IO_IO_OUT1_DELAY_MAX +
29023da42859SDinh Nguyen 							1)
29033da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
29043da42859SDinh Nguyen 					}
29053da42859SDinh Nguyen 				}
29063da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "write_center[r,d=%d):", d);
29073da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "bit_chk_test=%d left_edge[%u]: %d",
29083da42859SDinh Nguyen 					   (int)(bit_chk & 1), i, left_edge[i]);
29093da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "right_edge[%u]: %d\n", i,
29103da42859SDinh Nguyen 					   right_edge[i]);
29113da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
29123da42859SDinh Nguyen 			}
29133da42859SDinh Nguyen 		}
29143da42859SDinh Nguyen 	}
29153da42859SDinh Nguyen 
29163da42859SDinh Nguyen 	/* Check that all bits have a window */
29173da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
29183da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d write_center: left_edge[%u]: \
29193da42859SDinh Nguyen 			   %d right_edge[%u]: %d", __func__, __LINE__,
29203da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
29213da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_OUT1_DELAY_MAX + 1) ||
29223da42859SDinh Nguyen 		    (right_edge[i] == IO_IO_OUT1_DELAY_MAX + 1)) {
29233da42859SDinh Nguyen 			set_failing_group_stage(test_bgn + i,
29243da42859SDinh Nguyen 						CAL_STAGE_WRITES,
29253da42859SDinh Nguyen 						CAL_SUBSTAGE_WRITES_CENTER);
29263da42859SDinh Nguyen 			return 0;
29273da42859SDinh Nguyen 		}
29283da42859SDinh Nguyen 	}
29293da42859SDinh Nguyen 
29303da42859SDinh Nguyen 	/* Find middle of window for each DQ bit */
29313da42859SDinh Nguyen 	mid_min = left_edge[0] - right_edge[0];
29323da42859SDinh Nguyen 	min_index = 0;
29333da42859SDinh Nguyen 	for (i = 1; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
29343da42859SDinh Nguyen 		mid = left_edge[i] - right_edge[i];
29353da42859SDinh Nguyen 		if (mid < mid_min) {
29363da42859SDinh Nguyen 			mid_min = mid;
29373da42859SDinh Nguyen 			min_index = i;
29383da42859SDinh Nguyen 		}
29393da42859SDinh Nguyen 	}
29403da42859SDinh Nguyen 
29413da42859SDinh Nguyen 	/*
29423da42859SDinh Nguyen 	 * -mid_min/2 represents the amount that we need to move DQS.
29433da42859SDinh Nguyen 	 * If mid_min is odd and positive we'll need to add one to
29443da42859SDinh Nguyen 	 * make sure the rounding in further calculations is correct
29453da42859SDinh Nguyen 	 * (always bias to the right), so just add 1 for all positive values.
29463da42859SDinh Nguyen 	 */
29473da42859SDinh Nguyen 	if (mid_min > 0)
29483da42859SDinh Nguyen 		mid_min++;
29493da42859SDinh Nguyen 	mid_min = mid_min / 2;
29503da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d write_center: mid_min=%d\n", __func__,
29513da42859SDinh Nguyen 		   __LINE__, mid_min);
29523da42859SDinh Nguyen 
29533da42859SDinh Nguyen 	/* Determine the amount we can change DQS (which is -mid_min) */
29543da42859SDinh Nguyen 	orig_mid_min = mid_min;
29553da42859SDinh Nguyen 	new_dqs = start_dqs;
29563da42859SDinh Nguyen 	mid_min = 0;
29573da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d write_center: start_dqs=%d new_dqs=%d \
29583da42859SDinh Nguyen 		   mid_min=%d\n", __func__, __LINE__, start_dqs, new_dqs, mid_min);
29593da42859SDinh Nguyen 	/* Initialize data for export structures */
29603da42859SDinh Nguyen 	dqs_margin = IO_IO_OUT1_DELAY_MAX + 1;
29613da42859SDinh Nguyen 	dq_margin  = IO_IO_OUT1_DELAY_MAX + 1;
29623da42859SDinh Nguyen 
29633da42859SDinh Nguyen 	/* add delay to bring centre of all DQ windows to the same "level" */
29643da42859SDinh Nguyen 	for (i = 0, p = test_bgn; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++, p++) {
29653da42859SDinh Nguyen 		/* Use values before divide by 2 to reduce round off error */
29663da42859SDinh Nguyen 		shift_dq = (left_edge[i] - right_edge[i] -
29673da42859SDinh Nguyen 			(left_edge[min_index] - right_edge[min_index]))/2  +
29683da42859SDinh Nguyen 		(orig_mid_min - mid_min);
29693da42859SDinh Nguyen 
29703da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d write_center: before: shift_dq \
29713da42859SDinh Nguyen 			   [%u]=%d\n", __func__, __LINE__, i, shift_dq);
29723da42859SDinh Nguyen 
2973*1273dd9eSMarek Vasut 		addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
297417fdc916SMarek Vasut 		temp_dq_out1_delay = readl(addr + (i << 2));
29753da42859SDinh Nguyen 		if (shift_dq + (int32_t)temp_dq_out1_delay >
29763da42859SDinh Nguyen 			(int32_t)IO_IO_OUT1_DELAY_MAX) {
29773da42859SDinh Nguyen 			shift_dq = (int32_t)IO_IO_OUT1_DELAY_MAX - temp_dq_out1_delay;
29783da42859SDinh Nguyen 		} else if (shift_dq + (int32_t)temp_dq_out1_delay < 0) {
29793da42859SDinh Nguyen 			shift_dq = -(int32_t)temp_dq_out1_delay;
29803da42859SDinh Nguyen 		}
29813da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center: after: shift_dq[%u]=%d\n",
29823da42859SDinh Nguyen 			   i, shift_dq);
29833da42859SDinh Nguyen 		scc_mgr_set_dq_out1_delay(write_group, i, temp_dq_out1_delay +
29843da42859SDinh Nguyen 					  shift_dq);
29853da42859SDinh Nguyen 		scc_mgr_load_dq(i);
29863da42859SDinh Nguyen 
29873da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center: margin[%u]=[%d,%d]\n", i,
29883da42859SDinh Nguyen 			   left_edge[i] - shift_dq + (-mid_min),
29893da42859SDinh Nguyen 			   right_edge[i] + shift_dq - (-mid_min));
29903da42859SDinh Nguyen 		/* To determine values for export structures */
29913da42859SDinh Nguyen 		if (left_edge[i] - shift_dq + (-mid_min) < dq_margin)
29923da42859SDinh Nguyen 			dq_margin = left_edge[i] - shift_dq + (-mid_min);
29933da42859SDinh Nguyen 
29943da42859SDinh Nguyen 		if (right_edge[i] + shift_dq - (-mid_min) < dqs_margin)
29953da42859SDinh Nguyen 			dqs_margin = right_edge[i] + shift_dq - (-mid_min);
29963da42859SDinh Nguyen 	}
29973da42859SDinh Nguyen 
29983da42859SDinh Nguyen 	/* Move DQS */
29993da42859SDinh Nguyen 	scc_mgr_apply_group_dqs_io_and_oct_out1(write_group, new_dqs);
3000*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
30013da42859SDinh Nguyen 
30023da42859SDinh Nguyen 	/* Centre DM */
30033da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d write_center: DM\n", __func__, __LINE__);
30043da42859SDinh Nguyen 
30053da42859SDinh Nguyen 	/*
30063da42859SDinh Nguyen 	 * set the left and right edge of each bit to an illegal value,
30073da42859SDinh Nguyen 	 * use (IO_IO_OUT1_DELAY_MAX + 1) as an illegal value,
30083da42859SDinh Nguyen 	 */
30093da42859SDinh Nguyen 	left_edge[0]  = IO_IO_OUT1_DELAY_MAX + 1;
30103da42859SDinh Nguyen 	right_edge[0] = IO_IO_OUT1_DELAY_MAX + 1;
30113da42859SDinh Nguyen 	int32_t bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
30123da42859SDinh Nguyen 	int32_t end_curr = IO_IO_OUT1_DELAY_MAX + 1;
30133da42859SDinh Nguyen 	int32_t bgn_best = IO_IO_OUT1_DELAY_MAX + 1;
30143da42859SDinh Nguyen 	int32_t end_best = IO_IO_OUT1_DELAY_MAX + 1;
30153da42859SDinh Nguyen 	int32_t win_best = 0;
30163da42859SDinh Nguyen 
30173da42859SDinh Nguyen 	/* Search for the/part of the window with DM shift */
30183da42859SDinh Nguyen 	for (d = IO_IO_OUT1_DELAY_MAX; d >= 0; d -= DELTA_D) {
30193da42859SDinh Nguyen 		scc_mgr_apply_group_dm_out1_delay(write_group, d);
3020*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
30213da42859SDinh Nguyen 
30223da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_write_test(rank_bgn, write_group, 1,
30233da42859SDinh Nguyen 						    PASS_ALL_BITS, &bit_chk,
30243da42859SDinh Nguyen 						    0)) {
30253da42859SDinh Nguyen 			/* USE Set current end of the window */
30263da42859SDinh Nguyen 			end_curr = -d;
30273da42859SDinh Nguyen 			/*
30283da42859SDinh Nguyen 			 * If a starting edge of our window has not been seen
30293da42859SDinh Nguyen 			 * this is our current start of the DM window.
30303da42859SDinh Nguyen 			 */
30313da42859SDinh Nguyen 			if (bgn_curr == IO_IO_OUT1_DELAY_MAX + 1)
30323da42859SDinh Nguyen 				bgn_curr = -d;
30333da42859SDinh Nguyen 
30343da42859SDinh Nguyen 			/*
30353da42859SDinh Nguyen 			 * If current window is bigger than best seen.
30363da42859SDinh Nguyen 			 * Set best seen to be current window.
30373da42859SDinh Nguyen 			 */
30383da42859SDinh Nguyen 			if ((end_curr-bgn_curr+1) > win_best) {
30393da42859SDinh Nguyen 				win_best = end_curr-bgn_curr+1;
30403da42859SDinh Nguyen 				bgn_best = bgn_curr;
30413da42859SDinh Nguyen 				end_best = end_curr;
30423da42859SDinh Nguyen 			}
30433da42859SDinh Nguyen 		} else {
30443da42859SDinh Nguyen 			/* We just saw a failing test. Reset temp edge */
30453da42859SDinh Nguyen 			bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
30463da42859SDinh Nguyen 			end_curr = IO_IO_OUT1_DELAY_MAX + 1;
30473da42859SDinh Nguyen 			}
30483da42859SDinh Nguyen 		}
30493da42859SDinh Nguyen 
30503da42859SDinh Nguyen 
30513da42859SDinh Nguyen 	/* Reset DM delay chains to 0 */
30523da42859SDinh Nguyen 	scc_mgr_apply_group_dm_out1_delay(write_group, 0);
30533da42859SDinh Nguyen 
30543da42859SDinh Nguyen 	/*
30553da42859SDinh Nguyen 	 * Check to see if the current window nudges up aganist 0 delay.
30563da42859SDinh Nguyen 	 * If so we need to continue the search by shifting DQS otherwise DQS
30573da42859SDinh Nguyen 	 * search begins as a new search. */
30583da42859SDinh Nguyen 	if (end_curr != 0) {
30593da42859SDinh Nguyen 		bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
30603da42859SDinh Nguyen 		end_curr = IO_IO_OUT1_DELAY_MAX + 1;
30613da42859SDinh Nguyen 	}
30623da42859SDinh Nguyen 
30633da42859SDinh Nguyen 	/* Search for the/part of the window with DQS shifts */
30643da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_OUT1_DELAY_MAX - new_dqs; d += DELTA_D) {
30653da42859SDinh Nguyen 		/*
30663da42859SDinh Nguyen 		 * Note: This only shifts DQS, so are we limiting ourselve to
30673da42859SDinh Nguyen 		 * width of DQ unnecessarily.
30683da42859SDinh Nguyen 		 */
30693da42859SDinh Nguyen 		scc_mgr_apply_group_dqs_io_and_oct_out1(write_group,
30703da42859SDinh Nguyen 							d + new_dqs);
30713da42859SDinh Nguyen 
3072*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
30733da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_write_test(rank_bgn, write_group, 1,
30743da42859SDinh Nguyen 						    PASS_ALL_BITS, &bit_chk,
30753da42859SDinh Nguyen 						    0)) {
30763da42859SDinh Nguyen 			/* USE Set current end of the window */
30773da42859SDinh Nguyen 			end_curr = d;
30783da42859SDinh Nguyen 			/*
30793da42859SDinh Nguyen 			 * If a beginning edge of our window has not been seen
30803da42859SDinh Nguyen 			 * this is our current begin of the DM window.
30813da42859SDinh Nguyen 			 */
30823da42859SDinh Nguyen 			if (bgn_curr == IO_IO_OUT1_DELAY_MAX + 1)
30833da42859SDinh Nguyen 				bgn_curr = d;
30843da42859SDinh Nguyen 
30853da42859SDinh Nguyen 			/*
30863da42859SDinh Nguyen 			 * If current window is bigger than best seen. Set best
30873da42859SDinh Nguyen 			 * seen to be current window.
30883da42859SDinh Nguyen 			 */
30893da42859SDinh Nguyen 			if ((end_curr-bgn_curr+1) > win_best) {
30903da42859SDinh Nguyen 				win_best = end_curr-bgn_curr+1;
30913da42859SDinh Nguyen 				bgn_best = bgn_curr;
30923da42859SDinh Nguyen 				end_best = end_curr;
30933da42859SDinh Nguyen 			}
30943da42859SDinh Nguyen 		} else {
30953da42859SDinh Nguyen 			/* We just saw a failing test. Reset temp edge */
30963da42859SDinh Nguyen 			bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
30973da42859SDinh Nguyen 			end_curr = IO_IO_OUT1_DELAY_MAX + 1;
30983da42859SDinh Nguyen 
30993da42859SDinh Nguyen 			/* Early exit optimization: if ther remaining delay
31003da42859SDinh Nguyen 			chain space is less than already seen largest window
31013da42859SDinh Nguyen 			we can exit */
31023da42859SDinh Nguyen 			if ((win_best-1) >
31033da42859SDinh Nguyen 				(IO_IO_OUT1_DELAY_MAX - new_dqs - d)) {
31043da42859SDinh Nguyen 					break;
31053da42859SDinh Nguyen 				}
31063da42859SDinh Nguyen 			}
31073da42859SDinh Nguyen 		}
31083da42859SDinh Nguyen 
31093da42859SDinh Nguyen 	/* assign left and right edge for cal and reporting; */
31103da42859SDinh Nguyen 	left_edge[0] = -1*bgn_best;
31113da42859SDinh Nguyen 	right_edge[0] = end_best;
31123da42859SDinh Nguyen 
31133da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d dm_calib: left=%d right=%d\n", __func__,
31143da42859SDinh Nguyen 		   __LINE__, left_edge[0], right_edge[0]);
31153da42859SDinh Nguyen 
31163da42859SDinh Nguyen 	/* Move DQS (back to orig) */
31173da42859SDinh Nguyen 	scc_mgr_apply_group_dqs_io_and_oct_out1(write_group, new_dqs);
31183da42859SDinh Nguyen 
31193da42859SDinh Nguyen 	/* Move DM */
31203da42859SDinh Nguyen 
31213da42859SDinh Nguyen 	/* Find middle of window for the DM bit */
31223da42859SDinh Nguyen 	mid = (left_edge[0] - right_edge[0]) / 2;
31233da42859SDinh Nguyen 
31243da42859SDinh Nguyen 	/* only move right, since we are not moving DQS/DQ */
31253da42859SDinh Nguyen 	if (mid < 0)
31263da42859SDinh Nguyen 		mid = 0;
31273da42859SDinh Nguyen 
31283da42859SDinh Nguyen 	/* dm_marign should fail if we never find a window */
31293da42859SDinh Nguyen 	if (win_best == 0)
31303da42859SDinh Nguyen 		dm_margin = -1;
31313da42859SDinh Nguyen 	else
31323da42859SDinh Nguyen 		dm_margin = left_edge[0] - mid;
31333da42859SDinh Nguyen 
31343da42859SDinh Nguyen 	scc_mgr_apply_group_dm_out1_delay(write_group, mid);
3135*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
31363da42859SDinh Nguyen 
31373da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d dm_calib: left=%d right=%d mid=%d \
31383da42859SDinh Nguyen 		   dm_margin=%d\n", __func__, __LINE__, left_edge[0],
31393da42859SDinh Nguyen 		   right_edge[0], mid, dm_margin);
31403da42859SDinh Nguyen 	/* Export values */
31413da42859SDinh Nguyen 	gbl->fom_out += dq_margin + dqs_margin;
31423da42859SDinh Nguyen 
31433da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d write_center: dq_margin=%d \
31443da42859SDinh Nguyen 		   dqs_margin=%d dm_margin=%d\n", __func__, __LINE__,
31453da42859SDinh Nguyen 		   dq_margin, dqs_margin, dm_margin);
31463da42859SDinh Nguyen 
31473da42859SDinh Nguyen 	/*
31483da42859SDinh Nguyen 	 * Do not remove this line as it makes sure all of our
31493da42859SDinh Nguyen 	 * decisions have been applied.
31503da42859SDinh Nguyen 	 */
3151*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
31523da42859SDinh Nguyen 	return (dq_margin >= 0) && (dqs_margin >= 0) && (dm_margin >= 0);
31533da42859SDinh Nguyen }
31543da42859SDinh Nguyen 
31553da42859SDinh Nguyen /* calibrate the write operations */
31563da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_writes(uint32_t rank_bgn, uint32_t g,
31573da42859SDinh Nguyen 	uint32_t test_bgn)
31583da42859SDinh Nguyen {
31593da42859SDinh Nguyen 	/* update info for sims */
31603da42859SDinh Nguyen 	debug("%s:%d %u %u\n", __func__, __LINE__, g, test_bgn);
31613da42859SDinh Nguyen 
31623da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_WRITES);
31633da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_WRITES_CENTER);
31643da42859SDinh Nguyen 
31653da42859SDinh Nguyen 	reg_file_set_group(g);
31663da42859SDinh Nguyen 
31673da42859SDinh Nguyen 	if (!rw_mgr_mem_calibrate_writes_center(rank_bgn, g, test_bgn)) {
31683da42859SDinh Nguyen 		set_failing_group_stage(g, CAL_STAGE_WRITES,
31693da42859SDinh Nguyen 					CAL_SUBSTAGE_WRITES_CENTER);
31703da42859SDinh Nguyen 		return 0;
31713da42859SDinh Nguyen 	}
31723da42859SDinh Nguyen 
31733da42859SDinh Nguyen 	return 1;
31743da42859SDinh Nguyen }
31753da42859SDinh Nguyen 
31763da42859SDinh Nguyen /* precharge all banks and activate row 0 in bank "000..." and bank "111..." */
31773da42859SDinh Nguyen static void mem_precharge_and_activate(void)
31783da42859SDinh Nguyen {
31793da42859SDinh Nguyen 	uint32_t r;
31803da42859SDinh Nguyen 
31813da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r++) {
31823da42859SDinh Nguyen 		if (param->skip_ranks[r]) {
31833da42859SDinh Nguyen 			/* request to skip the rank */
31843da42859SDinh Nguyen 			continue;
31853da42859SDinh Nguyen 		}
31863da42859SDinh Nguyen 
31873da42859SDinh Nguyen 		/* set rank */
31883da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_OFF);
31893da42859SDinh Nguyen 
31903da42859SDinh Nguyen 		/* precharge all banks ... */
3191*1273dd9eSMarek Vasut 		writel(RW_MGR_PRECHARGE_ALL, SDR_PHYGRP_RWMGRGRP_ADDRESS |
3192*1273dd9eSMarek Vasut 					     RW_MGR_RUN_SINGLE_GROUP_OFFSET);
31933da42859SDinh Nguyen 
3194*1273dd9eSMarek Vasut 		writel(0x0F, &sdr_rw_load_mgr_regs->load_cntr0);
3195*1273dd9eSMarek Vasut 		writel(RW_MGR_ACTIVATE_0_AND_1_WAIT1,
3196*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add0);
31973da42859SDinh Nguyen 
3198*1273dd9eSMarek Vasut 		writel(0x0F, &sdr_rw_load_mgr_regs->load_cntr1);
3199*1273dd9eSMarek Vasut 		writel(RW_MGR_ACTIVATE_0_AND_1_WAIT2,
3200*1273dd9eSMarek Vasut 			&sdr_rw_load_jump_mgr_regs->load_jump_add1);
32013da42859SDinh Nguyen 
32023da42859SDinh Nguyen 		/* activate rows */
3203*1273dd9eSMarek Vasut 		writel(RW_MGR_ACTIVATE_0_AND_1, SDR_PHYGRP_RWMGRGRP_ADDRESS |
3204*1273dd9eSMarek Vasut 						RW_MGR_RUN_SINGLE_GROUP_OFFSET);
32053da42859SDinh Nguyen 	}
32063da42859SDinh Nguyen }
32073da42859SDinh Nguyen 
32083da42859SDinh Nguyen /* Configure various memory related parameters. */
32093da42859SDinh Nguyen static void mem_config(void)
32103da42859SDinh Nguyen {
32113da42859SDinh Nguyen 	uint32_t rlat, wlat;
32123da42859SDinh Nguyen 	uint32_t rw_wl_nop_cycles;
32133da42859SDinh Nguyen 	uint32_t max_latency;
32143da42859SDinh Nguyen 
32153da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
32163da42859SDinh Nguyen 	/* read in write and read latency */
3217*1273dd9eSMarek Vasut 	wlat = readl(&data_mgr->t_wl_add);
3218*1273dd9eSMarek Vasut 	wlat += readl(&data_mgr->mem_t_add);
32193da42859SDinh Nguyen 
32203da42859SDinh Nguyen 	/* WL for hard phy does not include additive latency */
32213da42859SDinh Nguyen 
32223da42859SDinh Nguyen 	/*
32233da42859SDinh Nguyen 	 * add addtional write latency to offset the address/command extra
32243da42859SDinh Nguyen 	 * clock cycle. We change the AC mux setting causing AC to be delayed
32253da42859SDinh Nguyen 	 * by one mem clock cycle. Only do this for DDR3
32263da42859SDinh Nguyen 	 */
32273da42859SDinh Nguyen 	wlat = wlat + 1;
32283da42859SDinh Nguyen 
3229*1273dd9eSMarek Vasut 	rlat = readl(&data_mgr->t_rl_add);
32303da42859SDinh Nguyen 
32313da42859SDinh Nguyen 	rw_wl_nop_cycles = wlat - 2;
32323da42859SDinh Nguyen 	gbl->rw_wl_nop_cycles = rw_wl_nop_cycles;
32333da42859SDinh Nguyen 
32343da42859SDinh Nguyen 	/*
32353da42859SDinh Nguyen 	 * For AV/CV, lfifo is hardened and always runs at full rate so
32363da42859SDinh Nguyen 	 * max latency in AFI clocks, used here, is correspondingly smaller.
32373da42859SDinh Nguyen 	 */
32383da42859SDinh Nguyen 	max_latency = (1<<MAX_LATENCY_COUNT_WIDTH)/1 - 1;
32393da42859SDinh Nguyen 	/* configure for a burst length of 8 */
32403da42859SDinh Nguyen 
32413da42859SDinh Nguyen 	/* write latency */
32423da42859SDinh Nguyen 	/* Adjust Write Latency for Hard PHY */
32433da42859SDinh Nguyen 	wlat = wlat + 1;
32443da42859SDinh Nguyen 
32453da42859SDinh Nguyen 	/* set a pretty high read latency initially */
32463da42859SDinh Nguyen 	gbl->curr_read_lat = rlat + 16;
32473da42859SDinh Nguyen 
32483da42859SDinh Nguyen 	if (gbl->curr_read_lat > max_latency)
32493da42859SDinh Nguyen 		gbl->curr_read_lat = max_latency;
32503da42859SDinh Nguyen 
3251*1273dd9eSMarek Vasut 	writel(gbl->curr_read_lat, &phy_mgr_cfg->phy_rlat);
32523da42859SDinh Nguyen 
32533da42859SDinh Nguyen 	/* advertise write latency */
32543da42859SDinh Nguyen 	gbl->curr_write_lat = wlat;
3255*1273dd9eSMarek Vasut 	writel(wlat - 2, &phy_mgr_cfg->afi_wlat);
32563da42859SDinh Nguyen 
32573da42859SDinh Nguyen 	/* initialize bit slips */
32583da42859SDinh Nguyen 	mem_precharge_and_activate();
32593da42859SDinh Nguyen }
32603da42859SDinh Nguyen 
32613da42859SDinh Nguyen /* Set VFIFO and LFIFO to instant-on settings in skip calibration mode */
32623da42859SDinh Nguyen static void mem_skip_calibrate(void)
32633da42859SDinh Nguyen {
32643da42859SDinh Nguyen 	uint32_t vfifo_offset;
32653da42859SDinh Nguyen 	uint32_t i, j, r;
32663da42859SDinh Nguyen 
32673da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
32683da42859SDinh Nguyen 	/* Need to update every shadow register set used by the interface */
32693da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
32703da42859SDinh Nguyen 		r += NUM_RANKS_PER_SHADOW_REG) {
32713da42859SDinh Nguyen 		/*
32723da42859SDinh Nguyen 		 * Set output phase alignment settings appropriate for
32733da42859SDinh Nguyen 		 * skip calibration.
32743da42859SDinh Nguyen 		 */
32753da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
32763da42859SDinh Nguyen 			scc_mgr_set_dqs_en_phase(i, 0);
32773da42859SDinh Nguyen #if IO_DLL_CHAIN_LENGTH == 6
32783da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, 6);
32793da42859SDinh Nguyen #else
32803da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, 7);
32813da42859SDinh Nguyen #endif
32823da42859SDinh Nguyen 			/*
32833da42859SDinh Nguyen 			 * Case:33398
32843da42859SDinh Nguyen 			 *
32853da42859SDinh Nguyen 			 * Write data arrives to the I/O two cycles before write
32863da42859SDinh Nguyen 			 * latency is reached (720 deg).
32873da42859SDinh Nguyen 			 *   -> due to bit-slip in a/c bus
32883da42859SDinh Nguyen 			 *   -> to allow board skew where dqs is longer than ck
32893da42859SDinh Nguyen 			 *      -> how often can this happen!?
32903da42859SDinh Nguyen 			 *      -> can claim back some ptaps for high freq
32913da42859SDinh Nguyen 			 *       support if we can relax this, but i digress...
32923da42859SDinh Nguyen 			 *
32933da42859SDinh Nguyen 			 * The write_clk leads mem_ck by 90 deg
32943da42859SDinh Nguyen 			 * The minimum ptap of the OPA is 180 deg
32953da42859SDinh Nguyen 			 * Each ptap has (360 / IO_DLL_CHAIN_LENGH) deg of delay
32963da42859SDinh Nguyen 			 * The write_clk is always delayed by 2 ptaps
32973da42859SDinh Nguyen 			 *
32983da42859SDinh Nguyen 			 * Hence, to make DQS aligned to CK, we need to delay
32993da42859SDinh Nguyen 			 * DQS by:
33003da42859SDinh Nguyen 			 *    (720 - 90 - 180 - 2 * (360 / IO_DLL_CHAIN_LENGTH))
33013da42859SDinh Nguyen 			 *
33023da42859SDinh Nguyen 			 * Dividing the above by (360 / IO_DLL_CHAIN_LENGTH)
33033da42859SDinh Nguyen 			 * gives us the number of ptaps, which simplies to:
33043da42859SDinh Nguyen 			 *
33053da42859SDinh Nguyen 			 *    (1.25 * IO_DLL_CHAIN_LENGTH - 2)
33063da42859SDinh Nguyen 			 */
33073da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, (1.25 *
33083da42859SDinh Nguyen 				IO_DLL_CHAIN_LENGTH - 2));
33093da42859SDinh Nguyen 		}
3310*1273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dqs_ena);
3311*1273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dqs_io_ena);
33123da42859SDinh Nguyen 
33133da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_WRITE_DQS_WIDTH; i++) {
3314*1273dd9eSMarek Vasut 			writel(i, SDR_PHYGRP_SCCGRP_ADDRESS |
3315*1273dd9eSMarek Vasut 				  SCC_MGR_GROUP_COUNTER_OFFSET);
33163da42859SDinh Nguyen 		}
3317*1273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dq_ena);
3318*1273dd9eSMarek Vasut 		writel(0xff, &sdr_scc_mgr->dm_ena);
3319*1273dd9eSMarek Vasut 		writel(0, &sdr_scc_mgr->update);
33203da42859SDinh Nguyen 	}
33213da42859SDinh Nguyen 
33223da42859SDinh Nguyen 	/* Compensate for simulation model behaviour */
33233da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
33243da42859SDinh Nguyen 		scc_mgr_set_dqs_bus_in_delay(i, 10);
33253da42859SDinh Nguyen 		scc_mgr_load_dqs(i);
33263da42859SDinh Nguyen 	}
3327*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
33283da42859SDinh Nguyen 
33293da42859SDinh Nguyen 	/*
33303da42859SDinh Nguyen 	 * ArriaV has hard FIFOs that can only be initialized by incrementing
33313da42859SDinh Nguyen 	 * in sequencer.
33323da42859SDinh Nguyen 	 */
33333da42859SDinh Nguyen 	vfifo_offset = CALIB_VFIFO_OFFSET;
33343da42859SDinh Nguyen 	for (j = 0; j < vfifo_offset; j++) {
3335*1273dd9eSMarek Vasut 		writel(0xff, &phy_mgr_cmd->inc_vfifo_hard_phy);
33363da42859SDinh Nguyen 	}
3337*1273dd9eSMarek Vasut 	writel(0, &phy_mgr_cmd->fifo_reset);
33383da42859SDinh Nguyen 
33393da42859SDinh Nguyen 	/*
33403da42859SDinh Nguyen 	 * For ACV with hard lfifo, we get the skip-cal setting from
33413da42859SDinh Nguyen 	 * generation-time constant.
33423da42859SDinh Nguyen 	 */
33433da42859SDinh Nguyen 	gbl->curr_read_lat = CALIB_LFIFO_OFFSET;
3344*1273dd9eSMarek Vasut 	writel(gbl->curr_read_lat, &phy_mgr_cfg->phy_rlat);
33453da42859SDinh Nguyen }
33463da42859SDinh Nguyen 
33473da42859SDinh Nguyen /* Memory calibration entry point */
33483da42859SDinh Nguyen static uint32_t mem_calibrate(void)
33493da42859SDinh Nguyen {
33503da42859SDinh Nguyen 	uint32_t i;
33513da42859SDinh Nguyen 	uint32_t rank_bgn, sr;
33523da42859SDinh Nguyen 	uint32_t write_group, write_test_bgn;
33533da42859SDinh Nguyen 	uint32_t read_group, read_test_bgn;
33543da42859SDinh Nguyen 	uint32_t run_groups, current_run;
33553da42859SDinh Nguyen 	uint32_t failing_groups = 0;
33563da42859SDinh Nguyen 	uint32_t group_failed = 0;
33573da42859SDinh Nguyen 	uint32_t sr_failed = 0;
33583da42859SDinh Nguyen 
33593da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
33603da42859SDinh Nguyen 	/* Initialize the data settings */
33613da42859SDinh Nguyen 
33623da42859SDinh Nguyen 	gbl->error_substage = CAL_SUBSTAGE_NIL;
33633da42859SDinh Nguyen 	gbl->error_stage = CAL_STAGE_NIL;
33643da42859SDinh Nguyen 	gbl->error_group = 0xff;
33653da42859SDinh Nguyen 	gbl->fom_in = 0;
33663da42859SDinh Nguyen 	gbl->fom_out = 0;
33673da42859SDinh Nguyen 
33683da42859SDinh Nguyen 	mem_config();
33693da42859SDinh Nguyen 
33703da42859SDinh Nguyen 	uint32_t bypass_mode = 0x1;
33713da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
3372*1273dd9eSMarek Vasut 		writel(i, SDR_PHYGRP_SCCGRP_ADDRESS |
3373*1273dd9eSMarek Vasut 			  SCC_MGR_GROUP_COUNTER_OFFSET);
33743da42859SDinh Nguyen 		scc_set_bypass_mode(i, bypass_mode);
33753da42859SDinh Nguyen 	}
33763da42859SDinh Nguyen 
33773da42859SDinh Nguyen 	if ((dyn_calib_steps & CALIB_SKIP_ALL) == CALIB_SKIP_ALL) {
33783da42859SDinh Nguyen 		/*
33793da42859SDinh Nguyen 		 * Set VFIFO and LFIFO to instant-on settings in skip
33803da42859SDinh Nguyen 		 * calibration mode.
33813da42859SDinh Nguyen 		 */
33823da42859SDinh Nguyen 		mem_skip_calibrate();
33833da42859SDinh Nguyen 	} else {
33843da42859SDinh Nguyen 		for (i = 0; i < NUM_CALIB_REPEAT; i++) {
33853da42859SDinh Nguyen 			/*
33863da42859SDinh Nguyen 			 * Zero all delay chain/phase settings for all
33873da42859SDinh Nguyen 			 * groups and all shadow register sets.
33883da42859SDinh Nguyen 			 */
33893da42859SDinh Nguyen 			scc_mgr_zero_all();
33903da42859SDinh Nguyen 
33913da42859SDinh Nguyen 			run_groups = ~param->skip_groups;
33923da42859SDinh Nguyen 
33933da42859SDinh Nguyen 			for (write_group = 0, write_test_bgn = 0; write_group
33943da42859SDinh Nguyen 				< RW_MGR_MEM_IF_WRITE_DQS_WIDTH; write_group++,
33953da42859SDinh Nguyen 				write_test_bgn += RW_MGR_MEM_DQ_PER_WRITE_DQS) {
33963da42859SDinh Nguyen 				/* Initialized the group failure */
33973da42859SDinh Nguyen 				group_failed = 0;
33983da42859SDinh Nguyen 
33993da42859SDinh Nguyen 				current_run = run_groups & ((1 <<
34003da42859SDinh Nguyen 					RW_MGR_NUM_DQS_PER_WRITE_GROUP) - 1);
34013da42859SDinh Nguyen 				run_groups = run_groups >>
34023da42859SDinh Nguyen 					RW_MGR_NUM_DQS_PER_WRITE_GROUP;
34033da42859SDinh Nguyen 
34043da42859SDinh Nguyen 				if (current_run == 0)
34053da42859SDinh Nguyen 					continue;
34063da42859SDinh Nguyen 
3407*1273dd9eSMarek Vasut 				writel(write_group, SDR_PHYGRP_SCCGRP_ADDRESS |
3408*1273dd9eSMarek Vasut 						    SCC_MGR_GROUP_COUNTER_OFFSET);
34093da42859SDinh Nguyen 				scc_mgr_zero_group(write_group, write_test_bgn,
34103da42859SDinh Nguyen 						   0);
34113da42859SDinh Nguyen 
34123da42859SDinh Nguyen 				for (read_group = write_group *
34133da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
34143da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH,
34153da42859SDinh Nguyen 					read_test_bgn = 0;
34163da42859SDinh Nguyen 					read_group < (write_group + 1) *
34173da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
34183da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH &&
34193da42859SDinh Nguyen 					group_failed == 0;
34203da42859SDinh Nguyen 					read_group++, read_test_bgn +=
34213da42859SDinh Nguyen 					RW_MGR_MEM_DQ_PER_READ_DQS) {
34223da42859SDinh Nguyen 					/* Calibrate the VFIFO */
34233da42859SDinh Nguyen 					if (!((STATIC_CALIB_STEPS) &
34243da42859SDinh Nguyen 						CALIB_SKIP_VFIFO)) {
34253da42859SDinh Nguyen 						if (!rw_mgr_mem_calibrate_vfifo
34263da42859SDinh Nguyen 							(read_group,
34273da42859SDinh Nguyen 							read_test_bgn)) {
34283da42859SDinh Nguyen 							group_failed = 1;
34293da42859SDinh Nguyen 
34303da42859SDinh Nguyen 							if (!(gbl->
34313da42859SDinh Nguyen 							phy_debug_mode_flags &
34323da42859SDinh Nguyen 						PHY_DEBUG_SWEEP_ALL_GROUPS)) {
34333da42859SDinh Nguyen 								return 0;
34343da42859SDinh Nguyen 							}
34353da42859SDinh Nguyen 						}
34363da42859SDinh Nguyen 					}
34373da42859SDinh Nguyen 				}
34383da42859SDinh Nguyen 
34393da42859SDinh Nguyen 				/* Calibrate the output side */
34403da42859SDinh Nguyen 				if (group_failed == 0)	{
34413da42859SDinh Nguyen 					for (rank_bgn = 0, sr = 0; rank_bgn
34423da42859SDinh Nguyen 						< RW_MGR_MEM_NUMBER_OF_RANKS;
34433da42859SDinh Nguyen 						rank_bgn +=
34443da42859SDinh Nguyen 						NUM_RANKS_PER_SHADOW_REG,
34453da42859SDinh Nguyen 						++sr) {
34463da42859SDinh Nguyen 						sr_failed = 0;
34473da42859SDinh Nguyen 						if (!((STATIC_CALIB_STEPS) &
34483da42859SDinh Nguyen 						CALIB_SKIP_WRITES)) {
34493da42859SDinh Nguyen 							if ((STATIC_CALIB_STEPS)
34503da42859SDinh Nguyen 						& CALIB_SKIP_DELAY_SWEEPS) {
34513da42859SDinh Nguyen 						/* not needed in quick mode! */
34523da42859SDinh Nguyen 							} else {
34533da42859SDinh Nguyen 						/*
34543da42859SDinh Nguyen 						 * Determine if this set of
34553da42859SDinh Nguyen 						 * ranks should be skipped
34563da42859SDinh Nguyen 						 * entirely.
34573da42859SDinh Nguyen 						 */
34583da42859SDinh Nguyen 					if (!param->skip_shadow_regs[sr]) {
34593da42859SDinh Nguyen 						if (!rw_mgr_mem_calibrate_writes
34603da42859SDinh Nguyen 						(rank_bgn, write_group,
34613da42859SDinh Nguyen 						write_test_bgn)) {
34623da42859SDinh Nguyen 							sr_failed = 1;
34633da42859SDinh Nguyen 							if (!(gbl->
34643da42859SDinh Nguyen 							phy_debug_mode_flags &
34653da42859SDinh Nguyen 						PHY_DEBUG_SWEEP_ALL_GROUPS)) {
34663da42859SDinh Nguyen 								return 0;
34673da42859SDinh Nguyen 									}
34683da42859SDinh Nguyen 									}
34693da42859SDinh Nguyen 								}
34703da42859SDinh Nguyen 							}
34713da42859SDinh Nguyen 						}
34723da42859SDinh Nguyen 						if (sr_failed != 0)
34733da42859SDinh Nguyen 							group_failed = 1;
34743da42859SDinh Nguyen 					}
34753da42859SDinh Nguyen 				}
34763da42859SDinh Nguyen 
34773da42859SDinh Nguyen 				if (group_failed == 0) {
34783da42859SDinh Nguyen 					for (read_group = write_group *
34793da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
34803da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH,
34813da42859SDinh Nguyen 					read_test_bgn = 0;
34823da42859SDinh Nguyen 						read_group < (write_group + 1)
34833da42859SDinh Nguyen 						* RW_MGR_MEM_IF_READ_DQS_WIDTH
34843da42859SDinh Nguyen 						/ RW_MGR_MEM_IF_WRITE_DQS_WIDTH &&
34853da42859SDinh Nguyen 						group_failed == 0;
34863da42859SDinh Nguyen 						read_group++, read_test_bgn +=
34873da42859SDinh Nguyen 						RW_MGR_MEM_DQ_PER_READ_DQS) {
34883da42859SDinh Nguyen 						if (!((STATIC_CALIB_STEPS) &
34893da42859SDinh Nguyen 							CALIB_SKIP_WRITES)) {
34903da42859SDinh Nguyen 					if (!rw_mgr_mem_calibrate_vfifo_end
34913da42859SDinh Nguyen 						(read_group, read_test_bgn)) {
34923da42859SDinh Nguyen 							group_failed = 1;
34933da42859SDinh Nguyen 
34943da42859SDinh Nguyen 						if (!(gbl->phy_debug_mode_flags
34953da42859SDinh Nguyen 						& PHY_DEBUG_SWEEP_ALL_GROUPS)) {
34963da42859SDinh Nguyen 								return 0;
34973da42859SDinh Nguyen 								}
34983da42859SDinh Nguyen 							}
34993da42859SDinh Nguyen 						}
35003da42859SDinh Nguyen 					}
35013da42859SDinh Nguyen 				}
35023da42859SDinh Nguyen 
35033da42859SDinh Nguyen 				if (group_failed != 0)
35043da42859SDinh Nguyen 					failing_groups++;
35053da42859SDinh Nguyen 			}
35063da42859SDinh Nguyen 
35073da42859SDinh Nguyen 			/*
35083da42859SDinh Nguyen 			 * USER If there are any failing groups then report
35093da42859SDinh Nguyen 			 * the failure.
35103da42859SDinh Nguyen 			 */
35113da42859SDinh Nguyen 			if (failing_groups != 0)
35123da42859SDinh Nguyen 				return 0;
35133da42859SDinh Nguyen 
35143da42859SDinh Nguyen 			/* Calibrate the LFIFO */
35153da42859SDinh Nguyen 			if (!((STATIC_CALIB_STEPS) & CALIB_SKIP_LFIFO)) {
35163da42859SDinh Nguyen 				/*
35173da42859SDinh Nguyen 				 * If we're skipping groups as part of debug,
35183da42859SDinh Nguyen 				 * don't calibrate LFIFO.
35193da42859SDinh Nguyen 				 */
35203da42859SDinh Nguyen 				if (param->skip_groups == 0) {
35213da42859SDinh Nguyen 					if (!rw_mgr_mem_calibrate_lfifo())
35223da42859SDinh Nguyen 						return 0;
35233da42859SDinh Nguyen 				}
35243da42859SDinh Nguyen 			}
35253da42859SDinh Nguyen 		}
35263da42859SDinh Nguyen 	}
35273da42859SDinh Nguyen 
35283da42859SDinh Nguyen 	/*
35293da42859SDinh Nguyen 	 * Do not remove this line as it makes sure all of our decisions
35303da42859SDinh Nguyen 	 * have been applied.
35313da42859SDinh Nguyen 	 */
3532*1273dd9eSMarek Vasut 	writel(0, &sdr_scc_mgr->update);
35333da42859SDinh Nguyen 	return 1;
35343da42859SDinh Nguyen }
35353da42859SDinh Nguyen 
35363da42859SDinh Nguyen static uint32_t run_mem_calibrate(void)
35373da42859SDinh Nguyen {
35383da42859SDinh Nguyen 	uint32_t pass;
35393da42859SDinh Nguyen 	uint32_t debug_info;
35403da42859SDinh Nguyen 
35413da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
35423da42859SDinh Nguyen 
35433da42859SDinh Nguyen 	/* Reset pass/fail status shown on afi_cal_success/fail */
3544*1273dd9eSMarek Vasut 	writel(PHY_MGR_CAL_RESET, &phy_mgr_cfg->cal_status);
35453da42859SDinh Nguyen 
35463da42859SDinh Nguyen 	/* stop tracking manger */
35476cb9f167SMarek Vasut 	uint32_t ctrlcfg = readl(&sdr_ctrl->ctrl_cfg);
35483da42859SDinh Nguyen 
35496cb9f167SMarek Vasut 	writel(ctrlcfg & 0xFFBFFFFF, &sdr_ctrl->ctrl_cfg);
35503da42859SDinh Nguyen 
35513da42859SDinh Nguyen 	initialize();
35523da42859SDinh Nguyen 	rw_mgr_mem_initialize();
35533da42859SDinh Nguyen 
35543da42859SDinh Nguyen 	pass = mem_calibrate();
35553da42859SDinh Nguyen 
35563da42859SDinh Nguyen 	mem_precharge_and_activate();
3557*1273dd9eSMarek Vasut 	writel(0, &phy_mgr_cmd->fifo_reset);
35583da42859SDinh Nguyen 
35593da42859SDinh Nguyen 	/*
35603da42859SDinh Nguyen 	 * Handoff:
35613da42859SDinh Nguyen 	 * Don't return control of the PHY back to AFI when in debug mode.
35623da42859SDinh Nguyen 	 */
35633da42859SDinh Nguyen 	if ((gbl->phy_debug_mode_flags & PHY_DEBUG_IN_DEBUG_MODE) == 0) {
35643da42859SDinh Nguyen 		rw_mgr_mem_handoff();
35653da42859SDinh Nguyen 		/*
35663da42859SDinh Nguyen 		 * In Hard PHY this is a 2-bit control:
35673da42859SDinh Nguyen 		 * 0: AFI Mux Select
35683da42859SDinh Nguyen 		 * 1: DDIO Mux Select
35693da42859SDinh Nguyen 		 */
3570*1273dd9eSMarek Vasut 		writel(0x2, &phy_mgr_cfg->mux_sel);
35713da42859SDinh Nguyen 	}
35723da42859SDinh Nguyen 
35736cb9f167SMarek Vasut 	writel(ctrlcfg, &sdr_ctrl->ctrl_cfg);
35743da42859SDinh Nguyen 
35753da42859SDinh Nguyen 	if (pass) {
35763da42859SDinh Nguyen 		printf("%s: CALIBRATION PASSED\n", __FILE__);
35773da42859SDinh Nguyen 
35783da42859SDinh Nguyen 		gbl->fom_in /= 2;
35793da42859SDinh Nguyen 		gbl->fom_out /= 2;
35803da42859SDinh Nguyen 
35813da42859SDinh Nguyen 		if (gbl->fom_in > 0xff)
35823da42859SDinh Nguyen 			gbl->fom_in = 0xff;
35833da42859SDinh Nguyen 
35843da42859SDinh Nguyen 		if (gbl->fom_out > 0xff)
35853da42859SDinh Nguyen 			gbl->fom_out = 0xff;
35863da42859SDinh Nguyen 
35873da42859SDinh Nguyen 		/* Update the FOM in the register file */
35883da42859SDinh Nguyen 		debug_info = gbl->fom_in;
35893da42859SDinh Nguyen 		debug_info |= gbl->fom_out << 8;
3590*1273dd9eSMarek Vasut 		writel(debug_info, &sdr_reg_file->fom);
35913da42859SDinh Nguyen 
3592*1273dd9eSMarek Vasut 		writel(debug_info, &phy_mgr_cfg->cal_debug_info);
3593*1273dd9eSMarek Vasut 		writel(PHY_MGR_CAL_SUCCESS, &phy_mgr_cfg->cal_status);
35943da42859SDinh Nguyen 	} else {
35953da42859SDinh Nguyen 		printf("%s: CALIBRATION FAILED\n", __FILE__);
35963da42859SDinh Nguyen 
35973da42859SDinh Nguyen 		debug_info = gbl->error_stage;
35983da42859SDinh Nguyen 		debug_info |= gbl->error_substage << 8;
35993da42859SDinh Nguyen 		debug_info |= gbl->error_group << 16;
36003da42859SDinh Nguyen 
3601*1273dd9eSMarek Vasut 		writel(debug_info, &sdr_reg_file->failing_stage);
3602*1273dd9eSMarek Vasut 		writel(debug_info, &phy_mgr_cfg->cal_debug_info);
3603*1273dd9eSMarek Vasut 		writel(PHY_MGR_CAL_FAIL, &phy_mgr_cfg->cal_status);
36043da42859SDinh Nguyen 
36053da42859SDinh Nguyen 		/* Update the failing group/stage in the register file */
36063da42859SDinh Nguyen 		debug_info = gbl->error_stage;
36073da42859SDinh Nguyen 		debug_info |= gbl->error_substage << 8;
36083da42859SDinh Nguyen 		debug_info |= gbl->error_group << 16;
3609*1273dd9eSMarek Vasut 		writel(debug_info, &sdr_reg_file->failing_stage);
36103da42859SDinh Nguyen 	}
36113da42859SDinh Nguyen 
36123da42859SDinh Nguyen 	return pass;
36133da42859SDinh Nguyen }
36143da42859SDinh Nguyen 
36153da42859SDinh Nguyen static void hc_initialize_rom_data(void)
36163da42859SDinh Nguyen {
36173da42859SDinh Nguyen 	uint32_t i;
36183da42859SDinh Nguyen 	uint32_t addr;
36193da42859SDinh Nguyen 
3620c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_INST_ROM_WRITE_OFFSET;
36213da42859SDinh Nguyen 	for (i = 0; i < ARRAY_SIZE(inst_rom_init); i++) {
36223da42859SDinh Nguyen 		uint32_t data = inst_rom_init[i];
362317fdc916SMarek Vasut 		writel(data, addr + (i << 2));
36243da42859SDinh Nguyen 	}
36253da42859SDinh Nguyen 
3626c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_AC_ROM_WRITE_OFFSET;
36273da42859SDinh Nguyen 	for (i = 0; i < ARRAY_SIZE(ac_rom_init); i++) {
36283da42859SDinh Nguyen 		uint32_t data = ac_rom_init[i];
362917fdc916SMarek Vasut 		writel(data, addr + (i << 2));
36303da42859SDinh Nguyen 	}
36313da42859SDinh Nguyen }
36323da42859SDinh Nguyen 
36333da42859SDinh Nguyen static void initialize_reg_file(void)
36343da42859SDinh Nguyen {
36353da42859SDinh Nguyen 	/* Initialize the register file with the correct data */
3636*1273dd9eSMarek Vasut 	writel(REG_FILE_INIT_SEQ_SIGNATURE, &sdr_reg_file->signature);
3637*1273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->debug_data_addr);
3638*1273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->cur_stage);
3639*1273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->fom);
3640*1273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->failing_stage);
3641*1273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->debug1);
3642*1273dd9eSMarek Vasut 	writel(0, &sdr_reg_file->debug2);
36433da42859SDinh Nguyen }
36443da42859SDinh Nguyen 
36453da42859SDinh Nguyen static void initialize_hps_phy(void)
36463da42859SDinh Nguyen {
36473da42859SDinh Nguyen 	uint32_t reg;
36483da42859SDinh Nguyen 	/*
36493da42859SDinh Nguyen 	 * Tracking also gets configured here because it's in the
36503da42859SDinh Nguyen 	 * same register.
36513da42859SDinh Nguyen 	 */
36523da42859SDinh Nguyen 	uint32_t trk_sample_count = 7500;
36533da42859SDinh Nguyen 	uint32_t trk_long_idle_sample_count = (10 << 16) | 100;
36543da42859SDinh Nguyen 	/*
36553da42859SDinh Nguyen 	 * Format is number of outer loops in the 16 MSB, sample
36563da42859SDinh Nguyen 	 * count in 16 LSB.
36573da42859SDinh Nguyen 	 */
36583da42859SDinh Nguyen 
36593da42859SDinh Nguyen 	reg = 0;
36603da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_ACDELAYEN_SET(2);
36613da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_DQDELAYEN_SET(1);
36623da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_DQSDELAYEN_SET(1);
36633da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_DQSLOGICDELAYEN_SET(1);
36643da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_RESETDELAYEN_SET(0);
36653da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_LPDDRDIS_SET(1);
36663da42859SDinh Nguyen 	/*
36673da42859SDinh Nguyen 	 * This field selects the intrinsic latency to RDATA_EN/FULL path.
36683da42859SDinh Nguyen 	 * 00-bypass, 01- add 5 cycles, 10- add 10 cycles, 11- add 15 cycles.
36693da42859SDinh Nguyen 	 */
36703da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_ADDLATSEL_SET(0);
36713da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_SAMPLECOUNT_19_0_SET(
36723da42859SDinh Nguyen 		trk_sample_count);
36736cb9f167SMarek Vasut 	writel(reg, &sdr_ctrl->phy_ctrl0);
36743da42859SDinh Nguyen 
36753da42859SDinh Nguyen 	reg = 0;
36763da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_SAMPLECOUNT_31_20_SET(
36773da42859SDinh Nguyen 		trk_sample_count >>
36783da42859SDinh Nguyen 		SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_SAMPLECOUNT_19_0_WIDTH);
36793da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_LONGIDLESAMPLECOUNT_19_0_SET(
36803da42859SDinh Nguyen 		trk_long_idle_sample_count);
36816cb9f167SMarek Vasut 	writel(reg, &sdr_ctrl->phy_ctrl1);
36823da42859SDinh Nguyen 
36833da42859SDinh Nguyen 	reg = 0;
36843da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_2_LONGIDLESAMPLECOUNT_31_20_SET(
36853da42859SDinh Nguyen 		trk_long_idle_sample_count >>
36863da42859SDinh Nguyen 		SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_LONGIDLESAMPLECOUNT_19_0_WIDTH);
36876cb9f167SMarek Vasut 	writel(reg, &sdr_ctrl->phy_ctrl2);
36883da42859SDinh Nguyen }
36893da42859SDinh Nguyen 
36903da42859SDinh Nguyen static void initialize_tracking(void)
36913da42859SDinh Nguyen {
36923da42859SDinh Nguyen 	uint32_t concatenated_longidle = 0x0;
36933da42859SDinh Nguyen 	uint32_t concatenated_delays = 0x0;
36943da42859SDinh Nguyen 	uint32_t concatenated_rw_addr = 0x0;
36953da42859SDinh Nguyen 	uint32_t concatenated_refresh = 0x0;
36963da42859SDinh Nguyen 	uint32_t trk_sample_count = 7500;
36973da42859SDinh Nguyen 	uint32_t dtaps_per_ptap;
36983da42859SDinh Nguyen 	uint32_t tmp_delay;
36993da42859SDinh Nguyen 
37003da42859SDinh Nguyen 	/*
37013da42859SDinh Nguyen 	 * compute usable version of value in case we skip full
37023da42859SDinh Nguyen 	 * computation later
37033da42859SDinh Nguyen 	 */
37043da42859SDinh Nguyen 	dtaps_per_ptap = 0;
37053da42859SDinh Nguyen 	tmp_delay = 0;
37063da42859SDinh Nguyen 	while (tmp_delay < IO_DELAY_PER_OPA_TAP) {
37073da42859SDinh Nguyen 		dtaps_per_ptap++;
37083da42859SDinh Nguyen 		tmp_delay += IO_DELAY_PER_DCHAIN_TAP;
37093da42859SDinh Nguyen 	}
37103da42859SDinh Nguyen 	dtaps_per_ptap--;
37113da42859SDinh Nguyen 
37123da42859SDinh Nguyen 	concatenated_longidle = concatenated_longidle ^ 10;
37133da42859SDinh Nguyen 		/*longidle outer loop */
37143da42859SDinh Nguyen 	concatenated_longidle = concatenated_longidle << 16;
37153da42859SDinh Nguyen 	concatenated_longidle = concatenated_longidle ^ 100;
37163da42859SDinh Nguyen 		/*longidle sample count */
37173da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 243;
37183da42859SDinh Nguyen 		/* trfc, worst case of 933Mhz 4Gb */
37193da42859SDinh Nguyen 	concatenated_delays = concatenated_delays << 8;
37203da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 14;
37213da42859SDinh Nguyen 		/* trcd, worst case */
37223da42859SDinh Nguyen 	concatenated_delays = concatenated_delays << 8;
37233da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 10;
37243da42859SDinh Nguyen 		/* vfifo wait */
37253da42859SDinh Nguyen 	concatenated_delays = concatenated_delays << 8;
37263da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 4;
37273da42859SDinh Nguyen 		/* mux delay */
37283da42859SDinh Nguyen 
37293da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_IDLE;
37303da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr << 8;
37313da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_ACTIVATE_1;
37323da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr << 8;
37333da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_SGLE_READ;
37343da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr << 8;
37353da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_PRECHARGE_ALL;
37363da42859SDinh Nguyen 
37373da42859SDinh Nguyen 	concatenated_refresh = concatenated_refresh ^ RW_MGR_REFRESH_ALL;
37383da42859SDinh Nguyen 	concatenated_refresh = concatenated_refresh << 24;
37393da42859SDinh Nguyen 	concatenated_refresh = concatenated_refresh ^ 1000; /* trefi */
37403da42859SDinh Nguyen 
37413da42859SDinh Nguyen 	/* Initialize the register file with the correct data */
3742*1273dd9eSMarek Vasut 	writel(dtaps_per_ptap, &sdr_reg_file->dtaps_per_ptap);
3743*1273dd9eSMarek Vasut 	writel(trk_sample_count, &sdr_reg_file->trk_sample_count);
3744*1273dd9eSMarek Vasut 	writel(concatenated_longidle, &sdr_reg_file->trk_longidle);
3745*1273dd9eSMarek Vasut 	writel(concatenated_delays, &sdr_reg_file->delays);
3746*1273dd9eSMarek Vasut 	writel(concatenated_rw_addr, &sdr_reg_file->trk_rw_mgr_addr);
3747*1273dd9eSMarek Vasut 	writel(RW_MGR_MEM_IF_READ_DQS_WIDTH, &sdr_reg_file->trk_read_dqs_width);
3748*1273dd9eSMarek Vasut 	writel(concatenated_refresh, &sdr_reg_file->trk_rfsh);
37493da42859SDinh Nguyen }
37503da42859SDinh Nguyen 
37513da42859SDinh Nguyen int sdram_calibration_full(void)
37523da42859SDinh Nguyen {
37533da42859SDinh Nguyen 	struct param_type my_param;
37543da42859SDinh Nguyen 	struct gbl_type my_gbl;
37553da42859SDinh Nguyen 	uint32_t pass;
37563da42859SDinh Nguyen 	uint32_t i;
37573da42859SDinh Nguyen 
37583da42859SDinh Nguyen 	param = &my_param;
37593da42859SDinh Nguyen 	gbl = &my_gbl;
37603da42859SDinh Nguyen 
37613da42859SDinh Nguyen 	/* Initialize the debug mode flags */
37623da42859SDinh Nguyen 	gbl->phy_debug_mode_flags = 0;
37633da42859SDinh Nguyen 	/* Set the calibration enabled by default */
37643da42859SDinh Nguyen 	gbl->phy_debug_mode_flags |= PHY_DEBUG_ENABLE_CAL_RPT;
37653da42859SDinh Nguyen 	/*
37663da42859SDinh Nguyen 	 * Only sweep all groups (regardless of fail state) by default
37673da42859SDinh Nguyen 	 * Set enabled read test by default.
37683da42859SDinh Nguyen 	 */
37693da42859SDinh Nguyen #if DISABLE_GUARANTEED_READ
37703da42859SDinh Nguyen 	gbl->phy_debug_mode_flags |= PHY_DEBUG_DISABLE_GUARANTEED_READ;
37713da42859SDinh Nguyen #endif
37723da42859SDinh Nguyen 	/* Initialize the register file */
37733da42859SDinh Nguyen 	initialize_reg_file();
37743da42859SDinh Nguyen 
37753da42859SDinh Nguyen 	/* Initialize any PHY CSR */
37763da42859SDinh Nguyen 	initialize_hps_phy();
37773da42859SDinh Nguyen 
37783da42859SDinh Nguyen 	scc_mgr_initialize();
37793da42859SDinh Nguyen 
37803da42859SDinh Nguyen 	initialize_tracking();
37813da42859SDinh Nguyen 
37823da42859SDinh Nguyen 	/* USER Enable all ranks, groups */
37833da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_NUMBER_OF_RANKS; i++)
37843da42859SDinh Nguyen 		param->skip_ranks[i] = 0;
37853da42859SDinh Nguyen 	for (i = 0; i < NUM_SHADOW_REGS; ++i)
37863da42859SDinh Nguyen 		param->skip_shadow_regs[i] = 0;
37873da42859SDinh Nguyen 	param->skip_groups = 0;
37883da42859SDinh Nguyen 
37893da42859SDinh Nguyen 	printf("%s: Preparing to start memory calibration\n", __FILE__);
37903da42859SDinh Nguyen 
37913da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
379223f62b36SMarek Vasut 	debug_cond(DLEVEL == 1,
379323f62b36SMarek Vasut 		   "DDR3 FULL_RATE ranks=%u cs/dimm=%u dq/dqs=%u,%u vg/dqs=%u,%u ",
379423f62b36SMarek Vasut 		   RW_MGR_MEM_NUMBER_OF_RANKS, RW_MGR_MEM_NUMBER_OF_CS_PER_DIMM,
379523f62b36SMarek Vasut 		   RW_MGR_MEM_DQ_PER_READ_DQS, RW_MGR_MEM_DQ_PER_WRITE_DQS,
379623f62b36SMarek Vasut 		   RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS,
379723f62b36SMarek Vasut 		   RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS);
379823f62b36SMarek Vasut 	debug_cond(DLEVEL == 1,
379923f62b36SMarek Vasut 		   "dqs=%u,%u dq=%u dm=%u ptap_delay=%u dtap_delay=%u ",
380023f62b36SMarek Vasut 		   RW_MGR_MEM_IF_READ_DQS_WIDTH, RW_MGR_MEM_IF_WRITE_DQS_WIDTH,
380123f62b36SMarek Vasut 		   RW_MGR_MEM_DATA_WIDTH, RW_MGR_MEM_DATA_MASK_WIDTH,
380223f62b36SMarek Vasut 		   IO_DELAY_PER_OPA_TAP, IO_DELAY_PER_DCHAIN_TAP);
380323f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "dtap_dqsen_delay=%u, dll=%u",
380423f62b36SMarek Vasut 		   IO_DELAY_PER_DQS_EN_DCHAIN_TAP, IO_DLL_CHAIN_LENGTH);
380523f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "max values: en_p=%u dqdqs_p=%u en_d=%u dqs_in_d=%u ",
380623f62b36SMarek Vasut 		   IO_DQS_EN_PHASE_MAX, IO_DQDQS_OUT_PHASE_MAX,
380723f62b36SMarek Vasut 		   IO_DQS_EN_DELAY_MAX, IO_DQS_IN_DELAY_MAX);
380823f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "io_in_d=%u io_out1_d=%u io_out2_d=%u ",
380923f62b36SMarek Vasut 		   IO_IO_IN_DELAY_MAX, IO_IO_OUT1_DELAY_MAX,
381023f62b36SMarek Vasut 		   IO_IO_OUT2_DELAY_MAX);
381123f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "dqs_in_reserve=%u dqs_out_reserve=%u\n",
381223f62b36SMarek Vasut 		   IO_DQS_IN_RESERVE, IO_DQS_OUT_RESERVE);
38133da42859SDinh Nguyen 
38143da42859SDinh Nguyen 	hc_initialize_rom_data();
38153da42859SDinh Nguyen 
38163da42859SDinh Nguyen 	/* update info for sims */
38173da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_NIL);
38183da42859SDinh Nguyen 	reg_file_set_group(0);
38193da42859SDinh Nguyen 
38203da42859SDinh Nguyen 	/*
38213da42859SDinh Nguyen 	 * Load global needed for those actions that require
38223da42859SDinh Nguyen 	 * some dynamic calibration support.
38233da42859SDinh Nguyen 	 */
38243da42859SDinh Nguyen 	dyn_calib_steps = STATIC_CALIB_STEPS;
38253da42859SDinh Nguyen 	/*
38263da42859SDinh Nguyen 	 * Load global to allow dynamic selection of delay loop settings
38273da42859SDinh Nguyen 	 * based on calibration mode.
38283da42859SDinh Nguyen 	 */
38293da42859SDinh Nguyen 	if (!(dyn_calib_steps & CALIB_SKIP_DELAY_LOOPS))
38303da42859SDinh Nguyen 		skip_delay_mask = 0xff;
38313da42859SDinh Nguyen 	else
38323da42859SDinh Nguyen 		skip_delay_mask = 0x0;
38333da42859SDinh Nguyen 
38343da42859SDinh Nguyen 	pass = run_mem_calibrate();
38353da42859SDinh Nguyen 
38363da42859SDinh Nguyen 	printf("%s: Calibration complete\n", __FILE__);
38373da42859SDinh Nguyen 	return pass;
38383da42859SDinh Nguyen }
3839