xref: /rk3399_rockchip-uboot/drivers/ddr/altera/sequencer.c (revision c4815f76715c20dd64f4fd988f57ccb9bc84d79b)
13da42859SDinh Nguyen /*
23da42859SDinh Nguyen  * Copyright Altera Corporation (C) 2012-2015
33da42859SDinh Nguyen  *
43da42859SDinh Nguyen  * SPDX-License-Identifier:    BSD-3-Clause
53da42859SDinh Nguyen  */
63da42859SDinh Nguyen 
73da42859SDinh Nguyen #include <common.h>
83da42859SDinh Nguyen #include <asm/io.h>
93da42859SDinh Nguyen #include <asm/arch/sdram.h>
103da42859SDinh Nguyen #include "sequencer.h"
113da42859SDinh Nguyen #include "sequencer_auto.h"
123da42859SDinh Nguyen #include "sequencer_auto_ac_init.h"
133da42859SDinh Nguyen #include "sequencer_auto_inst_init.h"
143da42859SDinh Nguyen #include "sequencer_defines.h"
153da42859SDinh Nguyen 
163da42859SDinh Nguyen static void scc_mgr_load_dqs_for_write_group(uint32_t write_group);
173da42859SDinh Nguyen 
183da42859SDinh Nguyen static struct socfpga_sdr_rw_load_manager *sdr_rw_load_mgr_regs =
196afb4fe2SMarek Vasut 	(struct socfpga_sdr_rw_load_manager *)(SDR_PHYGRP_RWMGRGRP_ADDRESS | 0x800);
203da42859SDinh Nguyen 
213da42859SDinh Nguyen static struct socfpga_sdr_rw_load_jump_manager *sdr_rw_load_jump_mgr_regs =
226afb4fe2SMarek Vasut 	(struct socfpga_sdr_rw_load_jump_manager *)(SDR_PHYGRP_RWMGRGRP_ADDRESS | 0xC00);
233da42859SDinh Nguyen 
243da42859SDinh Nguyen static struct socfpga_sdr_reg_file *sdr_reg_file =
25a1c654a8SMarek Vasut 	(struct socfpga_sdr_reg_file *)SDR_PHYGRP_REGFILEGRP_ADDRESS;
263da42859SDinh Nguyen 
273da42859SDinh Nguyen static struct socfpga_sdr_scc_mgr *sdr_scc_mgr =
28e79025a7SMarek Vasut 	(struct socfpga_sdr_scc_mgr *)(SDR_PHYGRP_SCCGRP_ADDRESS | 0xe00);
293da42859SDinh Nguyen 
303da42859SDinh Nguyen static struct socfpga_phy_mgr_cmd *phy_mgr_cmd =
311bc6f14aSMarek Vasut 	(struct socfpga_phy_mgr_cmd *)SDR_PHYGRP_PHYMGRGRP_ADDRESS;
323da42859SDinh Nguyen 
333da42859SDinh Nguyen static struct socfpga_phy_mgr_cfg *phy_mgr_cfg =
341bc6f14aSMarek Vasut 	(struct socfpga_phy_mgr_cfg *)(SDR_PHYGRP_PHYMGRGRP_ADDRESS | 0x40);
353da42859SDinh Nguyen 
363da42859SDinh Nguyen static struct socfpga_data_mgr *data_mgr =
37*c4815f76SMarek Vasut 	(struct socfpga_data_mgr *)SDR_PHYGRP_DATAMGRGRP_ADDRESS;
383da42859SDinh Nguyen 
393da42859SDinh Nguyen #define DELTA_D		1
403da42859SDinh Nguyen 
413da42859SDinh Nguyen /*
423da42859SDinh Nguyen  * In order to reduce ROM size, most of the selectable calibration steps are
433da42859SDinh Nguyen  * decided at compile time based on the user's calibration mode selection,
443da42859SDinh Nguyen  * as captured by the STATIC_CALIB_STEPS selection below.
453da42859SDinh Nguyen  *
463da42859SDinh Nguyen  * However, to support simulation-time selection of fast simulation mode, where
473da42859SDinh Nguyen  * we skip everything except the bare minimum, we need a few of the steps to
483da42859SDinh Nguyen  * be dynamic.  In those cases, we either use the DYNAMIC_CALIB_STEPS for the
493da42859SDinh Nguyen  * check, which is based on the rtl-supplied value, or we dynamically compute
503da42859SDinh Nguyen  * the value to use based on the dynamically-chosen calibration mode
513da42859SDinh Nguyen  */
523da42859SDinh Nguyen 
533da42859SDinh Nguyen #define DLEVEL 0
543da42859SDinh Nguyen #define STATIC_IN_RTL_SIM 0
553da42859SDinh Nguyen #define STATIC_SKIP_DELAY_LOOPS 0
563da42859SDinh Nguyen 
573da42859SDinh Nguyen #define STATIC_CALIB_STEPS (STATIC_IN_RTL_SIM | CALIB_SKIP_FULL_TEST | \
583da42859SDinh Nguyen 	STATIC_SKIP_DELAY_LOOPS)
593da42859SDinh Nguyen 
603da42859SDinh Nguyen /* calibration steps requested by the rtl */
613da42859SDinh Nguyen uint16_t dyn_calib_steps;
623da42859SDinh Nguyen 
633da42859SDinh Nguyen /*
643da42859SDinh Nguyen  * To make CALIB_SKIP_DELAY_LOOPS a dynamic conditional option
653da42859SDinh Nguyen  * instead of static, we use boolean logic to select between
663da42859SDinh Nguyen  * non-skip and skip values
673da42859SDinh Nguyen  *
683da42859SDinh Nguyen  * The mask is set to include all bits when not-skipping, but is
693da42859SDinh Nguyen  * zero when skipping
703da42859SDinh Nguyen  */
713da42859SDinh Nguyen 
723da42859SDinh Nguyen uint16_t skip_delay_mask;	/* mask off bits when skipping/not-skipping */
733da42859SDinh Nguyen 
743da42859SDinh Nguyen #define SKIP_DELAY_LOOP_VALUE_OR_ZERO(non_skip_value) \
753da42859SDinh Nguyen 	((non_skip_value) & skip_delay_mask)
763da42859SDinh Nguyen 
773da42859SDinh Nguyen struct gbl_type *gbl;
783da42859SDinh Nguyen struct param_type *param;
793da42859SDinh Nguyen uint32_t curr_shadow_reg;
803da42859SDinh Nguyen 
813da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_write_test(uint32_t rank_bgn,
823da42859SDinh Nguyen 	uint32_t write_group, uint32_t use_dm,
833da42859SDinh Nguyen 	uint32_t all_correct, uint32_t *bit_chk, uint32_t all_ranks);
843da42859SDinh Nguyen 
853da42859SDinh Nguyen static void set_failing_group_stage(uint32_t group, uint32_t stage,
863da42859SDinh Nguyen 	uint32_t substage)
873da42859SDinh Nguyen {
883da42859SDinh Nguyen 	/*
893da42859SDinh Nguyen 	 * Only set the global stage if there was not been any other
903da42859SDinh Nguyen 	 * failing group
913da42859SDinh Nguyen 	 */
923da42859SDinh Nguyen 	if (gbl->error_stage == CAL_STAGE_NIL)	{
933da42859SDinh Nguyen 		gbl->error_substage = substage;
943da42859SDinh Nguyen 		gbl->error_stage = stage;
953da42859SDinh Nguyen 		gbl->error_group = group;
963da42859SDinh Nguyen 	}
973da42859SDinh Nguyen }
983da42859SDinh Nguyen 
993da42859SDinh Nguyen static void reg_file_set_group(uint32_t set_group)
1003da42859SDinh Nguyen {
101a1c654a8SMarek Vasut 	u32 addr = (u32)&sdr_reg_file->cur_stage;
1023da42859SDinh Nguyen 
1033da42859SDinh Nguyen 	/* Read the current group and stage */
1043da42859SDinh Nguyen 	uint32_t cur_stage_group = readl(SOCFPGA_SDR_ADDRESS + addr);
1053da42859SDinh Nguyen 
1063da42859SDinh Nguyen 	/* Clear the group */
1073da42859SDinh Nguyen 	cur_stage_group &= 0x0000FFFF;
1083da42859SDinh Nguyen 
1093da42859SDinh Nguyen 	/* Set the group */
1103da42859SDinh Nguyen 	cur_stage_group |= (set_group << 16);
1113da42859SDinh Nguyen 
1123da42859SDinh Nguyen 	/* Write the data back */
1133da42859SDinh Nguyen 	writel(cur_stage_group, SOCFPGA_SDR_ADDRESS + addr);
1143da42859SDinh Nguyen }
1153da42859SDinh Nguyen 
1163da42859SDinh Nguyen static void reg_file_set_stage(uint32_t set_stage)
1173da42859SDinh Nguyen {
118a1c654a8SMarek Vasut 	u32 addr = (u32)&sdr_reg_file->cur_stage;
119a1c654a8SMarek Vasut 
1203da42859SDinh Nguyen 	/* Read the current group and stage */
1213da42859SDinh Nguyen 	uint32_t cur_stage_group = readl(SOCFPGA_SDR_ADDRESS + addr);
1223da42859SDinh Nguyen 
1233da42859SDinh Nguyen 	/* Clear the stage and substage */
1243da42859SDinh Nguyen 	cur_stage_group &= 0xFFFF0000;
1253da42859SDinh Nguyen 
1263da42859SDinh Nguyen 	/* Set the stage */
1273da42859SDinh Nguyen 	cur_stage_group |= (set_stage & 0x000000FF);
1283da42859SDinh Nguyen 
1293da42859SDinh Nguyen 	/* Write the data back */
1303da42859SDinh Nguyen 	writel(cur_stage_group, SOCFPGA_SDR_ADDRESS + addr);
1313da42859SDinh Nguyen }
1323da42859SDinh Nguyen 
1333da42859SDinh Nguyen static void reg_file_set_sub_stage(uint32_t set_sub_stage)
1343da42859SDinh Nguyen {
135a1c654a8SMarek Vasut 	u32 addr = (u32)&sdr_reg_file->cur_stage;
136a1c654a8SMarek Vasut 
1373da42859SDinh Nguyen 	/* Read the current group and stage */
1383da42859SDinh Nguyen 	uint32_t cur_stage_group = readl(SOCFPGA_SDR_ADDRESS + addr);
1393da42859SDinh Nguyen 
1403da42859SDinh Nguyen 	/* Clear the substage */
1413da42859SDinh Nguyen 	cur_stage_group &= 0xFFFF00FF;
1423da42859SDinh Nguyen 
1433da42859SDinh Nguyen 	/* Set the sub stage */
1443da42859SDinh Nguyen 	cur_stage_group |= ((set_sub_stage << 8) & 0x0000FF00);
1453da42859SDinh Nguyen 
1463da42859SDinh Nguyen 	/* Write the data back */
1473da42859SDinh Nguyen 	writel(cur_stage_group, SOCFPGA_SDR_ADDRESS + addr);
1483da42859SDinh Nguyen }
1493da42859SDinh Nguyen 
1503da42859SDinh Nguyen static void initialize(void)
1513da42859SDinh Nguyen {
1521bc6f14aSMarek Vasut 	u32 addr = (u32)&phy_mgr_cfg->mux_sel;
1533da42859SDinh Nguyen 
1543da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
1553da42859SDinh Nguyen 	/* USER calibration has control over path to memory */
1563da42859SDinh Nguyen 	/*
1573da42859SDinh Nguyen 	 * In Hard PHY this is a 2-bit control:
1583da42859SDinh Nguyen 	 * 0: AFI Mux Select
1593da42859SDinh Nguyen 	 * 1: DDIO Mux Select
1603da42859SDinh Nguyen 	 */
1613da42859SDinh Nguyen 	writel(0x3, SOCFPGA_SDR_ADDRESS + addr);
1623da42859SDinh Nguyen 
1633da42859SDinh Nguyen 	/* USER memory clock is not stable we begin initialization  */
1641bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cfg->reset_mem_stbl;
1653da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
1663da42859SDinh Nguyen 
1673da42859SDinh Nguyen 	/* USER calibration status all set to zero */
1681bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cfg->cal_status;
1693da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
1703da42859SDinh Nguyen 
1711bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cfg->cal_debug_info;
1723da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
1733da42859SDinh Nguyen 
1743da42859SDinh Nguyen 	if ((dyn_calib_steps & CALIB_SKIP_ALL) != CALIB_SKIP_ALL) {
1753da42859SDinh Nguyen 		param->read_correct_mask_vg  = ((uint32_t)1 <<
1763da42859SDinh Nguyen 			(RW_MGR_MEM_DQ_PER_READ_DQS /
1773da42859SDinh Nguyen 			RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS)) - 1;
1783da42859SDinh Nguyen 		param->write_correct_mask_vg = ((uint32_t)1 <<
1793da42859SDinh Nguyen 			(RW_MGR_MEM_DQ_PER_READ_DQS /
1803da42859SDinh Nguyen 			RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS)) - 1;
1813da42859SDinh Nguyen 		param->read_correct_mask     = ((uint32_t)1 <<
1823da42859SDinh Nguyen 			RW_MGR_MEM_DQ_PER_READ_DQS) - 1;
1833da42859SDinh Nguyen 		param->write_correct_mask    = ((uint32_t)1 <<
1843da42859SDinh Nguyen 			RW_MGR_MEM_DQ_PER_WRITE_DQS) - 1;
1853da42859SDinh Nguyen 		param->dm_correct_mask       = ((uint32_t)1 <<
1863da42859SDinh Nguyen 			(RW_MGR_MEM_DATA_WIDTH / RW_MGR_MEM_DATA_MASK_WIDTH))
1873da42859SDinh Nguyen 			- 1;
1883da42859SDinh Nguyen 	}
1893da42859SDinh Nguyen }
1903da42859SDinh Nguyen 
1913da42859SDinh Nguyen static void set_rank_and_odt_mask(uint32_t rank, uint32_t odt_mode)
1923da42859SDinh Nguyen {
1933da42859SDinh Nguyen 	uint32_t odt_mask_0 = 0;
1943da42859SDinh Nguyen 	uint32_t odt_mask_1 = 0;
1953da42859SDinh Nguyen 	uint32_t cs_and_odt_mask;
1963da42859SDinh Nguyen 	uint32_t addr;
1973da42859SDinh Nguyen 
1983da42859SDinh Nguyen 	if (odt_mode == RW_MGR_ODT_MODE_READ_WRITE) {
1993da42859SDinh Nguyen 		if (RW_MGR_MEM_NUMBER_OF_RANKS == 1) {
2003da42859SDinh Nguyen 			/*
2013da42859SDinh Nguyen 			 * 1 Rank
2023da42859SDinh Nguyen 			 * Read: ODT = 0
2033da42859SDinh Nguyen 			 * Write: ODT = 1
2043da42859SDinh Nguyen 			 */
2053da42859SDinh Nguyen 			odt_mask_0 = 0x0;
2063da42859SDinh Nguyen 			odt_mask_1 = 0x1;
2073da42859SDinh Nguyen 		} else if (RW_MGR_MEM_NUMBER_OF_RANKS == 2) {
2083da42859SDinh Nguyen 			/* 2 Ranks */
2093da42859SDinh Nguyen 			if (RW_MGR_MEM_NUMBER_OF_CS_PER_DIMM == 1) {
2103da42859SDinh Nguyen 				/* - Dual-Slot , Single-Rank
2113da42859SDinh Nguyen 				 * (1 chip-select per DIMM)
2123da42859SDinh Nguyen 				 * OR
2133da42859SDinh Nguyen 				 * - RDIMM, 4 total CS (2 CS per DIMM)
2143da42859SDinh Nguyen 				 * means 2 DIMM
2153da42859SDinh Nguyen 				 * Since MEM_NUMBER_OF_RANKS is 2 they are
2163da42859SDinh Nguyen 				 * both single rank
2173da42859SDinh Nguyen 				 * with 2 CS each (special for RDIMM)
2183da42859SDinh Nguyen 				 * Read: Turn on ODT on the opposite rank
2193da42859SDinh Nguyen 				 * Write: Turn on ODT on all ranks
2203da42859SDinh Nguyen 				 */
2213da42859SDinh Nguyen 				odt_mask_0 = 0x3 & ~(1 << rank);
2223da42859SDinh Nguyen 				odt_mask_1 = 0x3;
2233da42859SDinh Nguyen 			} else {
2243da42859SDinh Nguyen 				/*
2253da42859SDinh Nguyen 				 * USER - Single-Slot , Dual-rank DIMMs
2263da42859SDinh Nguyen 				 * (2 chip-selects per DIMM)
2273da42859SDinh Nguyen 				 * USER Read: Turn on ODT off on all ranks
2283da42859SDinh Nguyen 				 * USER Write: Turn on ODT on active rank
2293da42859SDinh Nguyen 				 */
2303da42859SDinh Nguyen 				odt_mask_0 = 0x0;
2313da42859SDinh Nguyen 				odt_mask_1 = 0x3 & (1 << rank);
2323da42859SDinh Nguyen 			}
2333da42859SDinh Nguyen 		} else {
2343da42859SDinh Nguyen 			/* 4 Ranks
2353da42859SDinh Nguyen 			 * Read:
2363da42859SDinh Nguyen 			 * ----------+-----------------------+
2373da42859SDinh Nguyen 			 *           |                       |
2383da42859SDinh Nguyen 			 *           |         ODT           |
2393da42859SDinh Nguyen 			 * Read From +-----------------------+
2403da42859SDinh Nguyen 			 *   Rank    |  3  |  2  |  1  |  0  |
2413da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2423da42859SDinh Nguyen 			 *     0     |  0  |  1  |  0  |  0  |
2433da42859SDinh Nguyen 			 *     1     |  1  |  0  |  0  |  0  |
2443da42859SDinh Nguyen 			 *     2     |  0  |  0  |  0  |  1  |
2453da42859SDinh Nguyen 			 *     3     |  0  |  0  |  1  |  0  |
2463da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2473da42859SDinh Nguyen 			 *
2483da42859SDinh Nguyen 			 * Write:
2493da42859SDinh Nguyen 			 * ----------+-----------------------+
2503da42859SDinh Nguyen 			 *           |                       |
2513da42859SDinh Nguyen 			 *           |         ODT           |
2523da42859SDinh Nguyen 			 * Write To  +-----------------------+
2533da42859SDinh Nguyen 			 *   Rank    |  3  |  2  |  1  |  0  |
2543da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2553da42859SDinh Nguyen 			 *     0     |  0  |  1  |  0  |  1  |
2563da42859SDinh Nguyen 			 *     1     |  1  |  0  |  1  |  0  |
2573da42859SDinh Nguyen 			 *     2     |  0  |  1  |  0  |  1  |
2583da42859SDinh Nguyen 			 *     3     |  1  |  0  |  1  |  0  |
2593da42859SDinh Nguyen 			 * ----------+-----+-----+-----+-----+
2603da42859SDinh Nguyen 			 */
2613da42859SDinh Nguyen 			switch (rank) {
2623da42859SDinh Nguyen 			case 0:
2633da42859SDinh Nguyen 				odt_mask_0 = 0x4;
2643da42859SDinh Nguyen 				odt_mask_1 = 0x5;
2653da42859SDinh Nguyen 				break;
2663da42859SDinh Nguyen 			case 1:
2673da42859SDinh Nguyen 				odt_mask_0 = 0x8;
2683da42859SDinh Nguyen 				odt_mask_1 = 0xA;
2693da42859SDinh Nguyen 				break;
2703da42859SDinh Nguyen 			case 2:
2713da42859SDinh Nguyen 				odt_mask_0 = 0x1;
2723da42859SDinh Nguyen 				odt_mask_1 = 0x5;
2733da42859SDinh Nguyen 				break;
2743da42859SDinh Nguyen 			case 3:
2753da42859SDinh Nguyen 				odt_mask_0 = 0x2;
2763da42859SDinh Nguyen 				odt_mask_1 = 0xA;
2773da42859SDinh Nguyen 				break;
2783da42859SDinh Nguyen 			}
2793da42859SDinh Nguyen 		}
2803da42859SDinh Nguyen 	} else {
2813da42859SDinh Nguyen 		odt_mask_0 = 0x0;
2823da42859SDinh Nguyen 		odt_mask_1 = 0x0;
2833da42859SDinh Nguyen 	}
2843da42859SDinh Nguyen 
2853da42859SDinh Nguyen 	cs_and_odt_mask =
2863da42859SDinh Nguyen 		(0xFF & ~(1 << rank)) |
2873da42859SDinh Nguyen 		((0xFF & odt_mask_0) << 8) |
2883da42859SDinh Nguyen 		((0xFF & odt_mask_1) << 16);
289*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_SET_CS_AND_ODT_MASK_OFFSET;
2903da42859SDinh Nguyen 	writel(cs_and_odt_mask, SOCFPGA_SDR_ADDRESS + addr);
2913da42859SDinh Nguyen }
2923da42859SDinh Nguyen 
2933da42859SDinh Nguyen static void scc_mgr_initialize(void)
2943da42859SDinh Nguyen {
295*c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_HHP_RFILE_OFFSET;
2963da42859SDinh Nguyen 
2973da42859SDinh Nguyen 	/*
2983da42859SDinh Nguyen 	 * Clear register file for HPS
2993da42859SDinh Nguyen 	 * 16 (2^4) is the size of the full register file in the scc mgr:
3003da42859SDinh Nguyen 	 *	RFILE_DEPTH = log2(MEM_DQ_PER_DQS + 1 + MEM_DM_PER_DQS +
3013da42859SDinh Nguyen 	 * MEM_IF_READ_DQS_WIDTH - 1) + 1;
3023da42859SDinh Nguyen 	 */
3033da42859SDinh Nguyen 	uint32_t i;
3043da42859SDinh Nguyen 	for (i = 0; i < 16; i++) {
3057ac40d25SMarek Vasut 		debug_cond(DLEVEL == 1, "%s:%d: Clearing SCC RFILE index %u\n",
3063da42859SDinh Nguyen 			   __func__, __LINE__, i);
3073da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr + (i << 2));
3083da42859SDinh Nguyen 	}
3093da42859SDinh Nguyen }
3103da42859SDinh Nguyen 
3113da42859SDinh Nguyen static void scc_mgr_set_dqs_bus_in_delay(uint32_t read_group,
3123da42859SDinh Nguyen 						uint32_t delay)
3133da42859SDinh Nguyen {
314*c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQS_IN_DELAY_OFFSET;
3153da42859SDinh Nguyen 
3163da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
3173da42859SDinh Nguyen 	writel(delay, SOCFPGA_SDR_ADDRESS + addr + (read_group << 2));
3183da42859SDinh Nguyen }
3193da42859SDinh Nguyen 
3203da42859SDinh Nguyen static void scc_mgr_set_dqs_io_in_delay(uint32_t write_group,
3213da42859SDinh Nguyen 	uint32_t delay)
3223da42859SDinh Nguyen {
323*c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_IN_DELAY_OFFSET;
3243da42859SDinh Nguyen 
3253da42859SDinh Nguyen 	writel(delay, SOCFPGA_SDR_ADDRESS + addr + (RW_MGR_MEM_DQ_PER_WRITE_DQS << 2));
3263da42859SDinh Nguyen }
3273da42859SDinh Nguyen 
3283da42859SDinh Nguyen static void scc_mgr_set_dqs_en_phase(uint32_t read_group, uint32_t phase)
3293da42859SDinh Nguyen {
330*c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQS_EN_PHASE_OFFSET;
3313da42859SDinh Nguyen 
3323da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
3333da42859SDinh Nguyen 	writel(phase, SOCFPGA_SDR_ADDRESS + addr + (read_group << 2));
3343da42859SDinh Nguyen }
3353da42859SDinh Nguyen 
3363da42859SDinh Nguyen static void scc_mgr_set_dqs_en_phase_all_ranks(uint32_t read_group,
3373da42859SDinh Nguyen 					       uint32_t phase)
3383da42859SDinh Nguyen {
3393da42859SDinh Nguyen 	uint32_t r;
3403da42859SDinh Nguyen 	uint32_t update_scan_chains;
3413da42859SDinh Nguyen 	uint32_t addr;
3423da42859SDinh Nguyen 
3433da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
3443da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
3453da42859SDinh Nguyen 		/*
3463da42859SDinh Nguyen 		 * USER although the h/w doesn't support different phases per
3473da42859SDinh Nguyen 		 * shadow register, for simplicity our scc manager modeling
3483da42859SDinh Nguyen 		 * keeps different phase settings per shadow reg, and it's
3493da42859SDinh Nguyen 		 * important for us to keep them in sync to match h/w.
3503da42859SDinh Nguyen 		 * for efficiency, the scan chain update should occur only
3513da42859SDinh Nguyen 		 * once to sr0.
3523da42859SDinh Nguyen 		 */
3533da42859SDinh Nguyen 		update_scan_chains = (r == 0) ? 1 : 0;
3543da42859SDinh Nguyen 
3553da42859SDinh Nguyen 		scc_mgr_set_dqs_en_phase(read_group, phase);
3563da42859SDinh Nguyen 
3573da42859SDinh Nguyen 		if (update_scan_chains) {
358e79025a7SMarek Vasut 			addr = (u32)&sdr_scc_mgr->dqs_ena;
3593da42859SDinh Nguyen 			writel(read_group, SOCFPGA_SDR_ADDRESS + addr);
3603da42859SDinh Nguyen 
361e79025a7SMarek Vasut 			addr = (u32)&sdr_scc_mgr->update;
3623da42859SDinh Nguyen 			writel(0, SOCFPGA_SDR_ADDRESS + addr);
3633da42859SDinh Nguyen 		}
3643da42859SDinh Nguyen 	}
3653da42859SDinh Nguyen }
3663da42859SDinh Nguyen 
3673da42859SDinh Nguyen static void scc_mgr_set_dqdqs_output_phase(uint32_t write_group,
3683da42859SDinh Nguyen 						  uint32_t phase)
3693da42859SDinh Nguyen {
370*c4815f76SMarek Vasut 	u32 addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQDQS_OUT_PHASE_OFFSET;
3713da42859SDinh Nguyen 
3723da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
3733da42859SDinh Nguyen 	writel(phase, SOCFPGA_SDR_ADDRESS + addr + (write_group << 2));
3743da42859SDinh Nguyen }
3753da42859SDinh Nguyen 
3763da42859SDinh Nguyen static void scc_mgr_set_dqdqs_output_phase_all_ranks(uint32_t write_group,
3773da42859SDinh Nguyen 						     uint32_t phase)
3783da42859SDinh Nguyen {
3793da42859SDinh Nguyen 	uint32_t r;
3803da42859SDinh Nguyen 	uint32_t update_scan_chains;
3813da42859SDinh Nguyen 	uint32_t addr;
3823da42859SDinh Nguyen 
3833da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
3843da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
3853da42859SDinh Nguyen 		/*
3863da42859SDinh Nguyen 		 * USER although the h/w doesn't support different phases per
3873da42859SDinh Nguyen 		 * shadow register, for simplicity our scc manager modeling
3883da42859SDinh Nguyen 		 * keeps different phase settings per shadow reg, and it's
3893da42859SDinh Nguyen 		 * important for us to keep them in sync to match h/w.
3903da42859SDinh Nguyen 		 * for efficiency, the scan chain update should occur only
3913da42859SDinh Nguyen 		 * once to sr0.
3923da42859SDinh Nguyen 		 */
3933da42859SDinh Nguyen 		update_scan_chains = (r == 0) ? 1 : 0;
3943da42859SDinh Nguyen 
3953da42859SDinh Nguyen 		scc_mgr_set_dqdqs_output_phase(write_group, phase);
3963da42859SDinh Nguyen 
3973da42859SDinh Nguyen 		if (update_scan_chains) {
398e79025a7SMarek Vasut 			addr = (u32)&sdr_scc_mgr->dqs_ena;
3993da42859SDinh Nguyen 			writel(write_group, SOCFPGA_SDR_ADDRESS + addr);
4003da42859SDinh Nguyen 
401e79025a7SMarek Vasut 			addr = (u32)&sdr_scc_mgr->update;
4023da42859SDinh Nguyen 			writel(0, SOCFPGA_SDR_ADDRESS + addr);
4033da42859SDinh Nguyen 		}
4043da42859SDinh Nguyen 	}
4053da42859SDinh Nguyen }
4063da42859SDinh Nguyen 
4073da42859SDinh Nguyen static void scc_mgr_set_dqs_en_delay(uint32_t read_group, uint32_t delay)
4083da42859SDinh Nguyen {
409*c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQS_EN_DELAY_OFFSET;
4103da42859SDinh Nguyen 
4113da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
4123da42859SDinh Nguyen 	writel(delay + IO_DQS_EN_DELAY_OFFSET, SOCFPGA_SDR_ADDRESS + addr +
4133da42859SDinh Nguyen 	       (read_group << 2));
4143da42859SDinh Nguyen }
4153da42859SDinh Nguyen 
4163da42859SDinh Nguyen static void scc_mgr_set_dqs_en_delay_all_ranks(uint32_t read_group,
4173da42859SDinh Nguyen 					       uint32_t delay)
4183da42859SDinh Nguyen {
4193da42859SDinh Nguyen 	uint32_t r;
4203da42859SDinh Nguyen 	uint32_t addr;
4213da42859SDinh Nguyen 
4223da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
4233da42859SDinh Nguyen 		r += NUM_RANKS_PER_SHADOW_REG) {
4243da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay(read_group, delay);
4253da42859SDinh Nguyen 
426e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->dqs_ena;
4273da42859SDinh Nguyen 		writel(read_group, SOCFPGA_SDR_ADDRESS + addr);
4283da42859SDinh Nguyen 		/*
4293da42859SDinh Nguyen 		 * In shadow register mode, the T11 settings are stored in
4303da42859SDinh Nguyen 		 * registers in the core, which are updated by the DQS_ENA
4313da42859SDinh Nguyen 		 * signals. Not issuing the SCC_MGR_UPD command allows us to
4323da42859SDinh Nguyen 		 * save lots of rank switching overhead, by calling
4333da42859SDinh Nguyen 		 * select_shadow_regs_for_update with update_scan_chains
4343da42859SDinh Nguyen 		 * set to 0.
4353da42859SDinh Nguyen 		 */
436e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->update;
4373da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
4383da42859SDinh Nguyen 	}
4393da42859SDinh Nguyen 	/*
4403da42859SDinh Nguyen 	 * In shadow register mode, the T11 settings are stored in
4413da42859SDinh Nguyen 	 * registers in the core, which are updated by the DQS_ENA
4423da42859SDinh Nguyen 	 * signals. Not issuing the SCC_MGR_UPD command allows us to
4433da42859SDinh Nguyen 	 * save lots of rank switching overhead, by calling
4443da42859SDinh Nguyen 	 * select_shadow_regs_for_update with update_scan_chains
4453da42859SDinh Nguyen 	 * set to 0.
4463da42859SDinh Nguyen 	 */
447e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
4483da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
4493da42859SDinh Nguyen }
4503da42859SDinh Nguyen 
4513da42859SDinh Nguyen static void scc_mgr_set_oct_out1_delay(uint32_t write_group, uint32_t delay)
4523da42859SDinh Nguyen {
4533da42859SDinh Nguyen 	uint32_t read_group;
454*c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_OCT_OUT1_DELAY_OFFSET;
4553da42859SDinh Nguyen 
4563da42859SDinh Nguyen 	/*
4573da42859SDinh Nguyen 	 * Load the setting in the SCC manager
4583da42859SDinh Nguyen 	 * Although OCT affects only write data, the OCT delay is controlled
4593da42859SDinh Nguyen 	 * by the DQS logic block which is instantiated once per read group.
4603da42859SDinh Nguyen 	 * For protocols where a write group consists of multiple read groups,
4613da42859SDinh Nguyen 	 * the setting must be set multiple times.
4623da42859SDinh Nguyen 	 */
4633da42859SDinh Nguyen 	for (read_group = write_group * RW_MGR_MEM_IF_READ_DQS_WIDTH /
4643da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH;
4653da42859SDinh Nguyen 	     read_group < (write_group + 1) * RW_MGR_MEM_IF_READ_DQS_WIDTH /
4663da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH; ++read_group)
4673da42859SDinh Nguyen 		writel(delay, SOCFPGA_SDR_ADDRESS + addr + (read_group << 2));
4683da42859SDinh Nguyen }
4693da42859SDinh Nguyen 
4703da42859SDinh Nguyen static void scc_mgr_set_dq_out1_delay(uint32_t write_group,
4713da42859SDinh Nguyen 				      uint32_t dq_in_group, uint32_t delay)
4723da42859SDinh Nguyen {
473*c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
4743da42859SDinh Nguyen 
4753da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
4763da42859SDinh Nguyen 	writel(delay, SOCFPGA_SDR_ADDRESS + addr + (dq_in_group << 2));
4773da42859SDinh Nguyen }
4783da42859SDinh Nguyen 
4793da42859SDinh Nguyen static void scc_mgr_set_dq_in_delay(uint32_t write_group,
4803da42859SDinh Nguyen 	uint32_t dq_in_group, uint32_t delay)
4813da42859SDinh Nguyen {
482*c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_IN_DELAY_OFFSET;
4833da42859SDinh Nguyen 
4843da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
4853da42859SDinh Nguyen 	writel(delay, SOCFPGA_SDR_ADDRESS + addr + (dq_in_group << 2));
4863da42859SDinh Nguyen }
4873da42859SDinh Nguyen 
4883da42859SDinh Nguyen static void scc_mgr_set_hhp_extras(void)
4893da42859SDinh Nguyen {
4903da42859SDinh Nguyen 	/*
4913da42859SDinh Nguyen 	 * Load the fixed setting in the SCC manager
4923da42859SDinh Nguyen 	 * bits: 0:0 = 1'b1   - dqs bypass
4933da42859SDinh Nguyen 	 * bits: 1:1 = 1'b1   - dq bypass
4943da42859SDinh Nguyen 	 * bits: 4:2 = 3'b001   - rfifo_mode
4953da42859SDinh Nguyen 	 * bits: 6:5 = 2'b01  - rfifo clock_select
4963da42859SDinh Nguyen 	 * bits: 7:7 = 1'b0  - separate gating from ungating setting
4973da42859SDinh Nguyen 	 * bits: 8:8 = 1'b0  - separate OE from Output delay setting
4983da42859SDinh Nguyen 	 */
4993da42859SDinh Nguyen 	uint32_t value = (0<<8) | (0<<7) | (1<<5) | (1<<2) | (1<<1) | (1<<0);
500*c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_HHP_GLOBALS_OFFSET;
5013da42859SDinh Nguyen 
5023da42859SDinh Nguyen 	writel(value, SOCFPGA_SDR_ADDRESS + addr + SCC_MGR_HHP_EXTRAS_OFFSET);
5033da42859SDinh Nguyen }
5043da42859SDinh Nguyen 
5053da42859SDinh Nguyen static void scc_mgr_set_dqs_out1_delay(uint32_t write_group,
5063da42859SDinh Nguyen 					      uint32_t delay)
5073da42859SDinh Nguyen {
508*c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
5093da42859SDinh Nguyen 
5103da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
5113da42859SDinh Nguyen 	writel(delay, SOCFPGA_SDR_ADDRESS + addr + (RW_MGR_MEM_DQ_PER_WRITE_DQS << 2));
5123da42859SDinh Nguyen }
5133da42859SDinh Nguyen 
5143da42859SDinh Nguyen static void scc_mgr_set_dm_out1_delay(uint32_t write_group,
5153da42859SDinh Nguyen 					     uint32_t dm, uint32_t delay)
5163da42859SDinh Nguyen {
517*c4815f76SMarek Vasut 	uint32_t addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
5183da42859SDinh Nguyen 
5193da42859SDinh Nguyen 	/* Load the setting in the SCC manager */
5203da42859SDinh Nguyen 	writel(delay, SOCFPGA_SDR_ADDRESS + addr +
5213da42859SDinh Nguyen 		((RW_MGR_MEM_DQ_PER_WRITE_DQS + 1 + dm) << 2));
5223da42859SDinh Nguyen }
5233da42859SDinh Nguyen 
5243da42859SDinh Nguyen /*
5253da42859SDinh Nguyen  * USER Zero all DQS config
5263da42859SDinh Nguyen  * TODO: maybe rename to scc_mgr_zero_dqs_config (or something)
5273da42859SDinh Nguyen  */
5283da42859SDinh Nguyen static void scc_mgr_zero_all(void)
5293da42859SDinh Nguyen {
5303da42859SDinh Nguyen 	uint32_t i, r;
5313da42859SDinh Nguyen 	uint32_t addr;
5323da42859SDinh Nguyen 
5333da42859SDinh Nguyen 	/*
5343da42859SDinh Nguyen 	 * USER Zero all DQS config settings, across all groups and all
5353da42859SDinh Nguyen 	 * shadow registers
5363da42859SDinh Nguyen 	 */
5373da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r +=
5383da42859SDinh Nguyen 	     NUM_RANKS_PER_SHADOW_REG) {
5393da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
5403da42859SDinh Nguyen 			/*
5413da42859SDinh Nguyen 			 * The phases actually don't exist on a per-rank basis,
5423da42859SDinh Nguyen 			 * but there's no harm updating them several times, so
5433da42859SDinh Nguyen 			 * let's keep the code simple.
5443da42859SDinh Nguyen 			 */
5453da42859SDinh Nguyen 			scc_mgr_set_dqs_bus_in_delay(i, IO_DQS_IN_RESERVE);
5463da42859SDinh Nguyen 			scc_mgr_set_dqs_en_phase(i, 0);
5473da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay(i, 0);
5483da42859SDinh Nguyen 		}
5493da42859SDinh Nguyen 
5503da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_WRITE_DQS_WIDTH; i++) {
5513da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, 0);
5523da42859SDinh Nguyen 			/* av/cv don't have out2 */
5533da42859SDinh Nguyen 			scc_mgr_set_oct_out1_delay(i, IO_DQS_OUT_RESERVE);
5543da42859SDinh Nguyen 		}
5553da42859SDinh Nguyen 	}
5563da42859SDinh Nguyen 
5573da42859SDinh Nguyen 	/* multicast to all DQS group enables */
558e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->dqs_ena;
5593da42859SDinh Nguyen 	writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
5603da42859SDinh Nguyen 
561e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
5623da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
5633da42859SDinh Nguyen }
5643da42859SDinh Nguyen 
5653da42859SDinh Nguyen static void scc_set_bypass_mode(uint32_t write_group, uint32_t mode)
5663da42859SDinh Nguyen {
5673da42859SDinh Nguyen 	uint32_t addr;
5683da42859SDinh Nguyen 	/* mode = 0 : Do NOT bypass - Half Rate Mode */
5693da42859SDinh Nguyen 	/* mode = 1 : Bypass - Full Rate Mode */
5703da42859SDinh Nguyen 
5713da42859SDinh Nguyen 	/* only need to set once for all groups, pins, dq, dqs, dm */
5723da42859SDinh Nguyen 	if (write_group == 0) {
5733da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d Setting HHP Extras\n", __func__,
5743da42859SDinh Nguyen 			   __LINE__);
5753da42859SDinh Nguyen 		scc_mgr_set_hhp_extras();
5763da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d Done Setting HHP Extras\n",
5773da42859SDinh Nguyen 			  __func__, __LINE__);
5783da42859SDinh Nguyen 	}
5793da42859SDinh Nguyen 	/* multicast to all DQ enables */
580e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->dq_ena;
5813da42859SDinh Nguyen 	writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
5823da42859SDinh Nguyen 
583e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->dm_ena;
5843da42859SDinh Nguyen 	writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
5853da42859SDinh Nguyen 
5863da42859SDinh Nguyen 	/* update current DQS IO enable */
587e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->dqs_io_ena;
5883da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
5893da42859SDinh Nguyen 
5903da42859SDinh Nguyen 	/* update the DQS logic */
591e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->dqs_ena;
5923da42859SDinh Nguyen 	writel(write_group, SOCFPGA_SDR_ADDRESS + addr);
5933da42859SDinh Nguyen 
5943da42859SDinh Nguyen 	/* hit update */
595e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
5963da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
5973da42859SDinh Nguyen }
5983da42859SDinh Nguyen 
5993da42859SDinh Nguyen static void scc_mgr_zero_group(uint32_t write_group, uint32_t test_begin,
6003da42859SDinh Nguyen 			       int32_t out_only)
6013da42859SDinh Nguyen {
6023da42859SDinh Nguyen 	uint32_t i, r;
6033da42859SDinh Nguyen 	uint32_t addr;
6043da42859SDinh Nguyen 
6053da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r +=
6063da42859SDinh Nguyen 		NUM_RANKS_PER_SHADOW_REG) {
6073da42859SDinh Nguyen 		/* Zero all DQ config settings */
6083da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
6093da42859SDinh Nguyen 			scc_mgr_set_dq_out1_delay(write_group, i, 0);
6103da42859SDinh Nguyen 			if (!out_only)
6113da42859SDinh Nguyen 				scc_mgr_set_dq_in_delay(write_group, i, 0);
6123da42859SDinh Nguyen 		}
6133da42859SDinh Nguyen 
6143da42859SDinh Nguyen 		/* multicast to all DQ enables */
615e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->dq_ena;
6163da42859SDinh Nguyen 		writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
6173da42859SDinh Nguyen 
6183da42859SDinh Nguyen 		/* Zero all DM config settings */
6193da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_NUM_DM_PER_WRITE_GROUP; i++) {
6203da42859SDinh Nguyen 			scc_mgr_set_dm_out1_delay(write_group, i, 0);
6213da42859SDinh Nguyen 		}
6223da42859SDinh Nguyen 
6233da42859SDinh Nguyen 		/* multicast to all DM enables */
624e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->dm_ena;
6253da42859SDinh Nguyen 		writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
6263da42859SDinh Nguyen 
6273da42859SDinh Nguyen 		/* zero all DQS io settings */
6283da42859SDinh Nguyen 		if (!out_only)
6293da42859SDinh Nguyen 			scc_mgr_set_dqs_io_in_delay(write_group, 0);
6303da42859SDinh Nguyen 		/* av/cv don't have out2 */
6313da42859SDinh Nguyen 		scc_mgr_set_dqs_out1_delay(write_group, IO_DQS_OUT_RESERVE);
6323da42859SDinh Nguyen 		scc_mgr_set_oct_out1_delay(write_group, IO_DQS_OUT_RESERVE);
6333da42859SDinh Nguyen 		scc_mgr_load_dqs_for_write_group(write_group);
6343da42859SDinh Nguyen 
6353da42859SDinh Nguyen 		/* multicast to all DQS IO enables (only 1) */
636e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->dqs_io_ena;
6373da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
6383da42859SDinh Nguyen 
6393da42859SDinh Nguyen 		/* hit update to zero everything */
640e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->update;
6413da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
6423da42859SDinh Nguyen 	}
6433da42859SDinh Nguyen }
6443da42859SDinh Nguyen 
6453da42859SDinh Nguyen /* load up dqs config settings */
6463da42859SDinh Nguyen static void scc_mgr_load_dqs(uint32_t dqs)
6473da42859SDinh Nguyen {
648e79025a7SMarek Vasut 	uint32_t addr = (u32)&sdr_scc_mgr->dqs_ena;
6493da42859SDinh Nguyen 
6503da42859SDinh Nguyen 	writel(dqs, SOCFPGA_SDR_ADDRESS + addr);
6513da42859SDinh Nguyen }
6523da42859SDinh Nguyen 
6533da42859SDinh Nguyen static void scc_mgr_load_dqs_for_write_group(uint32_t write_group)
6543da42859SDinh Nguyen {
6553da42859SDinh Nguyen 	uint32_t read_group;
656e79025a7SMarek Vasut 	uint32_t addr = (u32)&sdr_scc_mgr->dqs_ena;
6573da42859SDinh Nguyen 	/*
6583da42859SDinh Nguyen 	 * Although OCT affects only write data, the OCT delay is controlled
6593da42859SDinh Nguyen 	 * by the DQS logic block which is instantiated once per read group.
6603da42859SDinh Nguyen 	 * For protocols where a write group consists of multiple read groups,
6613da42859SDinh Nguyen 	 * the setting must be scanned multiple times.
6623da42859SDinh Nguyen 	 */
6633da42859SDinh Nguyen 	for (read_group = write_group * RW_MGR_MEM_IF_READ_DQS_WIDTH /
6643da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH;
6653da42859SDinh Nguyen 	     read_group < (write_group + 1) * RW_MGR_MEM_IF_READ_DQS_WIDTH /
6663da42859SDinh Nguyen 	     RW_MGR_MEM_IF_WRITE_DQS_WIDTH; ++read_group)
6673da42859SDinh Nguyen 		writel(read_group, SOCFPGA_SDR_ADDRESS + addr);
6683da42859SDinh Nguyen }
6693da42859SDinh Nguyen 
6703da42859SDinh Nguyen /* load up dqs io config settings */
6713da42859SDinh Nguyen static void scc_mgr_load_dqs_io(void)
6723da42859SDinh Nguyen {
673e79025a7SMarek Vasut 	uint32_t addr = (u32)&sdr_scc_mgr->dqs_io_ena;
6743da42859SDinh Nguyen 
6753da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
6763da42859SDinh Nguyen }
6773da42859SDinh Nguyen 
6783da42859SDinh Nguyen /* load up dq config settings */
6793da42859SDinh Nguyen static void scc_mgr_load_dq(uint32_t dq_in_group)
6803da42859SDinh Nguyen {
681e79025a7SMarek Vasut 	uint32_t addr = (u32)&sdr_scc_mgr->dq_ena;
6823da42859SDinh Nguyen 
6833da42859SDinh Nguyen 	writel(dq_in_group, SOCFPGA_SDR_ADDRESS + addr);
6843da42859SDinh Nguyen }
6853da42859SDinh Nguyen 
6863da42859SDinh Nguyen /* load up dm config settings */
6873da42859SDinh Nguyen static void scc_mgr_load_dm(uint32_t dm)
6883da42859SDinh Nguyen {
689e79025a7SMarek Vasut 	uint32_t addr = (u32)&sdr_scc_mgr->dm_ena;
6903da42859SDinh Nguyen 
6913da42859SDinh Nguyen 	writel(dm, SOCFPGA_SDR_ADDRESS + addr);
6923da42859SDinh Nguyen }
6933da42859SDinh Nguyen 
6943da42859SDinh Nguyen /*
6953da42859SDinh Nguyen  * apply and load a particular input delay for the DQ pins in a group
6963da42859SDinh Nguyen  * group_bgn is the index of the first dq pin (in the write group)
6973da42859SDinh Nguyen  */
6983da42859SDinh Nguyen static void scc_mgr_apply_group_dq_in_delay(uint32_t write_group,
6993da42859SDinh Nguyen 					    uint32_t group_bgn, uint32_t delay)
7003da42859SDinh Nguyen {
7013da42859SDinh Nguyen 	uint32_t i, p;
7023da42859SDinh Nguyen 
7033da42859SDinh Nguyen 	for (i = 0, p = group_bgn; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++, p++) {
7043da42859SDinh Nguyen 		scc_mgr_set_dq_in_delay(write_group, p, delay);
7053da42859SDinh Nguyen 		scc_mgr_load_dq(p);
7063da42859SDinh Nguyen 	}
7073da42859SDinh Nguyen }
7083da42859SDinh Nguyen 
7093da42859SDinh Nguyen /* apply and load a particular output delay for the DQ pins in a group */
7103da42859SDinh Nguyen static void scc_mgr_apply_group_dq_out1_delay(uint32_t write_group,
7113da42859SDinh Nguyen 					      uint32_t group_bgn,
7123da42859SDinh Nguyen 					      uint32_t delay1)
7133da42859SDinh Nguyen {
7143da42859SDinh Nguyen 	uint32_t i, p;
7153da42859SDinh Nguyen 
7163da42859SDinh Nguyen 	for (i = 0, p = group_bgn; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++, p++) {
7173da42859SDinh Nguyen 		scc_mgr_set_dq_out1_delay(write_group, i, delay1);
7183da42859SDinh Nguyen 		scc_mgr_load_dq(i);
7193da42859SDinh Nguyen 	}
7203da42859SDinh Nguyen }
7213da42859SDinh Nguyen 
7223da42859SDinh Nguyen /* apply and load a particular output delay for the DM pins in a group */
7233da42859SDinh Nguyen static void scc_mgr_apply_group_dm_out1_delay(uint32_t write_group,
7243da42859SDinh Nguyen 					      uint32_t delay1)
7253da42859SDinh Nguyen {
7263da42859SDinh Nguyen 	uint32_t i;
7273da42859SDinh Nguyen 
7283da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_NUM_DM_PER_WRITE_GROUP; i++) {
7293da42859SDinh Nguyen 		scc_mgr_set_dm_out1_delay(write_group, i, delay1);
7303da42859SDinh Nguyen 		scc_mgr_load_dm(i);
7313da42859SDinh Nguyen 	}
7323da42859SDinh Nguyen }
7333da42859SDinh Nguyen 
7343da42859SDinh Nguyen 
7353da42859SDinh Nguyen /* apply and load delay on both DQS and OCT out1 */
7363da42859SDinh Nguyen static void scc_mgr_apply_group_dqs_io_and_oct_out1(uint32_t write_group,
7373da42859SDinh Nguyen 						    uint32_t delay)
7383da42859SDinh Nguyen {
7393da42859SDinh Nguyen 	scc_mgr_set_dqs_out1_delay(write_group, delay);
7403da42859SDinh Nguyen 	scc_mgr_load_dqs_io();
7413da42859SDinh Nguyen 
7423da42859SDinh Nguyen 	scc_mgr_set_oct_out1_delay(write_group, delay);
7433da42859SDinh Nguyen 	scc_mgr_load_dqs_for_write_group(write_group);
7443da42859SDinh Nguyen }
7453da42859SDinh Nguyen 
7463da42859SDinh Nguyen /* apply a delay to the entire output side: DQ, DM, DQS, OCT */
7473da42859SDinh Nguyen static void scc_mgr_apply_group_all_out_delay_add(uint32_t write_group,
7483da42859SDinh Nguyen 						  uint32_t group_bgn,
7493da42859SDinh Nguyen 						  uint32_t delay)
7503da42859SDinh Nguyen {
7513da42859SDinh Nguyen 	uint32_t i, p, new_delay;
7523da42859SDinh Nguyen 
7533da42859SDinh Nguyen 	/* dq shift */
7543da42859SDinh Nguyen 	for (i = 0, p = group_bgn; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++, p++) {
7553da42859SDinh Nguyen 		new_delay = READ_SCC_DQ_OUT2_DELAY;
7563da42859SDinh Nguyen 		new_delay += delay;
7573da42859SDinh Nguyen 
7583da42859SDinh Nguyen 		if (new_delay > IO_IO_OUT2_DELAY_MAX) {
7593da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DQ[%u,%u]:\
7603da42859SDinh Nguyen 				   %u > %lu => %lu", __func__, __LINE__,
7613da42859SDinh Nguyen 				   write_group, group_bgn, delay, i, p, new_delay,
7623da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX,
7633da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX);
7643da42859SDinh Nguyen 			new_delay = IO_IO_OUT2_DELAY_MAX;
7653da42859SDinh Nguyen 		}
7663da42859SDinh Nguyen 
7673da42859SDinh Nguyen 		scc_mgr_load_dq(i);
7683da42859SDinh Nguyen 	}
7693da42859SDinh Nguyen 
7703da42859SDinh Nguyen 	/* dm shift */
7713da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_NUM_DM_PER_WRITE_GROUP; i++) {
7723da42859SDinh Nguyen 		new_delay = READ_SCC_DM_IO_OUT2_DELAY;
7733da42859SDinh Nguyen 		new_delay += delay;
7743da42859SDinh Nguyen 
7753da42859SDinh Nguyen 		if (new_delay > IO_IO_OUT2_DELAY_MAX) {
7763da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DM[%u]:\
7773da42859SDinh Nguyen 				   %u > %lu => %lu\n",  __func__, __LINE__,
7783da42859SDinh Nguyen 				   write_group, group_bgn, delay, i, new_delay,
7793da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX,
7803da42859SDinh Nguyen 				   (long unsigned int)IO_IO_OUT2_DELAY_MAX);
7813da42859SDinh Nguyen 			new_delay = IO_IO_OUT2_DELAY_MAX;
7823da42859SDinh Nguyen 		}
7833da42859SDinh Nguyen 
7843da42859SDinh Nguyen 		scc_mgr_load_dm(i);
7853da42859SDinh Nguyen 	}
7863da42859SDinh Nguyen 
7873da42859SDinh Nguyen 	/* dqs shift */
7883da42859SDinh Nguyen 	new_delay = READ_SCC_DQS_IO_OUT2_DELAY;
7893da42859SDinh Nguyen 	new_delay += delay;
7903da42859SDinh Nguyen 
7913da42859SDinh Nguyen 	if (new_delay > IO_IO_OUT2_DELAY_MAX) {
7923da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DQS: %u > %d => %d;"
7933da42859SDinh Nguyen 			   " adding %u to OUT1\n", __func__, __LINE__,
7943da42859SDinh Nguyen 			   write_group, group_bgn, delay, new_delay,
7953da42859SDinh Nguyen 			   IO_IO_OUT2_DELAY_MAX, IO_IO_OUT2_DELAY_MAX,
7963da42859SDinh Nguyen 			   new_delay - IO_IO_OUT2_DELAY_MAX);
7973da42859SDinh Nguyen 		scc_mgr_set_dqs_out1_delay(write_group, new_delay -
7983da42859SDinh Nguyen 					   IO_IO_OUT2_DELAY_MAX);
7993da42859SDinh Nguyen 		new_delay = IO_IO_OUT2_DELAY_MAX;
8003da42859SDinh Nguyen 	}
8013da42859SDinh Nguyen 
8023da42859SDinh Nguyen 	scc_mgr_load_dqs_io();
8033da42859SDinh Nguyen 
8043da42859SDinh Nguyen 	/* oct shift */
8053da42859SDinh Nguyen 	new_delay = READ_SCC_OCT_OUT2_DELAY;
8063da42859SDinh Nguyen 	new_delay += delay;
8073da42859SDinh Nguyen 
8083da42859SDinh Nguyen 	if (new_delay > IO_IO_OUT2_DELAY_MAX) {
8093da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d (%u, %u, %u) DQS: %u > %d => %d;"
8103da42859SDinh Nguyen 			   " adding %u to OUT1\n", __func__, __LINE__,
8113da42859SDinh Nguyen 			   write_group, group_bgn, delay, new_delay,
8123da42859SDinh Nguyen 			   IO_IO_OUT2_DELAY_MAX, IO_IO_OUT2_DELAY_MAX,
8133da42859SDinh Nguyen 			   new_delay - IO_IO_OUT2_DELAY_MAX);
8143da42859SDinh Nguyen 		scc_mgr_set_oct_out1_delay(write_group, new_delay -
8153da42859SDinh Nguyen 					   IO_IO_OUT2_DELAY_MAX);
8163da42859SDinh Nguyen 		new_delay = IO_IO_OUT2_DELAY_MAX;
8173da42859SDinh Nguyen 	}
8183da42859SDinh Nguyen 
8193da42859SDinh Nguyen 	scc_mgr_load_dqs_for_write_group(write_group);
8203da42859SDinh Nguyen }
8213da42859SDinh Nguyen 
8223da42859SDinh Nguyen /*
8233da42859SDinh Nguyen  * USER apply a delay to the entire output side (DQ, DM, DQS, OCT)
8243da42859SDinh Nguyen  * and to all ranks
8253da42859SDinh Nguyen  */
8263da42859SDinh Nguyen static void scc_mgr_apply_group_all_out_delay_add_all_ranks(
8273da42859SDinh Nguyen 	uint32_t write_group, uint32_t group_bgn, uint32_t delay)
8283da42859SDinh Nguyen {
8293da42859SDinh Nguyen 	uint32_t r;
830e79025a7SMarek Vasut 	uint32_t addr = (u32)&sdr_scc_mgr->update;
8313da42859SDinh Nguyen 
8323da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
8333da42859SDinh Nguyen 		r += NUM_RANKS_PER_SHADOW_REG) {
8343da42859SDinh Nguyen 		scc_mgr_apply_group_all_out_delay_add(write_group,
8353da42859SDinh Nguyen 						      group_bgn, delay);
8363da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
8373da42859SDinh Nguyen 	}
8383da42859SDinh Nguyen }
8393da42859SDinh Nguyen 
8403da42859SDinh Nguyen /* optimization used to recover some slots in ddr3 inst_rom */
8413da42859SDinh Nguyen /* could be applied to other protocols if we wanted to */
8423da42859SDinh Nguyen static void set_jump_as_return(void)
8433da42859SDinh Nguyen {
8446afb4fe2SMarek Vasut 	uint32_t addr = (u32)&sdr_rw_load_mgr_regs->load_cntr0;
8453da42859SDinh Nguyen 
8463da42859SDinh Nguyen 	/*
8473da42859SDinh Nguyen 	 * to save space, we replace return with jump to special shared
8483da42859SDinh Nguyen 	 * RETURN instruction so we set the counter to large value so that
8493da42859SDinh Nguyen 	 * we always jump
8503da42859SDinh Nguyen 	 */
8513da42859SDinh Nguyen 	writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
8526afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add0;
8533da42859SDinh Nguyen 	writel(RW_MGR_RETURN, SOCFPGA_SDR_ADDRESS + addr);
8543da42859SDinh Nguyen }
8553da42859SDinh Nguyen 
8563da42859SDinh Nguyen /*
8573da42859SDinh Nguyen  * should always use constants as argument to ensure all computations are
8583da42859SDinh Nguyen  * performed at compile time
8593da42859SDinh Nguyen  */
8603da42859SDinh Nguyen static void delay_for_n_mem_clocks(const uint32_t clocks)
8613da42859SDinh Nguyen {
8623da42859SDinh Nguyen 	uint32_t afi_clocks;
8633da42859SDinh Nguyen 	uint8_t inner = 0;
8643da42859SDinh Nguyen 	uint8_t outer = 0;
8653da42859SDinh Nguyen 	uint16_t c_loop = 0;
8663da42859SDinh Nguyen 	uint32_t addr;
8673da42859SDinh Nguyen 
8683da42859SDinh Nguyen 	debug("%s:%d: clocks=%u ... start\n", __func__, __LINE__, clocks);
8693da42859SDinh Nguyen 
8703da42859SDinh Nguyen 
8713da42859SDinh Nguyen 	afi_clocks = (clocks + AFI_RATE_RATIO-1) / AFI_RATE_RATIO;
8723da42859SDinh Nguyen 	/* scale (rounding up) to get afi clocks */
8733da42859SDinh Nguyen 
8743da42859SDinh Nguyen 	/*
8753da42859SDinh Nguyen 	 * Note, we don't bother accounting for being off a little bit
8763da42859SDinh Nguyen 	 * because of a few extra instructions in outer loops
8773da42859SDinh Nguyen 	 * Note, the loops have a test at the end, and do the test before
8783da42859SDinh Nguyen 	 * the decrement, and so always perform the loop
8793da42859SDinh Nguyen 	 * 1 time more than the counter value
8803da42859SDinh Nguyen 	 */
8813da42859SDinh Nguyen 	if (afi_clocks == 0) {
8823da42859SDinh Nguyen 		;
8833da42859SDinh Nguyen 	} else if (afi_clocks <= 0x100) {
8843da42859SDinh Nguyen 		inner = afi_clocks-1;
8853da42859SDinh Nguyen 		outer = 0;
8863da42859SDinh Nguyen 		c_loop = 0;
8873da42859SDinh Nguyen 	} else if (afi_clocks <= 0x10000) {
8883da42859SDinh Nguyen 		inner = 0xff;
8893da42859SDinh Nguyen 		outer = (afi_clocks-1) >> 8;
8903da42859SDinh Nguyen 		c_loop = 0;
8913da42859SDinh Nguyen 	} else {
8923da42859SDinh Nguyen 		inner = 0xff;
8933da42859SDinh Nguyen 		outer = 0xff;
8943da42859SDinh Nguyen 		c_loop = (afi_clocks-1) >> 16;
8953da42859SDinh Nguyen 	}
8963da42859SDinh Nguyen 
8973da42859SDinh Nguyen 	/*
8983da42859SDinh Nguyen 	 * rom instructions are structured as follows:
8993da42859SDinh Nguyen 	 *
9003da42859SDinh Nguyen 	 *    IDLE_LOOP2: jnz cntr0, TARGET_A
9013da42859SDinh Nguyen 	 *    IDLE_LOOP1: jnz cntr1, TARGET_B
9023da42859SDinh Nguyen 	 *                return
9033da42859SDinh Nguyen 	 *
9043da42859SDinh Nguyen 	 * so, when doing nested loops, TARGET_A is set to IDLE_LOOP2, and
9053da42859SDinh Nguyen 	 * TARGET_B is set to IDLE_LOOP2 as well
9063da42859SDinh Nguyen 	 *
9073da42859SDinh Nguyen 	 * if we have no outer loop, though, then we can use IDLE_LOOP1 only,
9083da42859SDinh Nguyen 	 * and set TARGET_B to IDLE_LOOP1 and we skip IDLE_LOOP2 entirely
9093da42859SDinh Nguyen 	 *
9103da42859SDinh Nguyen 	 * a little confusing, but it helps save precious space in the inst_rom
9113da42859SDinh Nguyen 	 * and sequencer rom and keeps the delays more accurate and reduces
9123da42859SDinh Nguyen 	 * overhead
9133da42859SDinh Nguyen 	 */
9143da42859SDinh Nguyen 	if (afi_clocks <= 0x100) {
9156afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr1;
9163da42859SDinh Nguyen 		writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(inner), SOCFPGA_SDR_ADDRESS + addr);
9173da42859SDinh Nguyen 
9186afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add1;
9193da42859SDinh Nguyen 		writel(RW_MGR_IDLE_LOOP1, SOCFPGA_SDR_ADDRESS + addr);
9203da42859SDinh Nguyen 
921*c4815f76SMarek Vasut 		addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
9223da42859SDinh Nguyen 		writel(RW_MGR_IDLE_LOOP1, SOCFPGA_SDR_ADDRESS + addr);
9233da42859SDinh Nguyen 	} else {
9246afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr0;
9253da42859SDinh Nguyen 		writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(inner), SOCFPGA_SDR_ADDRESS + addr);
9263da42859SDinh Nguyen 
9276afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr1;
9283da42859SDinh Nguyen 		writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(outer), SOCFPGA_SDR_ADDRESS + addr);
9293da42859SDinh Nguyen 
9306afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add0;
9313da42859SDinh Nguyen 		writel(RW_MGR_IDLE_LOOP2, SOCFPGA_SDR_ADDRESS + addr);
9323da42859SDinh Nguyen 
9336afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add1;
9343da42859SDinh Nguyen 		writel(RW_MGR_IDLE_LOOP2, SOCFPGA_SDR_ADDRESS + addr);
9353da42859SDinh Nguyen 
9363da42859SDinh Nguyen 		/* hack to get around compiler not being smart enough */
9373da42859SDinh Nguyen 		if (afi_clocks <= 0x10000) {
9383da42859SDinh Nguyen 			/* only need to run once */
939*c4815f76SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
9403da42859SDinh Nguyen 			writel(RW_MGR_IDLE_LOOP2, SOCFPGA_SDR_ADDRESS + addr);
9413da42859SDinh Nguyen 		} else {
9423da42859SDinh Nguyen 			do {
943*c4815f76SMarek Vasut 				addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
9443da42859SDinh Nguyen 				writel(RW_MGR_IDLE_LOOP2, SOCFPGA_SDR_ADDRESS + addr);
9453da42859SDinh Nguyen 			} while (c_loop-- != 0);
9463da42859SDinh Nguyen 		}
9473da42859SDinh Nguyen 	}
9483da42859SDinh Nguyen 	debug("%s:%d clocks=%u ... end\n", __func__, __LINE__, clocks);
9493da42859SDinh Nguyen }
9503da42859SDinh Nguyen 
9513da42859SDinh Nguyen static void rw_mgr_mem_initialize(void)
9523da42859SDinh Nguyen {
9533da42859SDinh Nguyen 	uint32_t r;
9543da42859SDinh Nguyen 	uint32_t addr;
9553da42859SDinh Nguyen 
9563da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
9573da42859SDinh Nguyen 
9583da42859SDinh Nguyen 	/* The reset / cke part of initialization is broadcasted to all ranks */
959*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_SET_CS_AND_ODT_MASK_OFFSET;
9603da42859SDinh Nguyen 	writel(RW_MGR_RANK_ALL, SOCFPGA_SDR_ADDRESS + addr);
9613da42859SDinh Nguyen 
9623da42859SDinh Nguyen 	/*
9633da42859SDinh Nguyen 	 * Here's how you load register for a loop
9643da42859SDinh Nguyen 	 * Counters are located @ 0x800
9653da42859SDinh Nguyen 	 * Jump address are located @ 0xC00
9663da42859SDinh Nguyen 	 * For both, registers 0 to 3 are selected using bits 3 and 2, like
9673da42859SDinh Nguyen 	 * in 0x800, 0x804, 0x808, 0x80C and 0xC00, 0xC04, 0xC08, 0xC0C
9683da42859SDinh Nguyen 	 * I know this ain't pretty, but Avalon bus throws away the 2 least
9693da42859SDinh Nguyen 	 * significant bits
9703da42859SDinh Nguyen 	 */
9713da42859SDinh Nguyen 
9723da42859SDinh Nguyen 	/* start with memory RESET activated */
9733da42859SDinh Nguyen 
9743da42859SDinh Nguyen 	/* tINIT = 200us */
9753da42859SDinh Nguyen 
9763da42859SDinh Nguyen 	/*
9773da42859SDinh Nguyen 	 * 200us @ 266MHz (3.75 ns) ~ 54000 clock cycles
9783da42859SDinh Nguyen 	 * If a and b are the number of iteration in 2 nested loops
9793da42859SDinh Nguyen 	 * it takes the following number of cycles to complete the operation:
9803da42859SDinh Nguyen 	 * number_of_cycles = ((2 + n) * a + 2) * b
9813da42859SDinh Nguyen 	 * where n is the number of instruction in the inner loop
9823da42859SDinh Nguyen 	 * One possible solution is n = 0 , a = 256 , b = 106 => a = FF,
9833da42859SDinh Nguyen 	 * b = 6A
9843da42859SDinh Nguyen 	 */
9853da42859SDinh Nguyen 
9863da42859SDinh Nguyen 	/* Load counters */
9876afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_mgr_regs->load_cntr0;
9883da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TINIT_CNTR0_VAL),
9893da42859SDinh Nguyen 	       SOCFPGA_SDR_ADDRESS + addr);
9906afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_mgr_regs->load_cntr1;
9913da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TINIT_CNTR1_VAL),
9923da42859SDinh Nguyen 	       SOCFPGA_SDR_ADDRESS + addr);
9936afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_mgr_regs->load_cntr2;
9943da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TINIT_CNTR2_VAL),
9953da42859SDinh Nguyen 	       SOCFPGA_SDR_ADDRESS + addr);
9963da42859SDinh Nguyen 
9973da42859SDinh Nguyen 	/* Load jump address */
9986afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add0;
9993da42859SDinh Nguyen 	writel(RW_MGR_INIT_RESET_0_CKE_0, SOCFPGA_SDR_ADDRESS + addr);
10003da42859SDinh Nguyen 
10016afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add1;
10023da42859SDinh Nguyen 	writel(RW_MGR_INIT_RESET_0_CKE_0, SOCFPGA_SDR_ADDRESS + addr);
10033da42859SDinh Nguyen 
10046afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add2;
10053da42859SDinh Nguyen 	writel(RW_MGR_INIT_RESET_0_CKE_0, SOCFPGA_SDR_ADDRESS + addr);
10063da42859SDinh Nguyen 
10073da42859SDinh Nguyen 	/* Execute count instruction */
1008*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
10093da42859SDinh Nguyen 	writel(RW_MGR_INIT_RESET_0_CKE_0, SOCFPGA_SDR_ADDRESS + addr);
10103da42859SDinh Nguyen 
10113da42859SDinh Nguyen 	/* indicate that memory is stable */
10121bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cfg->reset_mem_stbl;
10133da42859SDinh Nguyen 	writel(1, SOCFPGA_SDR_ADDRESS + addr);
10143da42859SDinh Nguyen 
10153da42859SDinh Nguyen 	/*
10163da42859SDinh Nguyen 	 * transition the RESET to high
10173da42859SDinh Nguyen 	 * Wait for 500us
10183da42859SDinh Nguyen 	 */
10193da42859SDinh Nguyen 
10203da42859SDinh Nguyen 	/*
10213da42859SDinh Nguyen 	 * 500us @ 266MHz (3.75 ns) ~ 134000 clock cycles
10223da42859SDinh Nguyen 	 * If a and b are the number of iteration in 2 nested loops
10233da42859SDinh Nguyen 	 * it takes the following number of cycles to complete the operation
10243da42859SDinh Nguyen 	 * number_of_cycles = ((2 + n) * a + 2) * b
10253da42859SDinh Nguyen 	 * where n is the number of instruction in the inner loop
10263da42859SDinh Nguyen 	 * One possible solution is n = 2 , a = 131 , b = 256 => a = 83,
10273da42859SDinh Nguyen 	 * b = FF
10283da42859SDinh Nguyen 	 */
10293da42859SDinh Nguyen 
10303da42859SDinh Nguyen 	/* Load counters */
10316afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_mgr_regs->load_cntr0;
10323da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TRESET_CNTR0_VAL),
10333da42859SDinh Nguyen 	       SOCFPGA_SDR_ADDRESS + addr);
10346afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_mgr_regs->load_cntr1;
10353da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TRESET_CNTR1_VAL),
10363da42859SDinh Nguyen 	       SOCFPGA_SDR_ADDRESS + addr);
10376afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_mgr_regs->load_cntr2;
10383da42859SDinh Nguyen 	writel(SKIP_DELAY_LOOP_VALUE_OR_ZERO(SEQ_TRESET_CNTR2_VAL),
10393da42859SDinh Nguyen 	       SOCFPGA_SDR_ADDRESS + addr);
10403da42859SDinh Nguyen 
10413da42859SDinh Nguyen 	/* Load jump address */
10426afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add0;
10433da42859SDinh Nguyen 	writel(RW_MGR_INIT_RESET_1_CKE_0, SOCFPGA_SDR_ADDRESS + addr);
10446afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add1;
10453da42859SDinh Nguyen 	writel(RW_MGR_INIT_RESET_1_CKE_0, SOCFPGA_SDR_ADDRESS + addr);
10466afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add2;
10473da42859SDinh Nguyen 	writel(RW_MGR_INIT_RESET_1_CKE_0, SOCFPGA_SDR_ADDRESS + addr);
10483da42859SDinh Nguyen 
1049*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
10503da42859SDinh Nguyen 	writel(RW_MGR_INIT_RESET_1_CKE_0, SOCFPGA_SDR_ADDRESS + addr);
10513da42859SDinh Nguyen 
10523da42859SDinh Nguyen 	/* bring up clock enable */
10533da42859SDinh Nguyen 
10543da42859SDinh Nguyen 	/* tXRP < 250 ck cycles */
10553da42859SDinh Nguyen 	delay_for_n_mem_clocks(250);
10563da42859SDinh Nguyen 
10573da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r++) {
10583da42859SDinh Nguyen 		if (param->skip_ranks[r]) {
10593da42859SDinh Nguyen 			/* request to skip the rank */
10603da42859SDinh Nguyen 			continue;
10613da42859SDinh Nguyen 		}
10623da42859SDinh Nguyen 
10633da42859SDinh Nguyen 		/* set rank */
10643da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_OFF);
10653da42859SDinh Nguyen 
10663da42859SDinh Nguyen 		/*
10673da42859SDinh Nguyen 		 * USER Use Mirror-ed commands for odd ranks if address
10683da42859SDinh Nguyen 		 * mirrorring is on
10693da42859SDinh Nguyen 		 */
10703da42859SDinh Nguyen 		if ((RW_MGR_MEM_ADDRESS_MIRRORING >> r) & 0x1) {
10713da42859SDinh Nguyen 			set_jump_as_return();
1072*c4815f76SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
10733da42859SDinh Nguyen 			writel(RW_MGR_MRS2_MIRR, SOCFPGA_SDR_ADDRESS + addr);
10743da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10753da42859SDinh Nguyen 			set_jump_as_return();
10763da42859SDinh Nguyen 			writel(RW_MGR_MRS3_MIRR, SOCFPGA_SDR_ADDRESS + addr);
10773da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10783da42859SDinh Nguyen 			set_jump_as_return();
10793da42859SDinh Nguyen 			writel(RW_MGR_MRS1_MIRR, SOCFPGA_SDR_ADDRESS + addr);
10803da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10813da42859SDinh Nguyen 			set_jump_as_return();
10823da42859SDinh Nguyen 			writel(RW_MGR_MRS0_DLL_RESET_MIRR, SOCFPGA_SDR_ADDRESS + addr);
10833da42859SDinh Nguyen 		} else {
10843da42859SDinh Nguyen 			set_jump_as_return();
1085*c4815f76SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
10863da42859SDinh Nguyen 			writel(RW_MGR_MRS2, SOCFPGA_SDR_ADDRESS + addr);
10873da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10883da42859SDinh Nguyen 			set_jump_as_return();
10893da42859SDinh Nguyen 			writel(RW_MGR_MRS3, SOCFPGA_SDR_ADDRESS + addr);
10903da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
10913da42859SDinh Nguyen 			set_jump_as_return();
10923da42859SDinh Nguyen 			writel(RW_MGR_MRS1, SOCFPGA_SDR_ADDRESS + addr);
10933da42859SDinh Nguyen 			set_jump_as_return();
10943da42859SDinh Nguyen 			writel(RW_MGR_MRS0_DLL_RESET, SOCFPGA_SDR_ADDRESS + addr);
10953da42859SDinh Nguyen 		}
10963da42859SDinh Nguyen 		set_jump_as_return();
1097*c4815f76SMarek Vasut 		addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
10983da42859SDinh Nguyen 		writel(RW_MGR_ZQCL, SOCFPGA_SDR_ADDRESS + addr);
10993da42859SDinh Nguyen 
11003da42859SDinh Nguyen 		/* tZQinit = tDLLK = 512 ck cycles */
11013da42859SDinh Nguyen 		delay_for_n_mem_clocks(512);
11023da42859SDinh Nguyen 	}
11033da42859SDinh Nguyen }
11043da42859SDinh Nguyen 
11053da42859SDinh Nguyen /*
11063da42859SDinh Nguyen  * At the end of calibration we have to program the user settings in, and
11073da42859SDinh Nguyen  * USER  hand off the memory to the user.
11083da42859SDinh Nguyen  */
11093da42859SDinh Nguyen static void rw_mgr_mem_handoff(void)
11103da42859SDinh Nguyen {
11113da42859SDinh Nguyen 	uint32_t r;
11123da42859SDinh Nguyen 	uint32_t addr;
11133da42859SDinh Nguyen 
11143da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
11153da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r++) {
11163da42859SDinh Nguyen 		if (param->skip_ranks[r])
11173da42859SDinh Nguyen 			/* request to skip the rank */
11183da42859SDinh Nguyen 			continue;
11193da42859SDinh Nguyen 		/* set rank */
11203da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_OFF);
11213da42859SDinh Nguyen 
11223da42859SDinh Nguyen 		/* precharge all banks ... */
1123*c4815f76SMarek Vasut 		addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
11243da42859SDinh Nguyen 		writel(RW_MGR_PRECHARGE_ALL, SOCFPGA_SDR_ADDRESS + addr);
11253da42859SDinh Nguyen 
11263da42859SDinh Nguyen 		/* load up MR settings specified by user */
11273da42859SDinh Nguyen 
11283da42859SDinh Nguyen 		/*
11293da42859SDinh Nguyen 		 * Use Mirror-ed commands for odd ranks if address
11303da42859SDinh Nguyen 		 * mirrorring is on
11313da42859SDinh Nguyen 		 */
1132*c4815f76SMarek Vasut 		addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
11333da42859SDinh Nguyen 		if ((RW_MGR_MEM_ADDRESS_MIRRORING >> r) & 0x1) {
11343da42859SDinh Nguyen 			set_jump_as_return();
11353da42859SDinh Nguyen 			writel(RW_MGR_MRS2_MIRR, SOCFPGA_SDR_ADDRESS + addr);
11363da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
11373da42859SDinh Nguyen 			set_jump_as_return();
11383da42859SDinh Nguyen 			writel(RW_MGR_MRS3_MIRR, SOCFPGA_SDR_ADDRESS + addr);
11393da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
11403da42859SDinh Nguyen 			set_jump_as_return();
11413da42859SDinh Nguyen 			writel(RW_MGR_MRS1_MIRR, SOCFPGA_SDR_ADDRESS + addr);
11423da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
11433da42859SDinh Nguyen 			set_jump_as_return();
11443da42859SDinh Nguyen 			writel(RW_MGR_MRS0_USER_MIRR, SOCFPGA_SDR_ADDRESS + addr);
11453da42859SDinh Nguyen 		} else {
11463da42859SDinh Nguyen 			set_jump_as_return();
11473da42859SDinh Nguyen 			writel(RW_MGR_MRS2, SOCFPGA_SDR_ADDRESS + addr);
11483da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
11493da42859SDinh Nguyen 			set_jump_as_return();
11503da42859SDinh Nguyen 			writel(RW_MGR_MRS3, SOCFPGA_SDR_ADDRESS + addr);
11513da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
11523da42859SDinh Nguyen 			set_jump_as_return();
11533da42859SDinh Nguyen 			writel(RW_MGR_MRS1, SOCFPGA_SDR_ADDRESS + addr);
11543da42859SDinh Nguyen 			delay_for_n_mem_clocks(4);
11553da42859SDinh Nguyen 			set_jump_as_return();
11563da42859SDinh Nguyen 			writel(RW_MGR_MRS0_USER, SOCFPGA_SDR_ADDRESS + addr);
11573da42859SDinh Nguyen 		}
11583da42859SDinh Nguyen 		/*
11593da42859SDinh Nguyen 		 * USER  need to wait tMOD (12CK or 15ns) time before issuing
11603da42859SDinh Nguyen 		 * other commands, but we will have plenty of NIOS cycles before
11613da42859SDinh Nguyen 		 * actual handoff so its okay.
11623da42859SDinh Nguyen 		 */
11633da42859SDinh Nguyen 	}
11643da42859SDinh Nguyen }
11653da42859SDinh Nguyen 
11663da42859SDinh Nguyen /*
11673da42859SDinh Nguyen  * performs a guaranteed read on the patterns we are going to use during a
11683da42859SDinh Nguyen  * read test to ensure memory works
11693da42859SDinh Nguyen  */
11703da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test_patterns(uint32_t rank_bgn,
11713da42859SDinh Nguyen 	uint32_t group, uint32_t num_tries, uint32_t *bit_chk,
11723da42859SDinh Nguyen 	uint32_t all_ranks)
11733da42859SDinh Nguyen {
11743da42859SDinh Nguyen 	uint32_t r, vg;
11753da42859SDinh Nguyen 	uint32_t correct_mask_vg;
11763da42859SDinh Nguyen 	uint32_t tmp_bit_chk;
11773da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
11783da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
11793da42859SDinh Nguyen 	uint32_t addr;
11803da42859SDinh Nguyen 	uint32_t base_rw_mgr;
11813da42859SDinh Nguyen 
11823da42859SDinh Nguyen 	*bit_chk = param->read_correct_mask;
11833da42859SDinh Nguyen 	correct_mask_vg = param->read_correct_mask_vg;
11843da42859SDinh Nguyen 
11853da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
11863da42859SDinh Nguyen 		if (param->skip_ranks[r])
11873da42859SDinh Nguyen 			/* request to skip the rank */
11883da42859SDinh Nguyen 			continue;
11893da42859SDinh Nguyen 
11903da42859SDinh Nguyen 		/* set rank */
11913da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
11923da42859SDinh Nguyen 
11933da42859SDinh Nguyen 		/* Load up a constant bursts of read commands */
11946afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr0;
11953da42859SDinh Nguyen 		writel(0x20, SOCFPGA_SDR_ADDRESS + addr);
11966afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add0;
11973da42859SDinh Nguyen 		writel(RW_MGR_GUARANTEED_READ, SOCFPGA_SDR_ADDRESS + addr);
11983da42859SDinh Nguyen 
11996afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr1;
12003da42859SDinh Nguyen 		writel(0x20, SOCFPGA_SDR_ADDRESS + addr);
12016afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add1;
12023da42859SDinh Nguyen 		writel(RW_MGR_GUARANTEED_READ_CONT, SOCFPGA_SDR_ADDRESS + addr);
12033da42859SDinh Nguyen 
12043da42859SDinh Nguyen 		tmp_bit_chk = 0;
12053da42859SDinh Nguyen 		for (vg = RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS-1; ; vg--) {
12063da42859SDinh Nguyen 			/* reset the fifos to get pointers to known state */
12073da42859SDinh Nguyen 
12081bc6f14aSMarek Vasut 			addr = (u32)&phy_mgr_cmd->fifo_reset;
12093da42859SDinh Nguyen 			writel(0, SOCFPGA_SDR_ADDRESS + addr);
1210*c4815f76SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RESET_READ_DATAPATH_OFFSET;
12113da42859SDinh Nguyen 			writel(0, SOCFPGA_SDR_ADDRESS + addr);
12123da42859SDinh Nguyen 
12133da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk << (RW_MGR_MEM_DQ_PER_READ_DQS
12143da42859SDinh Nguyen 				/ RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS);
12153da42859SDinh Nguyen 
1216*c4815f76SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
12173da42859SDinh Nguyen 			writel(RW_MGR_GUARANTEED_READ, SOCFPGA_SDR_ADDRESS + addr +
12183da42859SDinh Nguyen 			       ((group * RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS +
12193da42859SDinh Nguyen 				vg) << 2));
12203da42859SDinh Nguyen 
1221a4bfa463SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS;
12223da42859SDinh Nguyen 			base_rw_mgr = readl(SOCFPGA_SDR_ADDRESS + addr);
12233da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk | (correct_mask_vg & (~base_rw_mgr));
12243da42859SDinh Nguyen 
12253da42859SDinh Nguyen 			if (vg == 0)
12263da42859SDinh Nguyen 				break;
12273da42859SDinh Nguyen 		}
12283da42859SDinh Nguyen 		*bit_chk &= tmp_bit_chk;
12293da42859SDinh Nguyen 	}
12303da42859SDinh Nguyen 
1231*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
12323da42859SDinh Nguyen 	writel(RW_MGR_CLEAR_DQS_ENABLE, SOCFPGA_SDR_ADDRESS + addr + (group << 2));
12333da42859SDinh Nguyen 
12343da42859SDinh Nguyen 	set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
12353da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d test_load_patterns(%u,ALL) => (%u == %u) =>\
12363da42859SDinh Nguyen 		   %lu\n", __func__, __LINE__, group, *bit_chk, param->read_correct_mask,
12373da42859SDinh Nguyen 		   (long unsigned int)(*bit_chk == param->read_correct_mask));
12383da42859SDinh Nguyen 	return *bit_chk == param->read_correct_mask;
12393da42859SDinh Nguyen }
12403da42859SDinh Nguyen 
12413da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test_patterns_all_ranks
12423da42859SDinh Nguyen 	(uint32_t group, uint32_t num_tries, uint32_t *bit_chk)
12433da42859SDinh Nguyen {
12443da42859SDinh Nguyen 	return rw_mgr_mem_calibrate_read_test_patterns(0, group,
12453da42859SDinh Nguyen 		num_tries, bit_chk, 1);
12463da42859SDinh Nguyen }
12473da42859SDinh Nguyen 
12483da42859SDinh Nguyen /* load up the patterns we are going to use during a read test */
12493da42859SDinh Nguyen static void rw_mgr_mem_calibrate_read_load_patterns(uint32_t rank_bgn,
12503da42859SDinh Nguyen 	uint32_t all_ranks)
12513da42859SDinh Nguyen {
12523da42859SDinh Nguyen 	uint32_t r;
12533da42859SDinh Nguyen 	uint32_t addr;
12543da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
12553da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
12563da42859SDinh Nguyen 
12573da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
12583da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
12593da42859SDinh Nguyen 		if (param->skip_ranks[r])
12603da42859SDinh Nguyen 			/* request to skip the rank */
12613da42859SDinh Nguyen 			continue;
12623da42859SDinh Nguyen 
12633da42859SDinh Nguyen 		/* set rank */
12643da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
12653da42859SDinh Nguyen 
12663da42859SDinh Nguyen 		/* Load up a constant bursts */
12676afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr0;
12683da42859SDinh Nguyen 		writel(0x20, SOCFPGA_SDR_ADDRESS + addr);
12693da42859SDinh Nguyen 
12706afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add0;
12713da42859SDinh Nguyen 		writel(RW_MGR_GUARANTEED_WRITE_WAIT0, SOCFPGA_SDR_ADDRESS + addr);
12723da42859SDinh Nguyen 
12736afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr1;
12743da42859SDinh Nguyen 		writel(0x20, SOCFPGA_SDR_ADDRESS + addr);
12753da42859SDinh Nguyen 
12766afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add1;
12773da42859SDinh Nguyen 		writel(RW_MGR_GUARANTEED_WRITE_WAIT1, SOCFPGA_SDR_ADDRESS + addr);
12783da42859SDinh Nguyen 
12796afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr2;
12803da42859SDinh Nguyen 		writel(0x04, SOCFPGA_SDR_ADDRESS + addr);
12813da42859SDinh Nguyen 
12826afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add2;
12833da42859SDinh Nguyen 		writel(RW_MGR_GUARANTEED_WRITE_WAIT2, SOCFPGA_SDR_ADDRESS + addr);
12843da42859SDinh Nguyen 
12856afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr3;
12863da42859SDinh Nguyen 		writel(0x04, SOCFPGA_SDR_ADDRESS + addr);
12873da42859SDinh Nguyen 
12886afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add3;
12893da42859SDinh Nguyen 		writel(RW_MGR_GUARANTEED_WRITE_WAIT3, SOCFPGA_SDR_ADDRESS + addr);
12903da42859SDinh Nguyen 
1291*c4815f76SMarek Vasut 		addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
12923da42859SDinh Nguyen 		writel(RW_MGR_GUARANTEED_WRITE, SOCFPGA_SDR_ADDRESS + addr);
12933da42859SDinh Nguyen 	}
12943da42859SDinh Nguyen 
12953da42859SDinh Nguyen 	set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
12963da42859SDinh Nguyen }
12973da42859SDinh Nguyen 
12983da42859SDinh Nguyen /*
12993da42859SDinh Nguyen  * try a read and see if it returns correct data back. has dummy reads
13003da42859SDinh Nguyen  * inserted into the mix used to align dqs enable. has more thorough checks
13013da42859SDinh Nguyen  * than the regular read test.
13023da42859SDinh Nguyen  */
13033da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test(uint32_t rank_bgn, uint32_t group,
13043da42859SDinh Nguyen 	uint32_t num_tries, uint32_t all_correct, uint32_t *bit_chk,
13053da42859SDinh Nguyen 	uint32_t all_groups, uint32_t all_ranks)
13063da42859SDinh Nguyen {
13073da42859SDinh Nguyen 	uint32_t r, vg;
13083da42859SDinh Nguyen 	uint32_t correct_mask_vg;
13093da42859SDinh Nguyen 	uint32_t tmp_bit_chk;
13103da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
13113da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
13123da42859SDinh Nguyen 	uint32_t addr;
13133da42859SDinh Nguyen 	uint32_t base_rw_mgr;
13143da42859SDinh Nguyen 
13153da42859SDinh Nguyen 	*bit_chk = param->read_correct_mask;
13163da42859SDinh Nguyen 	correct_mask_vg = param->read_correct_mask_vg;
13173da42859SDinh Nguyen 
13183da42859SDinh Nguyen 	uint32_t quick_read_mode = (((STATIC_CALIB_STEPS) &
13193da42859SDinh Nguyen 		CALIB_SKIP_DELAY_SWEEPS) && ENABLE_SUPER_QUICK_CALIBRATION);
13203da42859SDinh Nguyen 
13213da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
13223da42859SDinh Nguyen 		if (param->skip_ranks[r])
13233da42859SDinh Nguyen 			/* request to skip the rank */
13243da42859SDinh Nguyen 			continue;
13253da42859SDinh Nguyen 
13263da42859SDinh Nguyen 		/* set rank */
13273da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
13283da42859SDinh Nguyen 
13296afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr1;
13303da42859SDinh Nguyen 		writel(0x10, SOCFPGA_SDR_ADDRESS + addr);
13313da42859SDinh Nguyen 
13326afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add1;
13333da42859SDinh Nguyen 		writel(RW_MGR_READ_B2B_WAIT1, SOCFPGA_SDR_ADDRESS + addr);
13343da42859SDinh Nguyen 
13356afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr2;
13363da42859SDinh Nguyen 		writel(0x10, SOCFPGA_SDR_ADDRESS + addr);
13376afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add2;
13383da42859SDinh Nguyen 		writel(RW_MGR_READ_B2B_WAIT2, SOCFPGA_SDR_ADDRESS + addr);
13393da42859SDinh Nguyen 
13406afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr0;
13413da42859SDinh Nguyen 		if (quick_read_mode)
13423da42859SDinh Nguyen 			writel(0x1, SOCFPGA_SDR_ADDRESS + addr);
13433da42859SDinh Nguyen 			/* need at least two (1+1) reads to capture failures */
13443da42859SDinh Nguyen 		else if (all_groups)
13453da42859SDinh Nguyen 			writel(0x06, SOCFPGA_SDR_ADDRESS + addr);
13463da42859SDinh Nguyen 		else
13473da42859SDinh Nguyen 			writel(0x32, SOCFPGA_SDR_ADDRESS + addr);
13483da42859SDinh Nguyen 
13496afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add0;
13503da42859SDinh Nguyen 		writel(RW_MGR_READ_B2B, SOCFPGA_SDR_ADDRESS + addr);
13516afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr3;
13523da42859SDinh Nguyen 		if (all_groups)
13533da42859SDinh Nguyen 			writel(RW_MGR_MEM_IF_READ_DQS_WIDTH *
13543da42859SDinh Nguyen 			       RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS - 1,
13553da42859SDinh Nguyen 			       SOCFPGA_SDR_ADDRESS + addr);
13563da42859SDinh Nguyen 		else
13573da42859SDinh Nguyen 			writel(0x0, SOCFPGA_SDR_ADDRESS + addr);
13583da42859SDinh Nguyen 
13596afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add3;
13603da42859SDinh Nguyen 		writel(RW_MGR_READ_B2B, SOCFPGA_SDR_ADDRESS + addr);
13613da42859SDinh Nguyen 
13623da42859SDinh Nguyen 		tmp_bit_chk = 0;
13633da42859SDinh Nguyen 		for (vg = RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS-1; ; vg--) {
13643da42859SDinh Nguyen 			/* reset the fifos to get pointers to known state */
13651bc6f14aSMarek Vasut 			addr = (u32)&phy_mgr_cmd->fifo_reset;
13663da42859SDinh Nguyen 			writel(0, SOCFPGA_SDR_ADDRESS + addr);
1367*c4815f76SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RESET_READ_DATAPATH_OFFSET;
13683da42859SDinh Nguyen 			writel(0, SOCFPGA_SDR_ADDRESS + addr);
13693da42859SDinh Nguyen 
13703da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk << (RW_MGR_MEM_DQ_PER_READ_DQS
13713da42859SDinh Nguyen 				/ RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS);
13723da42859SDinh Nguyen 
1373*c4815f76SMarek Vasut 			if (all_groups)
1374*c4815f76SMarek Vasut 				addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_ALL_GROUPS_OFFSET;
1375*c4815f76SMarek Vasut 			else
1376*c4815f76SMarek Vasut 				addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
1377*c4815f76SMarek Vasut 
13783da42859SDinh Nguyen 			writel(RW_MGR_READ_B2B, SOCFPGA_SDR_ADDRESS + addr +
13793da42859SDinh Nguyen 			       ((group * RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS +
13803da42859SDinh Nguyen 			       vg) << 2));
13813da42859SDinh Nguyen 
1382a4bfa463SMarek Vasut 			addr = SDR_PHYGRP_RWMGRGRP_ADDRESS;
13833da42859SDinh Nguyen 			base_rw_mgr = readl(SOCFPGA_SDR_ADDRESS + addr);
13843da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk | (correct_mask_vg & ~(base_rw_mgr));
13853da42859SDinh Nguyen 
13863da42859SDinh Nguyen 			if (vg == 0)
13873da42859SDinh Nguyen 				break;
13883da42859SDinh Nguyen 		}
13893da42859SDinh Nguyen 		*bit_chk &= tmp_bit_chk;
13903da42859SDinh Nguyen 	}
13913da42859SDinh Nguyen 
1392*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
13933da42859SDinh Nguyen 	writel(RW_MGR_CLEAR_DQS_ENABLE, SOCFPGA_SDR_ADDRESS + addr + (group << 2));
13943da42859SDinh Nguyen 
13953da42859SDinh Nguyen 	if (all_correct) {
13963da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
13973da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d read_test(%u,ALL,%u) =>\
13983da42859SDinh Nguyen 			   (%u == %u) => %lu", __func__, __LINE__, group,
13993da42859SDinh Nguyen 			   all_groups, *bit_chk, param->read_correct_mask,
14003da42859SDinh Nguyen 			   (long unsigned int)(*bit_chk ==
14013da42859SDinh Nguyen 			   param->read_correct_mask));
14023da42859SDinh Nguyen 		return *bit_chk == param->read_correct_mask;
14033da42859SDinh Nguyen 	} else	{
14043da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
14053da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d read_test(%u,ONE,%u) =>\
14063da42859SDinh Nguyen 			   (%u != %lu) => %lu\n", __func__, __LINE__,
14073da42859SDinh Nguyen 			   group, all_groups, *bit_chk, (long unsigned int)0,
14083da42859SDinh Nguyen 			   (long unsigned int)(*bit_chk != 0x00));
14093da42859SDinh Nguyen 		return *bit_chk != 0x00;
14103da42859SDinh Nguyen 	}
14113da42859SDinh Nguyen }
14123da42859SDinh Nguyen 
14133da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_read_test_all_ranks(uint32_t group,
14143da42859SDinh Nguyen 	uint32_t num_tries, uint32_t all_correct, uint32_t *bit_chk,
14153da42859SDinh Nguyen 	uint32_t all_groups)
14163da42859SDinh Nguyen {
14173da42859SDinh Nguyen 	return rw_mgr_mem_calibrate_read_test(0, group, num_tries, all_correct,
14183da42859SDinh Nguyen 					      bit_chk, all_groups, 1);
14193da42859SDinh Nguyen }
14203da42859SDinh Nguyen 
14213da42859SDinh Nguyen static void rw_mgr_incr_vfifo(uint32_t grp, uint32_t *v)
14223da42859SDinh Nguyen {
14231bc6f14aSMarek Vasut 	uint32_t addr = (u32)&phy_mgr_cmd->inc_vfifo_hard_phy;
14243da42859SDinh Nguyen 
14253da42859SDinh Nguyen 	writel(grp, SOCFPGA_SDR_ADDRESS + addr);
14263da42859SDinh Nguyen 	(*v)++;
14273da42859SDinh Nguyen }
14283da42859SDinh Nguyen 
14293da42859SDinh Nguyen static void rw_mgr_decr_vfifo(uint32_t grp, uint32_t *v)
14303da42859SDinh Nguyen {
14313da42859SDinh Nguyen 	uint32_t i;
14323da42859SDinh Nguyen 
14333da42859SDinh Nguyen 	for (i = 0; i < VFIFO_SIZE-1; i++)
14343da42859SDinh Nguyen 		rw_mgr_incr_vfifo(grp, v);
14353da42859SDinh Nguyen }
14363da42859SDinh Nguyen 
14373da42859SDinh Nguyen static int find_vfifo_read(uint32_t grp, uint32_t *bit_chk)
14383da42859SDinh Nguyen {
14393da42859SDinh Nguyen 	uint32_t  v;
14403da42859SDinh Nguyen 	uint32_t fail_cnt = 0;
14413da42859SDinh Nguyen 	uint32_t test_status;
14423da42859SDinh Nguyen 
14433da42859SDinh Nguyen 	for (v = 0; v < VFIFO_SIZE; ) {
14443da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: vfifo %u\n",
14453da42859SDinh Nguyen 			   __func__, __LINE__, v);
14463da42859SDinh Nguyen 		test_status = rw_mgr_mem_calibrate_read_test_all_ranks
14473da42859SDinh Nguyen 			(grp, 1, PASS_ONE_BIT, bit_chk, 0);
14483da42859SDinh Nguyen 		if (!test_status) {
14493da42859SDinh Nguyen 			fail_cnt++;
14503da42859SDinh Nguyen 
14513da42859SDinh Nguyen 			if (fail_cnt == 2)
14523da42859SDinh Nguyen 				break;
14533da42859SDinh Nguyen 		}
14543da42859SDinh Nguyen 
14553da42859SDinh Nguyen 		/* fiddle with FIFO */
14563da42859SDinh Nguyen 		rw_mgr_incr_vfifo(grp, &v);
14573da42859SDinh Nguyen 	}
14583da42859SDinh Nguyen 
14593da42859SDinh Nguyen 	if (v >= VFIFO_SIZE) {
14603da42859SDinh Nguyen 		/* no failing read found!! Something must have gone wrong */
14613da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: vfifo failed\n",
14623da42859SDinh Nguyen 			   __func__, __LINE__);
14633da42859SDinh Nguyen 		return 0;
14643da42859SDinh Nguyen 	} else {
14653da42859SDinh Nguyen 		return v;
14663da42859SDinh Nguyen 	}
14673da42859SDinh Nguyen }
14683da42859SDinh Nguyen 
14693da42859SDinh Nguyen static int find_working_phase(uint32_t *grp, uint32_t *bit_chk,
14703da42859SDinh Nguyen 			      uint32_t dtaps_per_ptap, uint32_t *work_bgn,
14713da42859SDinh Nguyen 			      uint32_t *v, uint32_t *d, uint32_t *p,
14723da42859SDinh Nguyen 			      uint32_t *i, uint32_t *max_working_cnt)
14733da42859SDinh Nguyen {
14743da42859SDinh Nguyen 	uint32_t found_begin = 0;
14753da42859SDinh Nguyen 	uint32_t tmp_delay = 0;
14763da42859SDinh Nguyen 	uint32_t test_status;
14773da42859SDinh Nguyen 
14783da42859SDinh Nguyen 	for (*d = 0; *d <= dtaps_per_ptap; (*d)++, tmp_delay +=
14793da42859SDinh Nguyen 		IO_DELAY_PER_DQS_EN_DCHAIN_TAP) {
14803da42859SDinh Nguyen 		*work_bgn = tmp_delay;
14813da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay_all_ranks(*grp, *d);
14823da42859SDinh Nguyen 
14833da42859SDinh Nguyen 		for (*i = 0; *i < VFIFO_SIZE; (*i)++) {
14843da42859SDinh Nguyen 			for (*p = 0; *p <= IO_DQS_EN_PHASE_MAX; (*p)++, *work_bgn +=
14853da42859SDinh Nguyen 				IO_DELAY_PER_OPA_TAP) {
14863da42859SDinh Nguyen 				scc_mgr_set_dqs_en_phase_all_ranks(*grp, *p);
14873da42859SDinh Nguyen 
14883da42859SDinh Nguyen 				test_status =
14893da42859SDinh Nguyen 				rw_mgr_mem_calibrate_read_test_all_ranks
14903da42859SDinh Nguyen 				(*grp, 1, PASS_ONE_BIT, bit_chk, 0);
14913da42859SDinh Nguyen 
14923da42859SDinh Nguyen 				if (test_status) {
14933da42859SDinh Nguyen 					*max_working_cnt = 1;
14943da42859SDinh Nguyen 					found_begin = 1;
14953da42859SDinh Nguyen 					break;
14963da42859SDinh Nguyen 				}
14973da42859SDinh Nguyen 			}
14983da42859SDinh Nguyen 
14993da42859SDinh Nguyen 			if (found_begin)
15003da42859SDinh Nguyen 				break;
15013da42859SDinh Nguyen 
15023da42859SDinh Nguyen 			if (*p > IO_DQS_EN_PHASE_MAX)
15033da42859SDinh Nguyen 				/* fiddle with FIFO */
15043da42859SDinh Nguyen 				rw_mgr_incr_vfifo(*grp, v);
15053da42859SDinh Nguyen 		}
15063da42859SDinh Nguyen 
15073da42859SDinh Nguyen 		if (found_begin)
15083da42859SDinh Nguyen 			break;
15093da42859SDinh Nguyen 	}
15103da42859SDinh Nguyen 
15113da42859SDinh Nguyen 	if (*i >= VFIFO_SIZE) {
15123da42859SDinh Nguyen 		/* cannot find working solution */
15133da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: no vfifo/\
15143da42859SDinh Nguyen 			   ptap/dtap\n", __func__, __LINE__);
15153da42859SDinh Nguyen 		return 0;
15163da42859SDinh Nguyen 	} else {
15173da42859SDinh Nguyen 		return 1;
15183da42859SDinh Nguyen 	}
15193da42859SDinh Nguyen }
15203da42859SDinh Nguyen 
15213da42859SDinh Nguyen static void sdr_backup_phase(uint32_t *grp, uint32_t *bit_chk,
15223da42859SDinh Nguyen 			     uint32_t *work_bgn, uint32_t *v, uint32_t *d,
15233da42859SDinh Nguyen 			     uint32_t *p, uint32_t *max_working_cnt)
15243da42859SDinh Nguyen {
15253da42859SDinh Nguyen 	uint32_t found_begin = 0;
15263da42859SDinh Nguyen 	uint32_t tmp_delay;
15273da42859SDinh Nguyen 
15283da42859SDinh Nguyen 	/* Special case code for backing up a phase */
15293da42859SDinh Nguyen 	if (*p == 0) {
15303da42859SDinh Nguyen 		*p = IO_DQS_EN_PHASE_MAX;
15313da42859SDinh Nguyen 		rw_mgr_decr_vfifo(*grp, v);
15323da42859SDinh Nguyen 	} else {
15333da42859SDinh Nguyen 		(*p)--;
15343da42859SDinh Nguyen 	}
15353da42859SDinh Nguyen 	tmp_delay = *work_bgn - IO_DELAY_PER_OPA_TAP;
15363da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(*grp, *p);
15373da42859SDinh Nguyen 
15383da42859SDinh Nguyen 	for (*d = 0; *d <= IO_DQS_EN_DELAY_MAX && tmp_delay < *work_bgn;
15393da42859SDinh Nguyen 		(*d)++, tmp_delay += IO_DELAY_PER_DQS_EN_DCHAIN_TAP) {
15403da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay_all_ranks(*grp, *d);
15413da42859SDinh Nguyen 
15423da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_read_test_all_ranks(*grp, 1,
15433da42859SDinh Nguyen 							     PASS_ONE_BIT,
15443da42859SDinh Nguyen 							     bit_chk, 0)) {
15453da42859SDinh Nguyen 			found_begin = 1;
15463da42859SDinh Nguyen 			*work_bgn = tmp_delay;
15473da42859SDinh Nguyen 			break;
15483da42859SDinh Nguyen 		}
15493da42859SDinh Nguyen 	}
15503da42859SDinh Nguyen 
15513da42859SDinh Nguyen 	/* We have found a working dtap before the ptap found above */
15523da42859SDinh Nguyen 	if (found_begin == 1)
15533da42859SDinh Nguyen 		(*max_working_cnt)++;
15543da42859SDinh Nguyen 
15553da42859SDinh Nguyen 	/*
15563da42859SDinh Nguyen 	 * Restore VFIFO to old state before we decremented it
15573da42859SDinh Nguyen 	 * (if needed).
15583da42859SDinh Nguyen 	 */
15593da42859SDinh Nguyen 	(*p)++;
15603da42859SDinh Nguyen 	if (*p > IO_DQS_EN_PHASE_MAX) {
15613da42859SDinh Nguyen 		*p = 0;
15623da42859SDinh Nguyen 		rw_mgr_incr_vfifo(*grp, v);
15633da42859SDinh Nguyen 	}
15643da42859SDinh Nguyen 
15653da42859SDinh Nguyen 	scc_mgr_set_dqs_en_delay_all_ranks(*grp, 0);
15663da42859SDinh Nguyen }
15673da42859SDinh Nguyen 
15683da42859SDinh Nguyen static int sdr_nonworking_phase(uint32_t *grp, uint32_t *bit_chk,
15693da42859SDinh Nguyen 			     uint32_t *work_bgn, uint32_t *v, uint32_t *d,
15703da42859SDinh Nguyen 			     uint32_t *p, uint32_t *i, uint32_t *max_working_cnt,
15713da42859SDinh Nguyen 			     uint32_t *work_end)
15723da42859SDinh Nguyen {
15733da42859SDinh Nguyen 	uint32_t found_end = 0;
15743da42859SDinh Nguyen 
15753da42859SDinh Nguyen 	(*p)++;
15763da42859SDinh Nguyen 	*work_end += IO_DELAY_PER_OPA_TAP;
15773da42859SDinh Nguyen 	if (*p > IO_DQS_EN_PHASE_MAX) {
15783da42859SDinh Nguyen 		/* fiddle with FIFO */
15793da42859SDinh Nguyen 		*p = 0;
15803da42859SDinh Nguyen 		rw_mgr_incr_vfifo(*grp, v);
15813da42859SDinh Nguyen 	}
15823da42859SDinh Nguyen 
15833da42859SDinh Nguyen 	for (; *i < VFIFO_SIZE + 1; (*i)++) {
15843da42859SDinh Nguyen 		for (; *p <= IO_DQS_EN_PHASE_MAX; (*p)++, *work_end
15853da42859SDinh Nguyen 			+= IO_DELAY_PER_OPA_TAP) {
15863da42859SDinh Nguyen 			scc_mgr_set_dqs_en_phase_all_ranks(*grp, *p);
15873da42859SDinh Nguyen 
15883da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_read_test_all_ranks
15893da42859SDinh Nguyen 				(*grp, 1, PASS_ONE_BIT, bit_chk, 0)) {
15903da42859SDinh Nguyen 				found_end = 1;
15913da42859SDinh Nguyen 				break;
15923da42859SDinh Nguyen 			} else {
15933da42859SDinh Nguyen 				(*max_working_cnt)++;
15943da42859SDinh Nguyen 			}
15953da42859SDinh Nguyen 		}
15963da42859SDinh Nguyen 
15973da42859SDinh Nguyen 		if (found_end)
15983da42859SDinh Nguyen 			break;
15993da42859SDinh Nguyen 
16003da42859SDinh Nguyen 		if (*p > IO_DQS_EN_PHASE_MAX) {
16013da42859SDinh Nguyen 			/* fiddle with FIFO */
16023da42859SDinh Nguyen 			rw_mgr_incr_vfifo(*grp, v);
16033da42859SDinh Nguyen 			*p = 0;
16043da42859SDinh Nguyen 		}
16053da42859SDinh Nguyen 	}
16063da42859SDinh Nguyen 
16073da42859SDinh Nguyen 	if (*i >= VFIFO_SIZE + 1) {
16083da42859SDinh Nguyen 		/* cannot see edge of failing read */
16093da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d sdr_nonworking_phase: end:\
16103da42859SDinh Nguyen 			   failed\n", __func__, __LINE__);
16113da42859SDinh Nguyen 		return 0;
16123da42859SDinh Nguyen 	} else {
16133da42859SDinh Nguyen 		return 1;
16143da42859SDinh Nguyen 	}
16153da42859SDinh Nguyen }
16163da42859SDinh Nguyen 
16173da42859SDinh Nguyen static int sdr_find_window_centre(uint32_t *grp, uint32_t *bit_chk,
16183da42859SDinh Nguyen 				  uint32_t *work_bgn, uint32_t *v, uint32_t *d,
16193da42859SDinh Nguyen 				  uint32_t *p, uint32_t *work_mid,
16203da42859SDinh Nguyen 				  uint32_t *work_end)
16213da42859SDinh Nguyen {
16223da42859SDinh Nguyen 	int i;
16233da42859SDinh Nguyen 	int tmp_delay = 0;
16243da42859SDinh Nguyen 
16253da42859SDinh Nguyen 	*work_mid = (*work_bgn + *work_end) / 2;
16263da42859SDinh Nguyen 
16273da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "work_bgn=%d work_end=%d work_mid=%d\n",
16283da42859SDinh Nguyen 		   *work_bgn, *work_end, *work_mid);
16293da42859SDinh Nguyen 	/* Get the middle delay to be less than a VFIFO delay */
16303da42859SDinh Nguyen 	for (*p = 0; *p <= IO_DQS_EN_PHASE_MAX;
16313da42859SDinh Nguyen 		(*p)++, tmp_delay += IO_DELAY_PER_OPA_TAP)
16323da42859SDinh Nguyen 		;
16333da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "vfifo ptap delay %d\n", tmp_delay);
16343da42859SDinh Nguyen 	while (*work_mid > tmp_delay)
16353da42859SDinh Nguyen 		*work_mid -= tmp_delay;
16363da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "new work_mid %d\n", *work_mid);
16373da42859SDinh Nguyen 
16383da42859SDinh Nguyen 	tmp_delay = 0;
16393da42859SDinh Nguyen 	for (*p = 0; *p <= IO_DQS_EN_PHASE_MAX && tmp_delay < *work_mid;
16403da42859SDinh Nguyen 		(*p)++, tmp_delay += IO_DELAY_PER_OPA_TAP)
16413da42859SDinh Nguyen 		;
16423da42859SDinh Nguyen 	tmp_delay -= IO_DELAY_PER_OPA_TAP;
16433da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "new p %d, tmp_delay=%d\n", (*p) - 1, tmp_delay);
16443da42859SDinh Nguyen 	for (*d = 0; *d <= IO_DQS_EN_DELAY_MAX && tmp_delay < *work_mid; (*d)++,
16453da42859SDinh Nguyen 		tmp_delay += IO_DELAY_PER_DQS_EN_DCHAIN_TAP)
16463da42859SDinh Nguyen 		;
16473da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "new d %d, tmp_delay=%d\n", *d, tmp_delay);
16483da42859SDinh Nguyen 
16493da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(*grp, (*p) - 1);
16503da42859SDinh Nguyen 	scc_mgr_set_dqs_en_delay_all_ranks(*grp, *d);
16513da42859SDinh Nguyen 
16523da42859SDinh Nguyen 	/*
16533da42859SDinh Nguyen 	 * push vfifo until we can successfully calibrate. We can do this
16543da42859SDinh Nguyen 	 * because the largest possible margin in 1 VFIFO cycle.
16553da42859SDinh Nguyen 	 */
16563da42859SDinh Nguyen 	for (i = 0; i < VFIFO_SIZE; i++) {
16573da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "find_dqs_en_phase: center: vfifo=%u\n",
16583da42859SDinh Nguyen 			   *v);
16593da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_read_test_all_ranks(*grp, 1,
16603da42859SDinh Nguyen 							     PASS_ONE_BIT,
16613da42859SDinh Nguyen 							     bit_chk, 0)) {
16623da42859SDinh Nguyen 			break;
16633da42859SDinh Nguyen 		}
16643da42859SDinh Nguyen 
16653da42859SDinh Nguyen 		/* fiddle with FIFO */
16663da42859SDinh Nguyen 		rw_mgr_incr_vfifo(*grp, v);
16673da42859SDinh Nguyen 	}
16683da42859SDinh Nguyen 
16693da42859SDinh Nguyen 	if (i >= VFIFO_SIZE) {
16703da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: center: \
16713da42859SDinh Nguyen 			   failed\n", __func__, __LINE__);
16723da42859SDinh Nguyen 		return 0;
16733da42859SDinh Nguyen 	} else {
16743da42859SDinh Nguyen 		return 1;
16753da42859SDinh Nguyen 	}
16763da42859SDinh Nguyen }
16773da42859SDinh Nguyen 
16783da42859SDinh Nguyen /* find a good dqs enable to use */
16793da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase(uint32_t grp)
16803da42859SDinh Nguyen {
16813da42859SDinh Nguyen 	uint32_t v, d, p, i;
16823da42859SDinh Nguyen 	uint32_t max_working_cnt;
16833da42859SDinh Nguyen 	uint32_t bit_chk;
16843da42859SDinh Nguyen 	uint32_t dtaps_per_ptap;
16853da42859SDinh Nguyen 	uint32_t work_bgn, work_mid, work_end;
16863da42859SDinh Nguyen 	uint32_t found_passing_read, found_failing_read, initial_failing_dtap;
16873da42859SDinh Nguyen 	uint32_t addr;
16883da42859SDinh Nguyen 
16893da42859SDinh Nguyen 	debug("%s:%d %u\n", __func__, __LINE__, grp);
16903da42859SDinh Nguyen 
16913da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_VFIFO_CENTER);
16923da42859SDinh Nguyen 
16933da42859SDinh Nguyen 	scc_mgr_set_dqs_en_delay_all_ranks(grp, 0);
16943da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(grp, 0);
16953da42859SDinh Nguyen 
16963da42859SDinh Nguyen 	/* ************************************************************** */
16973da42859SDinh Nguyen 	/* * Step 0 : Determine number of delay taps for each phase tap * */
16983da42859SDinh Nguyen 	dtaps_per_ptap = IO_DELAY_PER_OPA_TAP/IO_DELAY_PER_DQS_EN_DCHAIN_TAP;
16993da42859SDinh Nguyen 
17003da42859SDinh Nguyen 	/* ********************************************************* */
17013da42859SDinh Nguyen 	/* * Step 1 : First push vfifo until we get a failing read * */
17023da42859SDinh Nguyen 	v = find_vfifo_read(grp, &bit_chk);
17033da42859SDinh Nguyen 
17043da42859SDinh Nguyen 	max_working_cnt = 0;
17053da42859SDinh Nguyen 
17063da42859SDinh Nguyen 	/* ******************************************************** */
17073da42859SDinh Nguyen 	/* * step 2: find first working phase, increment in ptaps * */
17083da42859SDinh Nguyen 	work_bgn = 0;
17093da42859SDinh Nguyen 	if (find_working_phase(&grp, &bit_chk, dtaps_per_ptap, &work_bgn, &v, &d,
17103da42859SDinh Nguyen 				&p, &i, &max_working_cnt) == 0)
17113da42859SDinh Nguyen 		return 0;
17123da42859SDinh Nguyen 
17133da42859SDinh Nguyen 	work_end = work_bgn;
17143da42859SDinh Nguyen 
17153da42859SDinh Nguyen 	/*
17163da42859SDinh Nguyen 	 * If d is 0 then the working window covers a phase tap and
17173da42859SDinh Nguyen 	 * we can follow the old procedure otherwise, we've found the beginning,
17183da42859SDinh Nguyen 	 * and we need to increment the dtaps until we find the end.
17193da42859SDinh Nguyen 	 */
17203da42859SDinh Nguyen 	if (d == 0) {
17213da42859SDinh Nguyen 		/* ********************************************************* */
17223da42859SDinh Nguyen 		/* * step 3a: if we have room, back off by one and
17233da42859SDinh Nguyen 		increment in dtaps * */
17243da42859SDinh Nguyen 
17253da42859SDinh Nguyen 		sdr_backup_phase(&grp, &bit_chk, &work_bgn, &v, &d, &p,
17263da42859SDinh Nguyen 				 &max_working_cnt);
17273da42859SDinh Nguyen 
17283da42859SDinh Nguyen 		/* ********************************************************* */
17293da42859SDinh Nguyen 		/* * step 4a: go forward from working phase to non working
17303da42859SDinh Nguyen 		phase, increment in ptaps * */
17313da42859SDinh Nguyen 		if (sdr_nonworking_phase(&grp, &bit_chk, &work_bgn, &v, &d, &p,
17323da42859SDinh Nguyen 					 &i, &max_working_cnt, &work_end) == 0)
17333da42859SDinh Nguyen 			return 0;
17343da42859SDinh Nguyen 
17353da42859SDinh Nguyen 		/* ********************************************************* */
17363da42859SDinh Nguyen 		/* * step 5a:  back off one from last, increment in dtaps  * */
17373da42859SDinh Nguyen 
17383da42859SDinh Nguyen 		/* Special case code for backing up a phase */
17393da42859SDinh Nguyen 		if (p == 0) {
17403da42859SDinh Nguyen 			p = IO_DQS_EN_PHASE_MAX;
17413da42859SDinh Nguyen 			rw_mgr_decr_vfifo(grp, &v);
17423da42859SDinh Nguyen 		} else {
17433da42859SDinh Nguyen 			p = p - 1;
17443da42859SDinh Nguyen 		}
17453da42859SDinh Nguyen 
17463da42859SDinh Nguyen 		work_end -= IO_DELAY_PER_OPA_TAP;
17473da42859SDinh Nguyen 		scc_mgr_set_dqs_en_phase_all_ranks(grp, p);
17483da42859SDinh Nguyen 
17493da42859SDinh Nguyen 		/* * The actual increment of dtaps is done outside of
17503da42859SDinh Nguyen 		the if/else loop to share code */
17513da42859SDinh Nguyen 		d = 0;
17523da42859SDinh Nguyen 
17533da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: v/p: \
17543da42859SDinh Nguyen 			   vfifo=%u ptap=%u\n", __func__, __LINE__,
17553da42859SDinh Nguyen 			   v, p);
17563da42859SDinh Nguyen 	} else {
17573da42859SDinh Nguyen 		/* ******************************************************* */
17583da42859SDinh Nguyen 		/* * step 3-5b:  Find the right edge of the window using
17593da42859SDinh Nguyen 		delay taps   * */
17603da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase:vfifo=%u \
17613da42859SDinh Nguyen 			   ptap=%u dtap=%u bgn=%u\n", __func__, __LINE__,
17623da42859SDinh Nguyen 			   v, p, d, work_bgn);
17633da42859SDinh Nguyen 
17643da42859SDinh Nguyen 		work_end = work_bgn;
17653da42859SDinh Nguyen 
17663da42859SDinh Nguyen 		/* * The actual increment of dtaps is done outside of the
17673da42859SDinh Nguyen 		if/else loop to share code */
17683da42859SDinh Nguyen 
17693da42859SDinh Nguyen 		/* Only here to counterbalance a subtract later on which is
17703da42859SDinh Nguyen 		not needed if this branch of the algorithm is taken */
17713da42859SDinh Nguyen 		max_working_cnt++;
17723da42859SDinh Nguyen 	}
17733da42859SDinh Nguyen 
17743da42859SDinh Nguyen 	/* The dtap increment to find the failing edge is done here */
17753da42859SDinh Nguyen 	for (; d <= IO_DQS_EN_DELAY_MAX; d++, work_end +=
17763da42859SDinh Nguyen 		IO_DELAY_PER_DQS_EN_DCHAIN_TAP) {
17773da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: \
17783da42859SDinh Nguyen 				   end-2: dtap=%u\n", __func__, __LINE__, d);
17793da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay_all_ranks(grp, d);
17803da42859SDinh Nguyen 
17813da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_read_test_all_ranks(grp, 1,
17823da42859SDinh Nguyen 								      PASS_ONE_BIT,
17833da42859SDinh Nguyen 								      &bit_chk, 0)) {
17843da42859SDinh Nguyen 				break;
17853da42859SDinh Nguyen 			}
17863da42859SDinh Nguyen 	}
17873da42859SDinh Nguyen 
17883da42859SDinh Nguyen 	/* Go back to working dtap */
17893da42859SDinh Nguyen 	if (d != 0)
17903da42859SDinh Nguyen 		work_end -= IO_DELAY_PER_DQS_EN_DCHAIN_TAP;
17913da42859SDinh Nguyen 
17923da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: v/p/d: vfifo=%u \
17933da42859SDinh Nguyen 		   ptap=%u dtap=%u end=%u\n", __func__, __LINE__,
17943da42859SDinh Nguyen 		   v, p, d-1, work_end);
17953da42859SDinh Nguyen 
17963da42859SDinh Nguyen 	if (work_end < work_bgn) {
17973da42859SDinh Nguyen 		/* nil range */
17983da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: end-2: \
17993da42859SDinh Nguyen 			   failed\n", __func__, __LINE__);
18003da42859SDinh Nguyen 		return 0;
18013da42859SDinh Nguyen 	}
18023da42859SDinh Nguyen 
18033da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: found range [%u,%u]\n",
18043da42859SDinh Nguyen 		   __func__, __LINE__, work_bgn, work_end);
18053da42859SDinh Nguyen 
18063da42859SDinh Nguyen 	/* *************************************************************** */
18073da42859SDinh Nguyen 	/*
18083da42859SDinh Nguyen 	 * * We need to calculate the number of dtaps that equal a ptap
18093da42859SDinh Nguyen 	 * * To do that we'll back up a ptap and re-find the edge of the
18103da42859SDinh Nguyen 	 * * window using dtaps
18113da42859SDinh Nguyen 	 */
18123da42859SDinh Nguyen 
18133da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: calculate dtaps_per_ptap \
18143da42859SDinh Nguyen 		   for tracking\n", __func__, __LINE__);
18153da42859SDinh Nguyen 
18163da42859SDinh Nguyen 	/* Special case code for backing up a phase */
18173da42859SDinh Nguyen 	if (p == 0) {
18183da42859SDinh Nguyen 		p = IO_DQS_EN_PHASE_MAX;
18193da42859SDinh Nguyen 		rw_mgr_decr_vfifo(grp, &v);
18203da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: backedup \
18213da42859SDinh Nguyen 			   cycle/phase: v=%u p=%u\n", __func__, __LINE__,
18223da42859SDinh Nguyen 			   v, p);
18233da42859SDinh Nguyen 	} else {
18243da42859SDinh Nguyen 		p = p - 1;
18253da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: backedup \
18263da42859SDinh Nguyen 			   phase only: v=%u p=%u", __func__, __LINE__,
18273da42859SDinh Nguyen 			   v, p);
18283da42859SDinh Nguyen 	}
18293da42859SDinh Nguyen 
18303da42859SDinh Nguyen 	scc_mgr_set_dqs_en_phase_all_ranks(grp, p);
18313da42859SDinh Nguyen 
18323da42859SDinh Nguyen 	/*
18333da42859SDinh Nguyen 	 * Increase dtap until we first see a passing read (in case the
18343da42859SDinh Nguyen 	 * window is smaller than a ptap),
18353da42859SDinh Nguyen 	 * and then a failing read to mark the edge of the window again
18363da42859SDinh Nguyen 	 */
18373da42859SDinh Nguyen 
18383da42859SDinh Nguyen 	/* Find a passing read */
18393da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: find passing read\n",
18403da42859SDinh Nguyen 		   __func__, __LINE__);
18413da42859SDinh Nguyen 	found_passing_read = 0;
18423da42859SDinh Nguyen 	found_failing_read = 0;
18433da42859SDinh Nguyen 	initial_failing_dtap = d;
18443da42859SDinh Nguyen 	for (; d <= IO_DQS_EN_DELAY_MAX; d++) {
18453da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: testing \
18463da42859SDinh Nguyen 			   read d=%u\n", __func__, __LINE__, d);
18473da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay_all_ranks(grp, d);
18483da42859SDinh Nguyen 
18493da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_read_test_all_ranks(grp, 1,
18503da42859SDinh Nguyen 							     PASS_ONE_BIT,
18513da42859SDinh Nguyen 							     &bit_chk, 0)) {
18523da42859SDinh Nguyen 			found_passing_read = 1;
18533da42859SDinh Nguyen 			break;
18543da42859SDinh Nguyen 		}
18553da42859SDinh Nguyen 	}
18563da42859SDinh Nguyen 
18573da42859SDinh Nguyen 	if (found_passing_read) {
18583da42859SDinh Nguyen 		/* Find a failing read */
18593da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: find failing \
18603da42859SDinh Nguyen 			   read\n", __func__, __LINE__);
18613da42859SDinh Nguyen 		for (d = d + 1; d <= IO_DQS_EN_DELAY_MAX; d++) {
18623da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: \
18633da42859SDinh Nguyen 				   testing read d=%u\n", __func__, __LINE__, d);
18643da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay_all_ranks(grp, d);
18653da42859SDinh Nguyen 
18663da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_read_test_all_ranks
18673da42859SDinh Nguyen 				(grp, 1, PASS_ONE_BIT, &bit_chk, 0)) {
18683da42859SDinh Nguyen 				found_failing_read = 1;
18693da42859SDinh Nguyen 				break;
18703da42859SDinh Nguyen 			}
18713da42859SDinh Nguyen 		}
18723da42859SDinh Nguyen 	} else {
18733da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "%s:%d find_dqs_en_phase: failed to \
18743da42859SDinh Nguyen 			   calculate dtaps", __func__, __LINE__);
18753da42859SDinh Nguyen 		debug_cond(DLEVEL == 1, "per ptap. Fall back on static value\n");
18763da42859SDinh Nguyen 	}
18773da42859SDinh Nguyen 
18783da42859SDinh Nguyen 	/*
18793da42859SDinh Nguyen 	 * The dynamically calculated dtaps_per_ptap is only valid if we
18803da42859SDinh Nguyen 	 * found a passing/failing read. If we didn't, it means d hit the max
18813da42859SDinh Nguyen 	 * (IO_DQS_EN_DELAY_MAX). Otherwise, dtaps_per_ptap retains its
18823da42859SDinh Nguyen 	 * statically calculated value.
18833da42859SDinh Nguyen 	 */
18843da42859SDinh Nguyen 	if (found_passing_read && found_failing_read)
18853da42859SDinh Nguyen 		dtaps_per_ptap = d - initial_failing_dtap;
18863da42859SDinh Nguyen 
1887a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->dtaps_per_ptap;
18883da42859SDinh Nguyen 	writel(dtaps_per_ptap, SOCFPGA_SDR_ADDRESS + addr);
18893da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: dtaps_per_ptap=%u \
18903da42859SDinh Nguyen 		   - %u = %u",  __func__, __LINE__, d,
18913da42859SDinh Nguyen 		   initial_failing_dtap, dtaps_per_ptap);
18923da42859SDinh Nguyen 
18933da42859SDinh Nguyen 	/* ******************************************** */
18943da42859SDinh Nguyen 	/* * step 6:  Find the centre of the window   * */
18953da42859SDinh Nguyen 	if (sdr_find_window_centre(&grp, &bit_chk, &work_bgn, &v, &d, &p,
18963da42859SDinh Nguyen 				   &work_mid, &work_end) == 0)
18973da42859SDinh Nguyen 		return 0;
18983da42859SDinh Nguyen 
18993da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d find_dqs_en_phase: center found: \
19003da42859SDinh Nguyen 		   vfifo=%u ptap=%u dtap=%u\n", __func__, __LINE__,
19013da42859SDinh Nguyen 		   v, p-1, d);
19023da42859SDinh Nguyen 	return 1;
19033da42859SDinh Nguyen }
19043da42859SDinh Nguyen 
19053da42859SDinh Nguyen /*
19063da42859SDinh Nguyen  * Try rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase across different
19073da42859SDinh Nguyen  * dq_in_delay values
19083da42859SDinh Nguyen  */
19093da42859SDinh Nguyen static uint32_t
19103da42859SDinh Nguyen rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase_sweep_dq_in_delay
19113da42859SDinh Nguyen (uint32_t write_group, uint32_t read_group, uint32_t test_bgn)
19123da42859SDinh Nguyen {
19133da42859SDinh Nguyen 	uint32_t found;
19143da42859SDinh Nguyen 	uint32_t i;
19153da42859SDinh Nguyen 	uint32_t p;
19163da42859SDinh Nguyen 	uint32_t d;
19173da42859SDinh Nguyen 	uint32_t r;
19183da42859SDinh Nguyen 	uint32_t addr;
19193da42859SDinh Nguyen 
19203da42859SDinh Nguyen 	const uint32_t delay_step = IO_IO_IN_DELAY_MAX /
19213da42859SDinh Nguyen 		(RW_MGR_MEM_DQ_PER_READ_DQS-1);
19223da42859SDinh Nguyen 		/* we start at zero, so have one less dq to devide among */
19233da42859SDinh Nguyen 
19243da42859SDinh Nguyen 	debug("%s:%d (%u,%u,%u)", __func__, __LINE__, write_group, read_group,
19253da42859SDinh Nguyen 	      test_bgn);
19263da42859SDinh Nguyen 
19273da42859SDinh Nguyen 	/* try different dq_in_delays since the dq path is shorter than dqs */
19283da42859SDinh Nguyen 
19293da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
19303da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
19313da42859SDinh Nguyen 		for (i = 0, p = test_bgn, d = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS;
19323da42859SDinh Nguyen 			i++, p++, d += delay_step) {
19333da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d rw_mgr_mem_calibrate_\
19343da42859SDinh Nguyen 				   vfifo_find_dqs_", __func__, __LINE__);
19353da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "en_phase_sweep_dq_in_delay: g=%u/%u ",
19363da42859SDinh Nguyen 			       write_group, read_group);
19373da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "r=%u, i=%u p=%u d=%u\n", r, i , p, d);
19383da42859SDinh Nguyen 			scc_mgr_set_dq_in_delay(write_group, p, d);
19393da42859SDinh Nguyen 			scc_mgr_load_dq(p);
19403da42859SDinh Nguyen 		}
1941e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->update;
19423da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
19433da42859SDinh Nguyen 	}
19443da42859SDinh Nguyen 
19453da42859SDinh Nguyen 	found = rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase(read_group);
19463da42859SDinh Nguyen 
19473da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d rw_mgr_mem_calibrate_vfifo_find_dqs_\
19483da42859SDinh Nguyen 		   en_phase_sweep_dq", __func__, __LINE__);
19493da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "_in_delay: g=%u/%u found=%u; Reseting delay \
19503da42859SDinh Nguyen 		   chain to zero\n", write_group, read_group, found);
19513da42859SDinh Nguyen 
19523da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
19533da42859SDinh Nguyen 	     r += NUM_RANKS_PER_SHADOW_REG) {
19543da42859SDinh Nguyen 		for (i = 0, p = test_bgn; i < RW_MGR_MEM_DQ_PER_READ_DQS;
19553da42859SDinh Nguyen 			i++, p++) {
19563da42859SDinh Nguyen 			scc_mgr_set_dq_in_delay(write_group, p, 0);
19573da42859SDinh Nguyen 			scc_mgr_load_dq(p);
19583da42859SDinh Nguyen 		}
1959e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->update;
19603da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
19613da42859SDinh Nguyen 	}
19623da42859SDinh Nguyen 
19633da42859SDinh Nguyen 	return found;
19643da42859SDinh Nguyen }
19653da42859SDinh Nguyen 
19663da42859SDinh Nguyen /* per-bit deskew DQ and center */
19673da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo_center(uint32_t rank_bgn,
19683da42859SDinh Nguyen 	uint32_t write_group, uint32_t read_group, uint32_t test_bgn,
19693da42859SDinh Nguyen 	uint32_t use_read_test, uint32_t update_fom)
19703da42859SDinh Nguyen {
19713da42859SDinh Nguyen 	uint32_t i, p, d, min_index;
19723da42859SDinh Nguyen 	/*
19733da42859SDinh Nguyen 	 * Store these as signed since there are comparisons with
19743da42859SDinh Nguyen 	 * signed numbers.
19753da42859SDinh Nguyen 	 */
19763da42859SDinh Nguyen 	uint32_t bit_chk;
19773da42859SDinh Nguyen 	uint32_t sticky_bit_chk;
19783da42859SDinh Nguyen 	int32_t left_edge[RW_MGR_MEM_DQ_PER_READ_DQS];
19793da42859SDinh Nguyen 	int32_t right_edge[RW_MGR_MEM_DQ_PER_READ_DQS];
19803da42859SDinh Nguyen 	int32_t final_dq[RW_MGR_MEM_DQ_PER_READ_DQS];
19813da42859SDinh Nguyen 	int32_t mid;
19823da42859SDinh Nguyen 	int32_t orig_mid_min, mid_min;
19833da42859SDinh Nguyen 	int32_t new_dqs, start_dqs, start_dqs_en, shift_dq, final_dqs,
19843da42859SDinh Nguyen 		final_dqs_en;
19853da42859SDinh Nguyen 	int32_t dq_margin, dqs_margin;
19863da42859SDinh Nguyen 	uint32_t stop;
19873da42859SDinh Nguyen 	uint32_t temp_dq_in_delay1, temp_dq_in_delay2;
19883da42859SDinh Nguyen 	uint32_t addr;
19893da42859SDinh Nguyen 
19903da42859SDinh Nguyen 	debug("%s:%d: %u %u", __func__, __LINE__, read_group, test_bgn);
19913da42859SDinh Nguyen 
1992*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_DQS_IN_DELAY_OFFSET;
19933da42859SDinh Nguyen 	start_dqs = readl(SOCFPGA_SDR_ADDRESS + addr + (read_group << 2));
19943da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS)
19953da42859SDinh Nguyen 		start_dqs_en = readl(SOCFPGA_SDR_ADDRESS + addr + ((read_group << 2)
19963da42859SDinh Nguyen 				     - IO_DQS_EN_DELAY_OFFSET));
19973da42859SDinh Nguyen 
19983da42859SDinh Nguyen 	/* set the left and right edge of each bit to an illegal value */
19993da42859SDinh Nguyen 	/* use (IO_IO_IN_DELAY_MAX + 1) as an illegal value */
20003da42859SDinh Nguyen 	sticky_bit_chk = 0;
20013da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
20023da42859SDinh Nguyen 		left_edge[i]  = IO_IO_IN_DELAY_MAX + 1;
20033da42859SDinh Nguyen 		right_edge[i] = IO_IO_IN_DELAY_MAX + 1;
20043da42859SDinh Nguyen 	}
20053da42859SDinh Nguyen 
2006e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
20073da42859SDinh Nguyen 	/* Search for the left edge of the window for each bit */
20083da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_IN_DELAY_MAX; d++) {
20093da42859SDinh Nguyen 		scc_mgr_apply_group_dq_in_delay(write_group, test_bgn, d);
20103da42859SDinh Nguyen 
20113da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
20123da42859SDinh Nguyen 
20133da42859SDinh Nguyen 		/*
20143da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
20153da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
20163da42859SDinh Nguyen 		 */
20173da42859SDinh Nguyen 		if (use_read_test) {
20183da42859SDinh Nguyen 			stop = !rw_mgr_mem_calibrate_read_test(rank_bgn,
20193da42859SDinh Nguyen 				read_group, NUM_READ_PB_TESTS, PASS_ONE_BIT,
20203da42859SDinh Nguyen 				&bit_chk, 0, 0);
20213da42859SDinh Nguyen 		} else {
20223da42859SDinh Nguyen 			rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
20233da42859SDinh Nguyen 							0, PASS_ONE_BIT,
20243da42859SDinh Nguyen 							&bit_chk, 0);
20253da42859SDinh Nguyen 			bit_chk = bit_chk >> (RW_MGR_MEM_DQ_PER_READ_DQS *
20263da42859SDinh Nguyen 				(read_group - (write_group *
20273da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
20283da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH)));
20293da42859SDinh Nguyen 			stop = (bit_chk == 0);
20303da42859SDinh Nguyen 		}
20313da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
20323da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->read_correct_mask);
20333da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center(left): dtap=%u => %u == %u \
20343da42859SDinh Nguyen 			   && %u", __func__, __LINE__, d,
20353da42859SDinh Nguyen 			   sticky_bit_chk,
20363da42859SDinh Nguyen 			param->read_correct_mask, stop);
20373da42859SDinh Nguyen 
20383da42859SDinh Nguyen 		if (stop == 1) {
20393da42859SDinh Nguyen 			break;
20403da42859SDinh Nguyen 		} else {
20413da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
20423da42859SDinh Nguyen 				if (bit_chk & 1) {
20433da42859SDinh Nguyen 					/* Remember a passing test as the
20443da42859SDinh Nguyen 					left_edge */
20453da42859SDinh Nguyen 					left_edge[i] = d;
20463da42859SDinh Nguyen 				} else {
20473da42859SDinh Nguyen 					/* If a left edge has not been seen yet,
20483da42859SDinh Nguyen 					then a future passing test will mark
20493da42859SDinh Nguyen 					this edge as the right edge */
20503da42859SDinh Nguyen 					if (left_edge[i] ==
20513da42859SDinh Nguyen 						IO_IO_IN_DELAY_MAX + 1) {
20523da42859SDinh Nguyen 						right_edge[i] = -(d + 1);
20533da42859SDinh Nguyen 					}
20543da42859SDinh Nguyen 				}
20553da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
20563da42859SDinh Nguyen 			}
20573da42859SDinh Nguyen 		}
20583da42859SDinh Nguyen 	}
20593da42859SDinh Nguyen 
20603da42859SDinh Nguyen 	/* Reset DQ delay chains to 0 */
20613da42859SDinh Nguyen 	scc_mgr_apply_group_dq_in_delay(write_group, test_bgn, 0);
20623da42859SDinh Nguyen 	sticky_bit_chk = 0;
20633da42859SDinh Nguyen 	for (i = RW_MGR_MEM_DQ_PER_READ_DQS - 1;; i--) {
20643da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center: left_edge[%u]: \
20653da42859SDinh Nguyen 			   %d right_edge[%u]: %d\n", __func__, __LINE__,
20663da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
20673da42859SDinh Nguyen 
20683da42859SDinh Nguyen 		/*
20693da42859SDinh Nguyen 		 * Check for cases where we haven't found the left edge,
20703da42859SDinh Nguyen 		 * which makes our assignment of the the right edge invalid.
20713da42859SDinh Nguyen 		 * Reset it to the illegal value.
20723da42859SDinh Nguyen 		 */
20733da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_IN_DELAY_MAX + 1) && (
20743da42859SDinh Nguyen 			right_edge[i] != IO_IO_IN_DELAY_MAX + 1)) {
20753da42859SDinh Nguyen 			right_edge[i] = IO_IO_IN_DELAY_MAX + 1;
20763da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d vfifo_center: reset \
20773da42859SDinh Nguyen 				   right_edge[%u]: %d\n", __func__, __LINE__,
20783da42859SDinh Nguyen 				   i, right_edge[i]);
20793da42859SDinh Nguyen 		}
20803da42859SDinh Nguyen 
20813da42859SDinh Nguyen 		/*
20823da42859SDinh Nguyen 		 * Reset sticky bit (except for bits where we have seen
20833da42859SDinh Nguyen 		 * both the left and right edge).
20843da42859SDinh Nguyen 		 */
20853da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk << 1;
20863da42859SDinh Nguyen 		if ((left_edge[i] != IO_IO_IN_DELAY_MAX + 1) &&
20873da42859SDinh Nguyen 		    (right_edge[i] != IO_IO_IN_DELAY_MAX + 1)) {
20883da42859SDinh Nguyen 			sticky_bit_chk = sticky_bit_chk | 1;
20893da42859SDinh Nguyen 		}
20903da42859SDinh Nguyen 
20913da42859SDinh Nguyen 		if (i == 0)
20923da42859SDinh Nguyen 			break;
20933da42859SDinh Nguyen 	}
20943da42859SDinh Nguyen 
2095e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
20963da42859SDinh Nguyen 	/* Search for the right edge of the window for each bit */
20973da42859SDinh Nguyen 	for (d = 0; d <= IO_DQS_IN_DELAY_MAX - start_dqs; d++) {
20983da42859SDinh Nguyen 		scc_mgr_set_dqs_bus_in_delay(read_group, d + start_dqs);
20993da42859SDinh Nguyen 		if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
21003da42859SDinh Nguyen 			uint32_t delay = d + start_dqs_en;
21013da42859SDinh Nguyen 			if (delay > IO_DQS_EN_DELAY_MAX)
21023da42859SDinh Nguyen 				delay = IO_DQS_EN_DELAY_MAX;
21033da42859SDinh Nguyen 			scc_mgr_set_dqs_en_delay(read_group, delay);
21043da42859SDinh Nguyen 		}
21053da42859SDinh Nguyen 		scc_mgr_load_dqs(read_group);
21063da42859SDinh Nguyen 
21073da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
21083da42859SDinh Nguyen 
21093da42859SDinh Nguyen 		/*
21103da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
21113da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
21123da42859SDinh Nguyen 		 */
21133da42859SDinh Nguyen 		if (use_read_test) {
21143da42859SDinh Nguyen 			stop = !rw_mgr_mem_calibrate_read_test(rank_bgn,
21153da42859SDinh Nguyen 				read_group, NUM_READ_PB_TESTS, PASS_ONE_BIT,
21163da42859SDinh Nguyen 				&bit_chk, 0, 0);
21173da42859SDinh Nguyen 		} else {
21183da42859SDinh Nguyen 			rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
21193da42859SDinh Nguyen 							0, PASS_ONE_BIT,
21203da42859SDinh Nguyen 							&bit_chk, 0);
21213da42859SDinh Nguyen 			bit_chk = bit_chk >> (RW_MGR_MEM_DQ_PER_READ_DQS *
21223da42859SDinh Nguyen 				(read_group - (write_group *
21233da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
21243da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH)));
21253da42859SDinh Nguyen 			stop = (bit_chk == 0);
21263da42859SDinh Nguyen 		}
21273da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
21283da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->read_correct_mask);
21293da42859SDinh Nguyen 
21303da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center(right): dtap=%u => %u == \
21313da42859SDinh Nguyen 			   %u && %u", __func__, __LINE__, d,
21323da42859SDinh Nguyen 			   sticky_bit_chk, param->read_correct_mask, stop);
21333da42859SDinh Nguyen 
21343da42859SDinh Nguyen 		if (stop == 1) {
21353da42859SDinh Nguyen 			break;
21363da42859SDinh Nguyen 		} else {
21373da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
21383da42859SDinh Nguyen 				if (bit_chk & 1) {
21393da42859SDinh Nguyen 					/* Remember a passing test as
21403da42859SDinh Nguyen 					the right_edge */
21413da42859SDinh Nguyen 					right_edge[i] = d;
21423da42859SDinh Nguyen 				} else {
21433da42859SDinh Nguyen 					if (d != 0) {
21443da42859SDinh Nguyen 						/* If a right edge has not been
21453da42859SDinh Nguyen 						seen yet, then a future passing
21463da42859SDinh Nguyen 						test will mark this edge as the
21473da42859SDinh Nguyen 						left edge */
21483da42859SDinh Nguyen 						if (right_edge[i] ==
21493da42859SDinh Nguyen 						IO_IO_IN_DELAY_MAX + 1) {
21503da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
21513da42859SDinh Nguyen 						}
21523da42859SDinh Nguyen 					} else {
21533da42859SDinh Nguyen 						/* d = 0 failed, but it passed
21543da42859SDinh Nguyen 						when testing the left edge,
21553da42859SDinh Nguyen 						so it must be marginal,
21563da42859SDinh Nguyen 						set it to -1 */
21573da42859SDinh Nguyen 						if (right_edge[i] ==
21583da42859SDinh Nguyen 							IO_IO_IN_DELAY_MAX + 1 &&
21593da42859SDinh Nguyen 							left_edge[i] !=
21603da42859SDinh Nguyen 							IO_IO_IN_DELAY_MAX
21613da42859SDinh Nguyen 							+ 1) {
21623da42859SDinh Nguyen 							right_edge[i] = -1;
21633da42859SDinh Nguyen 						}
21643da42859SDinh Nguyen 						/* If a right edge has not been
21653da42859SDinh Nguyen 						seen yet, then a future passing
21663da42859SDinh Nguyen 						test will mark this edge as the
21673da42859SDinh Nguyen 						left edge */
21683da42859SDinh Nguyen 						else if (right_edge[i] ==
21693da42859SDinh Nguyen 							IO_IO_IN_DELAY_MAX +
21703da42859SDinh Nguyen 							1) {
21713da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
21723da42859SDinh Nguyen 						}
21733da42859SDinh Nguyen 					}
21743da42859SDinh Nguyen 				}
21753da42859SDinh Nguyen 
21763da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "%s:%d vfifo_center[r,\
21773da42859SDinh Nguyen 					   d=%u]: ", __func__, __LINE__, d);
21783da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "bit_chk_test=%d left_edge[%u]: %d ",
21793da42859SDinh Nguyen 					   (int)(bit_chk & 1), i, left_edge[i]);
21803da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "right_edge[%u]: %d\n", i,
21813da42859SDinh Nguyen 					   right_edge[i]);
21823da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
21833da42859SDinh Nguyen 			}
21843da42859SDinh Nguyen 		}
21853da42859SDinh Nguyen 	}
21863da42859SDinh Nguyen 
21873da42859SDinh Nguyen 	/* Check that all bits have a window */
2188e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
21893da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
21903da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d vfifo_center: left_edge[%u]: \
21913da42859SDinh Nguyen 			   %d right_edge[%u]: %d", __func__, __LINE__,
21923da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
21933da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_IN_DELAY_MAX + 1) || (right_edge[i]
21943da42859SDinh Nguyen 			== IO_IO_IN_DELAY_MAX + 1)) {
21953da42859SDinh Nguyen 			/*
21963da42859SDinh Nguyen 			 * Restore delay chain settings before letting the loop
21973da42859SDinh Nguyen 			 * in rw_mgr_mem_calibrate_vfifo to retry different
21983da42859SDinh Nguyen 			 * dqs/ck relationships.
21993da42859SDinh Nguyen 			 */
22003da42859SDinh Nguyen 			scc_mgr_set_dqs_bus_in_delay(read_group, start_dqs);
22013da42859SDinh Nguyen 			if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
22023da42859SDinh Nguyen 				scc_mgr_set_dqs_en_delay(read_group,
22033da42859SDinh Nguyen 							 start_dqs_en);
22043da42859SDinh Nguyen 			}
22053da42859SDinh Nguyen 			scc_mgr_load_dqs(read_group);
22063da42859SDinh Nguyen 			writel(0, SOCFPGA_SDR_ADDRESS + addr);
22073da42859SDinh Nguyen 
22083da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d vfifo_center: failed to \
22093da42859SDinh Nguyen 				   find edge [%u]: %d %d", __func__, __LINE__,
22103da42859SDinh Nguyen 				   i, left_edge[i], right_edge[i]);
22113da42859SDinh Nguyen 			if (use_read_test) {
22123da42859SDinh Nguyen 				set_failing_group_stage(read_group *
22133da42859SDinh Nguyen 					RW_MGR_MEM_DQ_PER_READ_DQS + i,
22143da42859SDinh Nguyen 					CAL_STAGE_VFIFO,
22153da42859SDinh Nguyen 					CAL_SUBSTAGE_VFIFO_CENTER);
22163da42859SDinh Nguyen 			} else {
22173da42859SDinh Nguyen 				set_failing_group_stage(read_group *
22183da42859SDinh Nguyen 					RW_MGR_MEM_DQ_PER_READ_DQS + i,
22193da42859SDinh Nguyen 					CAL_STAGE_VFIFO_AFTER_WRITES,
22203da42859SDinh Nguyen 					CAL_SUBSTAGE_VFIFO_CENTER);
22213da42859SDinh Nguyen 			}
22223da42859SDinh Nguyen 			return 0;
22233da42859SDinh Nguyen 		}
22243da42859SDinh Nguyen 	}
22253da42859SDinh Nguyen 
22263da42859SDinh Nguyen 	/* Find middle of window for each DQ bit */
22273da42859SDinh Nguyen 	mid_min = left_edge[0] - right_edge[0];
22283da42859SDinh Nguyen 	min_index = 0;
22293da42859SDinh Nguyen 	for (i = 1; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++) {
22303da42859SDinh Nguyen 		mid = left_edge[i] - right_edge[i];
22313da42859SDinh Nguyen 		if (mid < mid_min) {
22323da42859SDinh Nguyen 			mid_min = mid;
22333da42859SDinh Nguyen 			min_index = i;
22343da42859SDinh Nguyen 		}
22353da42859SDinh Nguyen 	}
22363da42859SDinh Nguyen 
22373da42859SDinh Nguyen 	/*
22383da42859SDinh Nguyen 	 * -mid_min/2 represents the amount that we need to move DQS.
22393da42859SDinh Nguyen 	 * If mid_min is odd and positive we'll need to add one to
22403da42859SDinh Nguyen 	 * make sure the rounding in further calculations is correct
22413da42859SDinh Nguyen 	 * (always bias to the right), so just add 1 for all positive values.
22423da42859SDinh Nguyen 	 */
22433da42859SDinh Nguyen 	if (mid_min > 0)
22443da42859SDinh Nguyen 		mid_min++;
22453da42859SDinh Nguyen 
22463da42859SDinh Nguyen 	mid_min = mid_min / 2;
22473da42859SDinh Nguyen 
22483da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d vfifo_center: mid_min=%d (index=%u)\n",
22493da42859SDinh Nguyen 		   __func__, __LINE__, mid_min, min_index);
22503da42859SDinh Nguyen 
22513da42859SDinh Nguyen 	/* Determine the amount we can change DQS (which is -mid_min) */
22523da42859SDinh Nguyen 	orig_mid_min = mid_min;
22533da42859SDinh Nguyen 	new_dqs = start_dqs - mid_min;
22543da42859SDinh Nguyen 	if (new_dqs > IO_DQS_IN_DELAY_MAX)
22553da42859SDinh Nguyen 		new_dqs = IO_DQS_IN_DELAY_MAX;
22563da42859SDinh Nguyen 	else if (new_dqs < 0)
22573da42859SDinh Nguyen 		new_dqs = 0;
22583da42859SDinh Nguyen 
22593da42859SDinh Nguyen 	mid_min = start_dqs - new_dqs;
22603da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "vfifo_center: new mid_min=%d new_dqs=%d\n",
22613da42859SDinh Nguyen 		   mid_min, new_dqs);
22623da42859SDinh Nguyen 
22633da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
22643da42859SDinh Nguyen 		if (start_dqs_en - mid_min > IO_DQS_EN_DELAY_MAX)
22653da42859SDinh Nguyen 			mid_min += start_dqs_en - mid_min - IO_DQS_EN_DELAY_MAX;
22663da42859SDinh Nguyen 		else if (start_dqs_en - mid_min < 0)
22673da42859SDinh Nguyen 			mid_min += start_dqs_en - mid_min;
22683da42859SDinh Nguyen 	}
22693da42859SDinh Nguyen 	new_dqs = start_dqs - mid_min;
22703da42859SDinh Nguyen 
22713da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "vfifo_center: start_dqs=%d start_dqs_en=%d \
22723da42859SDinh Nguyen 		   new_dqs=%d mid_min=%d\n", start_dqs,
22733da42859SDinh Nguyen 		   IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS ? start_dqs_en : -1,
22743da42859SDinh Nguyen 		   new_dqs, mid_min);
22753da42859SDinh Nguyen 
22763da42859SDinh Nguyen 	/* Initialize data for export structures */
22773da42859SDinh Nguyen 	dqs_margin = IO_IO_IN_DELAY_MAX + 1;
22783da42859SDinh Nguyen 	dq_margin  = IO_IO_IN_DELAY_MAX + 1;
22793da42859SDinh Nguyen 
2280*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_IN_DELAY_OFFSET;
22813da42859SDinh Nguyen 	/* add delay to bring centre of all DQ windows to the same "level" */
22823da42859SDinh Nguyen 	for (i = 0, p = test_bgn; i < RW_MGR_MEM_DQ_PER_READ_DQS; i++, p++) {
22833da42859SDinh Nguyen 		/* Use values before divide by 2 to reduce round off error */
22843da42859SDinh Nguyen 		shift_dq = (left_edge[i] - right_edge[i] -
22853da42859SDinh Nguyen 			(left_edge[min_index] - right_edge[min_index]))/2  +
22863da42859SDinh Nguyen 			(orig_mid_min - mid_min);
22873da42859SDinh Nguyen 
22883da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "vfifo_center: before: \
22893da42859SDinh Nguyen 			   shift_dq[%u]=%d\n", i, shift_dq);
22903da42859SDinh Nguyen 
22913da42859SDinh Nguyen 		temp_dq_in_delay1 = readl(SOCFPGA_SDR_ADDRESS + addr + (p << 2));
22923da42859SDinh Nguyen 		temp_dq_in_delay2 = readl(SOCFPGA_SDR_ADDRESS + addr + (i << 2));
22933da42859SDinh Nguyen 
22943da42859SDinh Nguyen 		if (shift_dq + (int32_t)temp_dq_in_delay1 >
22953da42859SDinh Nguyen 			(int32_t)IO_IO_IN_DELAY_MAX) {
22963da42859SDinh Nguyen 			shift_dq = (int32_t)IO_IO_IN_DELAY_MAX - temp_dq_in_delay2;
22973da42859SDinh Nguyen 		} else if (shift_dq + (int32_t)temp_dq_in_delay1 < 0) {
22983da42859SDinh Nguyen 			shift_dq = -(int32_t)temp_dq_in_delay1;
22993da42859SDinh Nguyen 		}
23003da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "vfifo_center: after: \
23013da42859SDinh Nguyen 			   shift_dq[%u]=%d\n", i, shift_dq);
23023da42859SDinh Nguyen 		final_dq[i] = temp_dq_in_delay1 + shift_dq;
23033da42859SDinh Nguyen 		scc_mgr_set_dq_in_delay(write_group, p, final_dq[i]);
23043da42859SDinh Nguyen 		scc_mgr_load_dq(p);
23053da42859SDinh Nguyen 
23063da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "vfifo_center: margin[%u]=[%d,%d]\n", i,
23073da42859SDinh Nguyen 			   left_edge[i] - shift_dq + (-mid_min),
23083da42859SDinh Nguyen 			   right_edge[i] + shift_dq - (-mid_min));
23093da42859SDinh Nguyen 		/* To determine values for export structures */
23103da42859SDinh Nguyen 		if (left_edge[i] - shift_dq + (-mid_min) < dq_margin)
23113da42859SDinh Nguyen 			dq_margin = left_edge[i] - shift_dq + (-mid_min);
23123da42859SDinh Nguyen 
23133da42859SDinh Nguyen 		if (right_edge[i] + shift_dq - (-mid_min) < dqs_margin)
23143da42859SDinh Nguyen 			dqs_margin = right_edge[i] + shift_dq - (-mid_min);
23153da42859SDinh Nguyen 	}
23163da42859SDinh Nguyen 
23173da42859SDinh Nguyen 	final_dqs = new_dqs;
23183da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS)
23193da42859SDinh Nguyen 		final_dqs_en = start_dqs_en - mid_min;
23203da42859SDinh Nguyen 
23213da42859SDinh Nguyen 	/* Move DQS-en */
23223da42859SDinh Nguyen 	if (IO_SHIFT_DQS_EN_WHEN_SHIFT_DQS) {
23233da42859SDinh Nguyen 		scc_mgr_set_dqs_en_delay(read_group, final_dqs_en);
23243da42859SDinh Nguyen 		scc_mgr_load_dqs(read_group);
23253da42859SDinh Nguyen 	}
23263da42859SDinh Nguyen 
23273da42859SDinh Nguyen 	/* Move DQS */
23283da42859SDinh Nguyen 	scc_mgr_set_dqs_bus_in_delay(read_group, final_dqs);
23293da42859SDinh Nguyen 	scc_mgr_load_dqs(read_group);
23303da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d vfifo_center: dq_margin=%d \
23313da42859SDinh Nguyen 		   dqs_margin=%d", __func__, __LINE__,
23323da42859SDinh Nguyen 		   dq_margin, dqs_margin);
23333da42859SDinh Nguyen 
23343da42859SDinh Nguyen 	/*
23353da42859SDinh Nguyen 	 * Do not remove this line as it makes sure all of our decisions
23363da42859SDinh Nguyen 	 * have been applied. Apply the update bit.
23373da42859SDinh Nguyen 	 */
2338e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
23393da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
23403da42859SDinh Nguyen 
23413da42859SDinh Nguyen 	return (dq_margin >= 0) && (dqs_margin >= 0);
23423da42859SDinh Nguyen }
23433da42859SDinh Nguyen 
23443da42859SDinh Nguyen /*
23453da42859SDinh Nguyen  * calibrate the read valid prediction FIFO.
23463da42859SDinh Nguyen  *
23473da42859SDinh Nguyen  *  - read valid prediction will consist of finding a good DQS enable phase,
23483da42859SDinh Nguyen  * DQS enable delay, DQS input phase, and DQS input delay.
23493da42859SDinh Nguyen  *  - we also do a per-bit deskew on the DQ lines.
23503da42859SDinh Nguyen  */
23513da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo(uint32_t read_group,
23523da42859SDinh Nguyen 					   uint32_t test_bgn)
23533da42859SDinh Nguyen {
23543da42859SDinh Nguyen 	uint32_t p, d, rank_bgn, sr;
23553da42859SDinh Nguyen 	uint32_t dtaps_per_ptap;
23563da42859SDinh Nguyen 	uint32_t tmp_delay;
23573da42859SDinh Nguyen 	uint32_t bit_chk;
23583da42859SDinh Nguyen 	uint32_t grp_calibrated;
23593da42859SDinh Nguyen 	uint32_t write_group, write_test_bgn;
23603da42859SDinh Nguyen 	uint32_t failed_substage;
23613da42859SDinh Nguyen 
23627ac40d25SMarek Vasut 	debug("%s:%d: %u %u\n", __func__, __LINE__, read_group, test_bgn);
23633da42859SDinh Nguyen 
23643da42859SDinh Nguyen 	/* update info for sims */
23653da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_VFIFO);
23663da42859SDinh Nguyen 
23673da42859SDinh Nguyen 	write_group = read_group;
23683da42859SDinh Nguyen 	write_test_bgn = test_bgn;
23693da42859SDinh Nguyen 
23703da42859SDinh Nguyen 	/* USER Determine number of delay taps for each phase tap */
23713da42859SDinh Nguyen 	dtaps_per_ptap = 0;
23723da42859SDinh Nguyen 	tmp_delay = 0;
23733da42859SDinh Nguyen 	while (tmp_delay < IO_DELAY_PER_OPA_TAP) {
23743da42859SDinh Nguyen 		dtaps_per_ptap++;
23753da42859SDinh Nguyen 		tmp_delay += IO_DELAY_PER_DQS_EN_DCHAIN_TAP;
23763da42859SDinh Nguyen 	}
23773da42859SDinh Nguyen 	dtaps_per_ptap--;
23783da42859SDinh Nguyen 	tmp_delay = 0;
23793da42859SDinh Nguyen 
23803da42859SDinh Nguyen 	/* update info for sims */
23813da42859SDinh Nguyen 	reg_file_set_group(read_group);
23823da42859SDinh Nguyen 
23833da42859SDinh Nguyen 	grp_calibrated = 0;
23843da42859SDinh Nguyen 
23853da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_GUARANTEED_READ);
23863da42859SDinh Nguyen 	failed_substage = CAL_SUBSTAGE_GUARANTEED_READ;
23873da42859SDinh Nguyen 
23883da42859SDinh Nguyen 	for (d = 0; d <= dtaps_per_ptap && grp_calibrated == 0; d += 2) {
23893da42859SDinh Nguyen 		/*
23903da42859SDinh Nguyen 		 * In RLDRAMX we may be messing the delay of pins in
23913da42859SDinh Nguyen 		 * the same write group but outside of the current read
23923da42859SDinh Nguyen 		 * the group, but that's ok because we haven't
23933da42859SDinh Nguyen 		 * calibrated output side yet.
23943da42859SDinh Nguyen 		 */
23953da42859SDinh Nguyen 		if (d > 0) {
23963da42859SDinh Nguyen 			scc_mgr_apply_group_all_out_delay_add_all_ranks
23973da42859SDinh Nguyen 			(write_group, write_test_bgn, d);
23983da42859SDinh Nguyen 		}
23993da42859SDinh Nguyen 
24003da42859SDinh Nguyen 		for (p = 0; p <= IO_DQDQS_OUT_PHASE_MAX && grp_calibrated == 0;
24013da42859SDinh Nguyen 			p++) {
24023da42859SDinh Nguyen 			/* set a particular dqdqs phase */
24033da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase_all_ranks(read_group, p);
24043da42859SDinh Nguyen 
24053da42859SDinh Nguyen 			debug_cond(DLEVEL == 1, "%s:%d calibrate_vfifo: g=%u \
24063da42859SDinh Nguyen 				   p=%u d=%u\n", __func__, __LINE__,
24073da42859SDinh Nguyen 				   read_group, p, d);
24083da42859SDinh Nguyen 
24093da42859SDinh Nguyen 			/*
24103da42859SDinh Nguyen 			 * Load up the patterns used by read calibration
24113da42859SDinh Nguyen 			 * using current DQDQS phase.
24123da42859SDinh Nguyen 			 */
24133da42859SDinh Nguyen 			rw_mgr_mem_calibrate_read_load_patterns(0, 1);
24143da42859SDinh Nguyen 			if (!(gbl->phy_debug_mode_flags &
24153da42859SDinh Nguyen 				PHY_DEBUG_DISABLE_GUARANTEED_READ)) {
24163da42859SDinh Nguyen 				if (!rw_mgr_mem_calibrate_read_test_patterns_all_ranks
24173da42859SDinh Nguyen 				    (read_group, 1, &bit_chk)) {
24183da42859SDinh Nguyen 					debug_cond(DLEVEL == 1, "%s:%d Guaranteed read test failed:",
24193da42859SDinh Nguyen 						   __func__, __LINE__);
24203da42859SDinh Nguyen 					debug_cond(DLEVEL == 1, " g=%u p=%u d=%u\n",
24213da42859SDinh Nguyen 						   read_group, p, d);
24223da42859SDinh Nguyen 					break;
24233da42859SDinh Nguyen 				}
24243da42859SDinh Nguyen 			}
24253da42859SDinh Nguyen 
24263da42859SDinh Nguyen /* case:56390 */
24273da42859SDinh Nguyen 			grp_calibrated = 1;
24283da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_vfifo_find_dqs_en_phase_sweep_dq_in_delay
24293da42859SDinh Nguyen 		    (write_group, read_group, test_bgn)) {
24303da42859SDinh Nguyen 				/*
24313da42859SDinh Nguyen 				 * USER Read per-bit deskew can be done on a
24323da42859SDinh Nguyen 				 * per shadow register basis.
24333da42859SDinh Nguyen 				 */
24343da42859SDinh Nguyen 				for (rank_bgn = 0, sr = 0;
24353da42859SDinh Nguyen 					rank_bgn < RW_MGR_MEM_NUMBER_OF_RANKS;
24363da42859SDinh Nguyen 					rank_bgn += NUM_RANKS_PER_SHADOW_REG,
24373da42859SDinh Nguyen 					++sr) {
24383da42859SDinh Nguyen 					/*
24393da42859SDinh Nguyen 					 * Determine if this set of ranks
24403da42859SDinh Nguyen 					 * should be skipped entirely.
24413da42859SDinh Nguyen 					 */
24423da42859SDinh Nguyen 					if (!param->skip_shadow_regs[sr]) {
24433da42859SDinh Nguyen 						/*
24443da42859SDinh Nguyen 						 * If doing read after write
24453da42859SDinh Nguyen 						 * calibration, do not update
24463da42859SDinh Nguyen 						 * FOM, now - do it then.
24473da42859SDinh Nguyen 						 */
24483da42859SDinh Nguyen 					if (!rw_mgr_mem_calibrate_vfifo_center
24493da42859SDinh Nguyen 						(rank_bgn, write_group,
24503da42859SDinh Nguyen 						read_group, test_bgn, 1, 0)) {
24513da42859SDinh Nguyen 							grp_calibrated = 0;
24523da42859SDinh Nguyen 							failed_substage =
24533da42859SDinh Nguyen 						CAL_SUBSTAGE_VFIFO_CENTER;
24543da42859SDinh Nguyen 						}
24553da42859SDinh Nguyen 					}
24563da42859SDinh Nguyen 				}
24573da42859SDinh Nguyen 			} else {
24583da42859SDinh Nguyen 				grp_calibrated = 0;
24593da42859SDinh Nguyen 				failed_substage = CAL_SUBSTAGE_DQS_EN_PHASE;
24603da42859SDinh Nguyen 			}
24613da42859SDinh Nguyen 		}
24623da42859SDinh Nguyen 	}
24633da42859SDinh Nguyen 
24643da42859SDinh Nguyen 	if (grp_calibrated == 0) {
24653da42859SDinh Nguyen 		set_failing_group_stage(write_group, CAL_STAGE_VFIFO,
24663da42859SDinh Nguyen 					failed_substage);
24673da42859SDinh Nguyen 		return 0;
24683da42859SDinh Nguyen 	}
24693da42859SDinh Nguyen 
24703da42859SDinh Nguyen 	/*
24713da42859SDinh Nguyen 	 * Reset the delay chains back to zero if they have moved > 1
24723da42859SDinh Nguyen 	 * (check for > 1 because loop will increase d even when pass in
24733da42859SDinh Nguyen 	 * first case).
24743da42859SDinh Nguyen 	 */
24753da42859SDinh Nguyen 	if (d > 2)
24763da42859SDinh Nguyen 		scc_mgr_zero_group(write_group, write_test_bgn, 1);
24773da42859SDinh Nguyen 
24783da42859SDinh Nguyen 	return 1;
24793da42859SDinh Nguyen }
24803da42859SDinh Nguyen 
24813da42859SDinh Nguyen /* VFIFO Calibration -- Read Deskew Calibration after write deskew */
24823da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_vfifo_end(uint32_t read_group,
24833da42859SDinh Nguyen 					       uint32_t test_bgn)
24843da42859SDinh Nguyen {
24853da42859SDinh Nguyen 	uint32_t rank_bgn, sr;
24863da42859SDinh Nguyen 	uint32_t grp_calibrated;
24873da42859SDinh Nguyen 	uint32_t write_group;
24883da42859SDinh Nguyen 
24893da42859SDinh Nguyen 	debug("%s:%d %u %u", __func__, __LINE__, read_group, test_bgn);
24903da42859SDinh Nguyen 
24913da42859SDinh Nguyen 	/* update info for sims */
24923da42859SDinh Nguyen 
24933da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_VFIFO_AFTER_WRITES);
24943da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_VFIFO_CENTER);
24953da42859SDinh Nguyen 
24963da42859SDinh Nguyen 	write_group = read_group;
24973da42859SDinh Nguyen 
24983da42859SDinh Nguyen 	/* update info for sims */
24993da42859SDinh Nguyen 	reg_file_set_group(read_group);
25003da42859SDinh Nguyen 
25013da42859SDinh Nguyen 	grp_calibrated = 1;
25023da42859SDinh Nguyen 	/* Read per-bit deskew can be done on a per shadow register basis */
25033da42859SDinh Nguyen 	for (rank_bgn = 0, sr = 0; rank_bgn < RW_MGR_MEM_NUMBER_OF_RANKS;
25043da42859SDinh Nguyen 		rank_bgn += NUM_RANKS_PER_SHADOW_REG, ++sr) {
25053da42859SDinh Nguyen 		/* Determine if this set of ranks should be skipped entirely */
25063da42859SDinh Nguyen 		if (!param->skip_shadow_regs[sr]) {
25073da42859SDinh Nguyen 		/* This is the last calibration round, update FOM here */
25083da42859SDinh Nguyen 			if (!rw_mgr_mem_calibrate_vfifo_center(rank_bgn,
25093da42859SDinh Nguyen 								write_group,
25103da42859SDinh Nguyen 								read_group,
25113da42859SDinh Nguyen 								test_bgn, 0,
25123da42859SDinh Nguyen 								1)) {
25133da42859SDinh Nguyen 				grp_calibrated = 0;
25143da42859SDinh Nguyen 			}
25153da42859SDinh Nguyen 		}
25163da42859SDinh Nguyen 	}
25173da42859SDinh Nguyen 
25183da42859SDinh Nguyen 
25193da42859SDinh Nguyen 	if (grp_calibrated == 0) {
25203da42859SDinh Nguyen 		set_failing_group_stage(write_group,
25213da42859SDinh Nguyen 					CAL_STAGE_VFIFO_AFTER_WRITES,
25223da42859SDinh Nguyen 					CAL_SUBSTAGE_VFIFO_CENTER);
25233da42859SDinh Nguyen 		return 0;
25243da42859SDinh Nguyen 	}
25253da42859SDinh Nguyen 
25263da42859SDinh Nguyen 	return 1;
25273da42859SDinh Nguyen }
25283da42859SDinh Nguyen 
25293da42859SDinh Nguyen /* Calibrate LFIFO to find smallest read latency */
25303da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_lfifo(void)
25313da42859SDinh Nguyen {
25323da42859SDinh Nguyen 	uint32_t found_one;
25333da42859SDinh Nguyen 	uint32_t bit_chk;
25343da42859SDinh Nguyen 	uint32_t addr;
25353da42859SDinh Nguyen 
25363da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
25373da42859SDinh Nguyen 
25383da42859SDinh Nguyen 	/* update info for sims */
25393da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_LFIFO);
25403da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_READ_LATENCY);
25413da42859SDinh Nguyen 
25423da42859SDinh Nguyen 	/* Load up the patterns used by read calibration for all ranks */
25433da42859SDinh Nguyen 	rw_mgr_mem_calibrate_read_load_patterns(0, 1);
25443da42859SDinh Nguyen 	found_one = 0;
25453da42859SDinh Nguyen 
25461bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cfg->phy_rlat;
25473da42859SDinh Nguyen 	do {
25483da42859SDinh Nguyen 		writel(gbl->curr_read_lat, SOCFPGA_SDR_ADDRESS + addr);
25493da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d lfifo: read_lat=%u",
25503da42859SDinh Nguyen 			   __func__, __LINE__, gbl->curr_read_lat);
25513da42859SDinh Nguyen 
25523da42859SDinh Nguyen 		if (!rw_mgr_mem_calibrate_read_test_all_ranks(0,
25533da42859SDinh Nguyen 							      NUM_READ_TESTS,
25543da42859SDinh Nguyen 							      PASS_ALL_BITS,
25553da42859SDinh Nguyen 							      &bit_chk, 1)) {
25563da42859SDinh Nguyen 			break;
25573da42859SDinh Nguyen 		}
25583da42859SDinh Nguyen 
25593da42859SDinh Nguyen 		found_one = 1;
25603da42859SDinh Nguyen 		/* reduce read latency and see if things are working */
25613da42859SDinh Nguyen 		/* correctly */
25623da42859SDinh Nguyen 		gbl->curr_read_lat--;
25633da42859SDinh Nguyen 	} while (gbl->curr_read_lat > 0);
25643da42859SDinh Nguyen 
25653da42859SDinh Nguyen 	/* reset the fifos to get pointers to known state */
25663da42859SDinh Nguyen 
25671bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cmd->fifo_reset;
25683da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
25693da42859SDinh Nguyen 
25703da42859SDinh Nguyen 	if (found_one) {
25713da42859SDinh Nguyen 		/* add a fudge factor to the read latency that was determined */
25723da42859SDinh Nguyen 		gbl->curr_read_lat += 2;
25731bc6f14aSMarek Vasut 		addr = (u32)&phy_mgr_cfg->phy_rlat;
25743da42859SDinh Nguyen 		writel(gbl->curr_read_lat, SOCFPGA_SDR_ADDRESS + addr);
25753da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d lfifo: success: using \
25763da42859SDinh Nguyen 			   read_lat=%u\n", __func__, __LINE__,
25773da42859SDinh Nguyen 			   gbl->curr_read_lat);
25783da42859SDinh Nguyen 		return 1;
25793da42859SDinh Nguyen 	} else {
25803da42859SDinh Nguyen 		set_failing_group_stage(0xff, CAL_STAGE_LFIFO,
25813da42859SDinh Nguyen 					CAL_SUBSTAGE_READ_LATENCY);
25823da42859SDinh Nguyen 
25833da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d lfifo: failed at initial \
25843da42859SDinh Nguyen 			   read_lat=%u\n", __func__, __LINE__,
25853da42859SDinh Nguyen 			   gbl->curr_read_lat);
25863da42859SDinh Nguyen 		return 0;
25873da42859SDinh Nguyen 	}
25883da42859SDinh Nguyen }
25893da42859SDinh Nguyen 
25903da42859SDinh Nguyen /*
25913da42859SDinh Nguyen  * issue write test command.
25923da42859SDinh Nguyen  * two variants are provided. one that just tests a write pattern and
25933da42859SDinh Nguyen  * another that tests datamask functionality.
25943da42859SDinh Nguyen  */
25953da42859SDinh Nguyen static void rw_mgr_mem_calibrate_write_test_issue(uint32_t group,
25963da42859SDinh Nguyen 						  uint32_t test_dm)
25973da42859SDinh Nguyen {
25983da42859SDinh Nguyen 	uint32_t mcc_instruction;
25993da42859SDinh Nguyen 	uint32_t quick_write_mode = (((STATIC_CALIB_STEPS) & CALIB_SKIP_WRITES) &&
26003da42859SDinh Nguyen 		ENABLE_SUPER_QUICK_CALIBRATION);
26013da42859SDinh Nguyen 	uint32_t rw_wl_nop_cycles;
26023da42859SDinh Nguyen 	uint32_t addr;
26033da42859SDinh Nguyen 
26043da42859SDinh Nguyen 	/*
26053da42859SDinh Nguyen 	 * Set counter and jump addresses for the right
26063da42859SDinh Nguyen 	 * number of NOP cycles.
26073da42859SDinh Nguyen 	 * The number of supported NOP cycles can range from -1 to infinity
26083da42859SDinh Nguyen 	 * Three different cases are handled:
26093da42859SDinh Nguyen 	 *
26103da42859SDinh Nguyen 	 * 1. For a number of NOP cycles greater than 0, the RW Mgr looping
26113da42859SDinh Nguyen 	 *    mechanism will be used to insert the right number of NOPs
26123da42859SDinh Nguyen 	 *
26133da42859SDinh Nguyen 	 * 2. For a number of NOP cycles equals to 0, the micro-instruction
26143da42859SDinh Nguyen 	 *    issuing the write command will jump straight to the
26153da42859SDinh Nguyen 	 *    micro-instruction that turns on DQS (for DDRx), or outputs write
26163da42859SDinh Nguyen 	 *    data (for RLD), skipping
26173da42859SDinh Nguyen 	 *    the NOP micro-instruction all together
26183da42859SDinh Nguyen 	 *
26193da42859SDinh Nguyen 	 * 3. A number of NOP cycles equal to -1 indicates that DQS must be
26203da42859SDinh Nguyen 	 *    turned on in the same micro-instruction that issues the write
26213da42859SDinh Nguyen 	 *    command. Then we need
26223da42859SDinh Nguyen 	 *    to directly jump to the micro-instruction that sends out the data
26233da42859SDinh Nguyen 	 *
26243da42859SDinh Nguyen 	 * NOTE: Implementing this mechanism uses 2 RW Mgr jump-counters
26253da42859SDinh Nguyen 	 *       (2 and 3). One jump-counter (0) is used to perform multiple
26263da42859SDinh Nguyen 	 *       write-read operations.
26273da42859SDinh Nguyen 	 *       one counter left to issue this command in "multiple-group" mode
26283da42859SDinh Nguyen 	 */
26293da42859SDinh Nguyen 
26303da42859SDinh Nguyen 	rw_wl_nop_cycles = gbl->rw_wl_nop_cycles;
26313da42859SDinh Nguyen 
26323da42859SDinh Nguyen 	if (rw_wl_nop_cycles == -1) {
26333da42859SDinh Nguyen 		/*
26343da42859SDinh Nguyen 		 * CNTR 2 - We want to execute the special write operation that
26353da42859SDinh Nguyen 		 * turns on DQS right away and then skip directly to the
26363da42859SDinh Nguyen 		 * instruction that sends out the data. We set the counter to a
26373da42859SDinh Nguyen 		 * large number so that the jump is always taken.
26383da42859SDinh Nguyen 		 */
26396afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr2;
26403da42859SDinh Nguyen 		writel(0xFF, SOCFPGA_SDR_ADDRESS + addr);
26413da42859SDinh Nguyen 
26423da42859SDinh Nguyen 		/* CNTR 3 - Not used */
26433da42859SDinh Nguyen 		if (test_dm) {
26443da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_DM_BANK_0_WL_1;
26456afb4fe2SMarek Vasut 			addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add2;
26463da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_DATA,
26473da42859SDinh Nguyen 			       SOCFPGA_SDR_ADDRESS + addr);
26486afb4fe2SMarek Vasut 			addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add3;
26493da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_NOP,
26503da42859SDinh Nguyen 			       SOCFPGA_SDR_ADDRESS + addr);
26513da42859SDinh Nguyen 		} else {
26523da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_BANK_0_WL_1;
26536afb4fe2SMarek Vasut 			addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add2;
26543da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_BANK_0_DATA, SOCFPGA_SDR_ADDRESS + addr);
26556afb4fe2SMarek Vasut 			addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add3;
26563da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_BANK_0_NOP, SOCFPGA_SDR_ADDRESS + addr);
26573da42859SDinh Nguyen 		}
26583da42859SDinh Nguyen 	} else if (rw_wl_nop_cycles == 0) {
26593da42859SDinh Nguyen 		/*
26603da42859SDinh Nguyen 		 * CNTR 2 - We want to skip the NOP operation and go straight
26613da42859SDinh Nguyen 		 * to the DQS enable instruction. We set the counter to a large
26623da42859SDinh Nguyen 		 * number so that the jump is always taken.
26633da42859SDinh Nguyen 		 */
26646afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr2;
26653da42859SDinh Nguyen 		writel(0xFF, SOCFPGA_SDR_ADDRESS + addr);
26663da42859SDinh Nguyen 
26673da42859SDinh Nguyen 		/* CNTR 3 - Not used */
26683da42859SDinh Nguyen 		if (test_dm) {
26693da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_DM_BANK_0;
26706afb4fe2SMarek Vasut 			addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add2;
26713da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_DQS,
26723da42859SDinh Nguyen 			       SOCFPGA_SDR_ADDRESS + addr);
26733da42859SDinh Nguyen 		} else {
26743da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_BANK_0;
26756afb4fe2SMarek Vasut 			addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add2;
26763da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_BANK_0_DQS, SOCFPGA_SDR_ADDRESS + addr);
26773da42859SDinh Nguyen 		}
26783da42859SDinh Nguyen 	} else {
26793da42859SDinh Nguyen 		/*
26803da42859SDinh Nguyen 		 * CNTR 2 - In this case we want to execute the next instruction
26813da42859SDinh Nguyen 		 * and NOT take the jump. So we set the counter to 0. The jump
26823da42859SDinh Nguyen 		 * address doesn't count.
26833da42859SDinh Nguyen 		 */
26846afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr2;
26853da42859SDinh Nguyen 		writel(0x0, SOCFPGA_SDR_ADDRESS + addr);
26866afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add2;
26873da42859SDinh Nguyen 		writel(0x0, SOCFPGA_SDR_ADDRESS + addr);
26883da42859SDinh Nguyen 
26893da42859SDinh Nguyen 		/*
26903da42859SDinh Nguyen 		 * CNTR 3 - Set the nop counter to the number of cycles we
26913da42859SDinh Nguyen 		 * need to loop for, minus 1.
26923da42859SDinh Nguyen 		 */
26936afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr3;
26943da42859SDinh Nguyen 		writel(rw_wl_nop_cycles - 1, SOCFPGA_SDR_ADDRESS + addr);
26953da42859SDinh Nguyen 		if (test_dm) {
26963da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_DM_BANK_0;
26976afb4fe2SMarek Vasut 			addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add3;
26983da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_NOP, SOCFPGA_SDR_ADDRESS + addr);
26993da42859SDinh Nguyen 		} else {
27003da42859SDinh Nguyen 			mcc_instruction = RW_MGR_LFSR_WR_RD_BANK_0;
27016afb4fe2SMarek Vasut 			addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add3;
27023da42859SDinh Nguyen 			writel(RW_MGR_LFSR_WR_RD_BANK_0_NOP, SOCFPGA_SDR_ADDRESS + addr);
27033da42859SDinh Nguyen 		}
27043da42859SDinh Nguyen 	}
27053da42859SDinh Nguyen 
2706*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RESET_READ_DATAPATH_OFFSET;
27073da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
27083da42859SDinh Nguyen 
27096afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_mgr_regs->load_cntr0;
27103da42859SDinh Nguyen 	if (quick_write_mode)
27113da42859SDinh Nguyen 		writel(0x08, SOCFPGA_SDR_ADDRESS + addr);
27123da42859SDinh Nguyen 	else
27133da42859SDinh Nguyen 		writel(0x40, SOCFPGA_SDR_ADDRESS + addr);
27143da42859SDinh Nguyen 
27156afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add0;
27163da42859SDinh Nguyen 	writel(mcc_instruction, SOCFPGA_SDR_ADDRESS + addr);
27173da42859SDinh Nguyen 
27183da42859SDinh Nguyen 	/*
27193da42859SDinh Nguyen 	 * CNTR 1 - This is used to ensure enough time elapses
27203da42859SDinh Nguyen 	 * for read data to come back.
27213da42859SDinh Nguyen 	 */
27226afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_mgr_regs->load_cntr1;
27233da42859SDinh Nguyen 	writel(0x30, SOCFPGA_SDR_ADDRESS + addr);
27243da42859SDinh Nguyen 
27256afb4fe2SMarek Vasut 	addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add1;
27263da42859SDinh Nguyen 	if (test_dm) {
27273da42859SDinh Nguyen 		writel(RW_MGR_LFSR_WR_RD_DM_BANK_0_WAIT, SOCFPGA_SDR_ADDRESS + addr);
27283da42859SDinh Nguyen 	} else {
27293da42859SDinh Nguyen 		writel(RW_MGR_LFSR_WR_RD_BANK_0_WAIT, SOCFPGA_SDR_ADDRESS + addr);
27303da42859SDinh Nguyen 	}
27313da42859SDinh Nguyen 
2732*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
27333da42859SDinh Nguyen 	writel(mcc_instruction, SOCFPGA_SDR_ADDRESS + addr + (group << 2));
27343da42859SDinh Nguyen }
27353da42859SDinh Nguyen 
27363da42859SDinh Nguyen /* Test writes, can check for a single bit pass or multiple bit pass */
27373da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_write_test(uint32_t rank_bgn,
27383da42859SDinh Nguyen 	uint32_t write_group, uint32_t use_dm, uint32_t all_correct,
27393da42859SDinh Nguyen 	uint32_t *bit_chk, uint32_t all_ranks)
27403da42859SDinh Nguyen {
27413da42859SDinh Nguyen 	uint32_t addr;
27423da42859SDinh Nguyen 	uint32_t r;
27433da42859SDinh Nguyen 	uint32_t correct_mask_vg;
27443da42859SDinh Nguyen 	uint32_t tmp_bit_chk;
27453da42859SDinh Nguyen 	uint32_t vg;
27463da42859SDinh Nguyen 	uint32_t rank_end = all_ranks ? RW_MGR_MEM_NUMBER_OF_RANKS :
27473da42859SDinh Nguyen 		(rank_bgn + NUM_RANKS_PER_SHADOW_REG);
27483da42859SDinh Nguyen 	uint32_t addr_rw_mgr;
27493da42859SDinh Nguyen 	uint32_t base_rw_mgr;
27503da42859SDinh Nguyen 
27513da42859SDinh Nguyen 	*bit_chk = param->write_correct_mask;
27523da42859SDinh Nguyen 	correct_mask_vg = param->write_correct_mask_vg;
27533da42859SDinh Nguyen 
27543da42859SDinh Nguyen 	for (r = rank_bgn; r < rank_end; r++) {
27553da42859SDinh Nguyen 		if (param->skip_ranks[r]) {
27563da42859SDinh Nguyen 			/* request to skip the rank */
27573da42859SDinh Nguyen 			continue;
27583da42859SDinh Nguyen 		}
27593da42859SDinh Nguyen 
27603da42859SDinh Nguyen 		/* set rank */
27613da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_READ_WRITE);
27623da42859SDinh Nguyen 
27633da42859SDinh Nguyen 		tmp_bit_chk = 0;
27641bc6f14aSMarek Vasut 		addr = (u32)&phy_mgr_cmd->fifo_reset;
2765a4bfa463SMarek Vasut 		addr_rw_mgr = SDR_PHYGRP_RWMGRGRP_ADDRESS;
27663da42859SDinh Nguyen 		for (vg = RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS-1; ; vg--) {
27673da42859SDinh Nguyen 			/* reset the fifos to get pointers to known state */
27683da42859SDinh Nguyen 			writel(0, SOCFPGA_SDR_ADDRESS + addr);
27693da42859SDinh Nguyen 
27703da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk <<
27713da42859SDinh Nguyen 				(RW_MGR_MEM_DQ_PER_WRITE_DQS /
27723da42859SDinh Nguyen 				RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS);
27733da42859SDinh Nguyen 			rw_mgr_mem_calibrate_write_test_issue(write_group *
27743da42859SDinh Nguyen 				RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS+vg,
27753da42859SDinh Nguyen 				use_dm);
27763da42859SDinh Nguyen 
27773da42859SDinh Nguyen 			base_rw_mgr = readl(SOCFPGA_SDR_ADDRESS + addr_rw_mgr);
27783da42859SDinh Nguyen 			tmp_bit_chk = tmp_bit_chk | (correct_mask_vg & ~(base_rw_mgr));
27793da42859SDinh Nguyen 			if (vg == 0)
27803da42859SDinh Nguyen 				break;
27813da42859SDinh Nguyen 		}
27823da42859SDinh Nguyen 		*bit_chk &= tmp_bit_chk;
27833da42859SDinh Nguyen 	}
27843da42859SDinh Nguyen 
27853da42859SDinh Nguyen 	if (all_correct) {
27863da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
27873da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_test(%u,%u,ALL) : %u == \
27883da42859SDinh Nguyen 			   %u => %lu", write_group, use_dm,
27893da42859SDinh Nguyen 			   *bit_chk, param->write_correct_mask,
27903da42859SDinh Nguyen 			   (long unsigned int)(*bit_chk ==
27913da42859SDinh Nguyen 			   param->write_correct_mask));
27923da42859SDinh Nguyen 		return *bit_chk == param->write_correct_mask;
27933da42859SDinh Nguyen 	} else {
27943da42859SDinh Nguyen 		set_rank_and_odt_mask(0, RW_MGR_ODT_MODE_OFF);
27953da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_test(%u,%u,ONE) : %u != ",
27963da42859SDinh Nguyen 		       write_group, use_dm, *bit_chk);
27973da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%lu" " => %lu", (long unsigned int)0,
27983da42859SDinh Nguyen 			(long unsigned int)(*bit_chk != 0));
27993da42859SDinh Nguyen 		return *bit_chk != 0x00;
28003da42859SDinh Nguyen 	}
28013da42859SDinh Nguyen }
28023da42859SDinh Nguyen 
28033da42859SDinh Nguyen /*
28043da42859SDinh Nguyen  * center all windows. do per-bit-deskew to possibly increase size of
28053da42859SDinh Nguyen  * certain windows.
28063da42859SDinh Nguyen  */
28073da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_writes_center(uint32_t rank_bgn,
28083da42859SDinh Nguyen 	uint32_t write_group, uint32_t test_bgn)
28093da42859SDinh Nguyen {
28103da42859SDinh Nguyen 	uint32_t i, p, min_index;
28113da42859SDinh Nguyen 	int32_t d;
28123da42859SDinh Nguyen 	/*
28133da42859SDinh Nguyen 	 * Store these as signed since there are comparisons with
28143da42859SDinh Nguyen 	 * signed numbers.
28153da42859SDinh Nguyen 	 */
28163da42859SDinh Nguyen 	uint32_t bit_chk;
28173da42859SDinh Nguyen 	uint32_t sticky_bit_chk;
28183da42859SDinh Nguyen 	int32_t left_edge[RW_MGR_MEM_DQ_PER_WRITE_DQS];
28193da42859SDinh Nguyen 	int32_t right_edge[RW_MGR_MEM_DQ_PER_WRITE_DQS];
28203da42859SDinh Nguyen 	int32_t mid;
28213da42859SDinh Nguyen 	int32_t mid_min, orig_mid_min;
28223da42859SDinh Nguyen 	int32_t new_dqs, start_dqs, shift_dq;
28233da42859SDinh Nguyen 	int32_t dq_margin, dqs_margin, dm_margin;
28243da42859SDinh Nguyen 	uint32_t stop;
28253da42859SDinh Nguyen 	uint32_t temp_dq_out1_delay;
28263da42859SDinh Nguyen 	uint32_t addr;
28273da42859SDinh Nguyen 
28283da42859SDinh Nguyen 	debug("%s:%d %u %u", __func__, __LINE__, write_group, test_bgn);
28293da42859SDinh Nguyen 
28303da42859SDinh Nguyen 	dm_margin = 0;
28313da42859SDinh Nguyen 
2832*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
28333da42859SDinh Nguyen 	start_dqs = readl(SOCFPGA_SDR_ADDRESS + addr +
28343da42859SDinh Nguyen 			  (RW_MGR_MEM_DQ_PER_WRITE_DQS << 2));
28353da42859SDinh Nguyen 
28363da42859SDinh Nguyen 	/* per-bit deskew */
28373da42859SDinh Nguyen 
28383da42859SDinh Nguyen 	/*
28393da42859SDinh Nguyen 	 * set the left and right edge of each bit to an illegal value
28403da42859SDinh Nguyen 	 * use (IO_IO_OUT1_DELAY_MAX + 1) as an illegal value.
28413da42859SDinh Nguyen 	 */
28423da42859SDinh Nguyen 	sticky_bit_chk = 0;
28433da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
28443da42859SDinh Nguyen 		left_edge[i]  = IO_IO_OUT1_DELAY_MAX + 1;
28453da42859SDinh Nguyen 		right_edge[i] = IO_IO_OUT1_DELAY_MAX + 1;
28463da42859SDinh Nguyen 	}
28473da42859SDinh Nguyen 
28483da42859SDinh Nguyen 	/* Search for the left edge of the window for each bit */
2849e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
28503da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_OUT1_DELAY_MAX; d++) {
28513da42859SDinh Nguyen 		scc_mgr_apply_group_dq_out1_delay(write_group, test_bgn, d);
28523da42859SDinh Nguyen 
28533da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
28543da42859SDinh Nguyen 
28553da42859SDinh Nguyen 		/*
28563da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
28573da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
28583da42859SDinh Nguyen 		 */
28593da42859SDinh Nguyen 		stop = !rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
28603da42859SDinh Nguyen 			0, PASS_ONE_BIT, &bit_chk, 0);
28613da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
28623da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->write_correct_mask);
28633da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center(left): dtap=%d => %u \
28643da42859SDinh Nguyen 			   == %u && %u [bit_chk= %u ]\n",
28653da42859SDinh Nguyen 			d, sticky_bit_chk, param->write_correct_mask,
28663da42859SDinh Nguyen 			stop, bit_chk);
28673da42859SDinh Nguyen 
28683da42859SDinh Nguyen 		if (stop == 1) {
28693da42859SDinh Nguyen 			break;
28703da42859SDinh Nguyen 		} else {
28713da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
28723da42859SDinh Nguyen 				if (bit_chk & 1) {
28733da42859SDinh Nguyen 					/*
28743da42859SDinh Nguyen 					 * Remember a passing test as the
28753da42859SDinh Nguyen 					 * left_edge.
28763da42859SDinh Nguyen 					 */
28773da42859SDinh Nguyen 					left_edge[i] = d;
28783da42859SDinh Nguyen 				} else {
28793da42859SDinh Nguyen 					/*
28803da42859SDinh Nguyen 					 * If a left edge has not been seen
28813da42859SDinh Nguyen 					 * yet, then a future passing test will
28823da42859SDinh Nguyen 					 * mark this edge as the right edge.
28833da42859SDinh Nguyen 					 */
28843da42859SDinh Nguyen 					if (left_edge[i] ==
28853da42859SDinh Nguyen 						IO_IO_OUT1_DELAY_MAX + 1) {
28863da42859SDinh Nguyen 						right_edge[i] = -(d + 1);
28873da42859SDinh Nguyen 					}
28883da42859SDinh Nguyen 				}
28893da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "write_center[l,d=%d):", d);
28903da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "bit_chk_test=%d left_edge[%u]: %d",
28913da42859SDinh Nguyen 					   (int)(bit_chk & 1), i, left_edge[i]);
28923da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "right_edge[%u]: %d\n", i,
28933da42859SDinh Nguyen 				       right_edge[i]);
28943da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
28953da42859SDinh Nguyen 			}
28963da42859SDinh Nguyen 		}
28973da42859SDinh Nguyen 	}
28983da42859SDinh Nguyen 
28993da42859SDinh Nguyen 	/* Reset DQ delay chains to 0 */
29003da42859SDinh Nguyen 	scc_mgr_apply_group_dq_out1_delay(write_group, test_bgn, 0);
29013da42859SDinh Nguyen 	sticky_bit_chk = 0;
29023da42859SDinh Nguyen 	for (i = RW_MGR_MEM_DQ_PER_WRITE_DQS - 1;; i--) {
29033da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d write_center: left_edge[%u]: \
29043da42859SDinh Nguyen 			   %d right_edge[%u]: %d\n", __func__, __LINE__,
29053da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
29063da42859SDinh Nguyen 
29073da42859SDinh Nguyen 		/*
29083da42859SDinh Nguyen 		 * Check for cases where we haven't found the left edge,
29093da42859SDinh Nguyen 		 * which makes our assignment of the the right edge invalid.
29103da42859SDinh Nguyen 		 * Reset it to the illegal value.
29113da42859SDinh Nguyen 		 */
29123da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_OUT1_DELAY_MAX + 1) &&
29133da42859SDinh Nguyen 		    (right_edge[i] != IO_IO_OUT1_DELAY_MAX + 1)) {
29143da42859SDinh Nguyen 			right_edge[i] = IO_IO_OUT1_DELAY_MAX + 1;
29153da42859SDinh Nguyen 			debug_cond(DLEVEL == 2, "%s:%d write_center: reset \
29163da42859SDinh Nguyen 				   right_edge[%u]: %d\n", __func__, __LINE__,
29173da42859SDinh Nguyen 				   i, right_edge[i]);
29183da42859SDinh Nguyen 		}
29193da42859SDinh Nguyen 
29203da42859SDinh Nguyen 		/*
29213da42859SDinh Nguyen 		 * Reset sticky bit (except for bits where we have
29223da42859SDinh Nguyen 		 * seen the left edge).
29233da42859SDinh Nguyen 		 */
29243da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk << 1;
29253da42859SDinh Nguyen 		if ((left_edge[i] != IO_IO_OUT1_DELAY_MAX + 1))
29263da42859SDinh Nguyen 			sticky_bit_chk = sticky_bit_chk | 1;
29273da42859SDinh Nguyen 
29283da42859SDinh Nguyen 		if (i == 0)
29293da42859SDinh Nguyen 			break;
29303da42859SDinh Nguyen 	}
29313da42859SDinh Nguyen 
29323da42859SDinh Nguyen 	/* Search for the right edge of the window for each bit */
2933e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
29343da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_OUT1_DELAY_MAX - start_dqs; d++) {
29353da42859SDinh Nguyen 		scc_mgr_apply_group_dqs_io_and_oct_out1(write_group,
29363da42859SDinh Nguyen 							d + start_dqs);
29373da42859SDinh Nguyen 
29383da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
29393da42859SDinh Nguyen 
29403da42859SDinh Nguyen 		/*
29413da42859SDinh Nguyen 		 * Stop searching when the read test doesn't pass AND when
29423da42859SDinh Nguyen 		 * we've seen a passing read on every bit.
29433da42859SDinh Nguyen 		 */
29443da42859SDinh Nguyen 		stop = !rw_mgr_mem_calibrate_write_test(rank_bgn, write_group,
29453da42859SDinh Nguyen 			0, PASS_ONE_BIT, &bit_chk, 0);
29463da42859SDinh Nguyen 
29473da42859SDinh Nguyen 		sticky_bit_chk = sticky_bit_chk | bit_chk;
29483da42859SDinh Nguyen 		stop = stop && (sticky_bit_chk == param->write_correct_mask);
29493da42859SDinh Nguyen 
29503da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center (right): dtap=%u => %u == \
29513da42859SDinh Nguyen 			   %u && %u\n", d, sticky_bit_chk,
29523da42859SDinh Nguyen 			   param->write_correct_mask, stop);
29533da42859SDinh Nguyen 
29543da42859SDinh Nguyen 		if (stop == 1) {
29553da42859SDinh Nguyen 			if (d == 0) {
29563da42859SDinh Nguyen 				for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS;
29573da42859SDinh Nguyen 					i++) {
29583da42859SDinh Nguyen 					/* d = 0 failed, but it passed when
29593da42859SDinh Nguyen 					testing the left edge, so it must be
29603da42859SDinh Nguyen 					marginal, set it to -1 */
29613da42859SDinh Nguyen 					if (right_edge[i] ==
29623da42859SDinh Nguyen 						IO_IO_OUT1_DELAY_MAX + 1 &&
29633da42859SDinh Nguyen 						left_edge[i] !=
29643da42859SDinh Nguyen 						IO_IO_OUT1_DELAY_MAX + 1) {
29653da42859SDinh Nguyen 						right_edge[i] = -1;
29663da42859SDinh Nguyen 					}
29673da42859SDinh Nguyen 				}
29683da42859SDinh Nguyen 			}
29693da42859SDinh Nguyen 			break;
29703da42859SDinh Nguyen 		} else {
29713da42859SDinh Nguyen 			for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
29723da42859SDinh Nguyen 				if (bit_chk & 1) {
29733da42859SDinh Nguyen 					/*
29743da42859SDinh Nguyen 					 * Remember a passing test as
29753da42859SDinh Nguyen 					 * the right_edge.
29763da42859SDinh Nguyen 					 */
29773da42859SDinh Nguyen 					right_edge[i] = d;
29783da42859SDinh Nguyen 				} else {
29793da42859SDinh Nguyen 					if (d != 0) {
29803da42859SDinh Nguyen 						/*
29813da42859SDinh Nguyen 						 * If a right edge has not
29823da42859SDinh Nguyen 						 * been seen yet, then a future
29833da42859SDinh Nguyen 						 * passing test will mark this
29843da42859SDinh Nguyen 						 * edge as the left edge.
29853da42859SDinh Nguyen 						 */
29863da42859SDinh Nguyen 						if (right_edge[i] ==
29873da42859SDinh Nguyen 						    IO_IO_OUT1_DELAY_MAX + 1)
29883da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
29893da42859SDinh Nguyen 					} else {
29903da42859SDinh Nguyen 						/*
29913da42859SDinh Nguyen 						 * d = 0 failed, but it passed
29923da42859SDinh Nguyen 						 * when testing the left edge,
29933da42859SDinh Nguyen 						 * so it must be marginal, set
29943da42859SDinh Nguyen 						 * it to -1.
29953da42859SDinh Nguyen 						 */
29963da42859SDinh Nguyen 						if (right_edge[i] ==
29973da42859SDinh Nguyen 						    IO_IO_OUT1_DELAY_MAX + 1 &&
29983da42859SDinh Nguyen 						    left_edge[i] !=
29993da42859SDinh Nguyen 						    IO_IO_OUT1_DELAY_MAX + 1)
30003da42859SDinh Nguyen 							right_edge[i] = -1;
30013da42859SDinh Nguyen 						/*
30023da42859SDinh Nguyen 						 * If a right edge has not been
30033da42859SDinh Nguyen 						 * seen yet, then a future
30043da42859SDinh Nguyen 						 * passing test will mark this
30053da42859SDinh Nguyen 						 * edge as the left edge.
30063da42859SDinh Nguyen 						 */
30073da42859SDinh Nguyen 						else if (right_edge[i] ==
30083da42859SDinh Nguyen 							IO_IO_OUT1_DELAY_MAX +
30093da42859SDinh Nguyen 							1)
30103da42859SDinh Nguyen 							left_edge[i] = -(d + 1);
30113da42859SDinh Nguyen 					}
30123da42859SDinh Nguyen 				}
30133da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "write_center[r,d=%d):", d);
30143da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "bit_chk_test=%d left_edge[%u]: %d",
30153da42859SDinh Nguyen 					   (int)(bit_chk & 1), i, left_edge[i]);
30163da42859SDinh Nguyen 				debug_cond(DLEVEL == 2, "right_edge[%u]: %d\n", i,
30173da42859SDinh Nguyen 					   right_edge[i]);
30183da42859SDinh Nguyen 				bit_chk = bit_chk >> 1;
30193da42859SDinh Nguyen 			}
30203da42859SDinh Nguyen 		}
30213da42859SDinh Nguyen 	}
30223da42859SDinh Nguyen 
30233da42859SDinh Nguyen 	/* Check that all bits have a window */
30243da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
30253da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d write_center: left_edge[%u]: \
30263da42859SDinh Nguyen 			   %d right_edge[%u]: %d", __func__, __LINE__,
30273da42859SDinh Nguyen 			   i, left_edge[i], i, right_edge[i]);
30283da42859SDinh Nguyen 		if ((left_edge[i] == IO_IO_OUT1_DELAY_MAX + 1) ||
30293da42859SDinh Nguyen 		    (right_edge[i] == IO_IO_OUT1_DELAY_MAX + 1)) {
30303da42859SDinh Nguyen 			set_failing_group_stage(test_bgn + i,
30313da42859SDinh Nguyen 						CAL_STAGE_WRITES,
30323da42859SDinh Nguyen 						CAL_SUBSTAGE_WRITES_CENTER);
30333da42859SDinh Nguyen 			return 0;
30343da42859SDinh Nguyen 		}
30353da42859SDinh Nguyen 	}
30363da42859SDinh Nguyen 
30373da42859SDinh Nguyen 	/* Find middle of window for each DQ bit */
30383da42859SDinh Nguyen 	mid_min = left_edge[0] - right_edge[0];
30393da42859SDinh Nguyen 	min_index = 0;
30403da42859SDinh Nguyen 	for (i = 1; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++) {
30413da42859SDinh Nguyen 		mid = left_edge[i] - right_edge[i];
30423da42859SDinh Nguyen 		if (mid < mid_min) {
30433da42859SDinh Nguyen 			mid_min = mid;
30443da42859SDinh Nguyen 			min_index = i;
30453da42859SDinh Nguyen 		}
30463da42859SDinh Nguyen 	}
30473da42859SDinh Nguyen 
30483da42859SDinh Nguyen 	/*
30493da42859SDinh Nguyen 	 * -mid_min/2 represents the amount that we need to move DQS.
30503da42859SDinh Nguyen 	 * If mid_min is odd and positive we'll need to add one to
30513da42859SDinh Nguyen 	 * make sure the rounding in further calculations is correct
30523da42859SDinh Nguyen 	 * (always bias to the right), so just add 1 for all positive values.
30533da42859SDinh Nguyen 	 */
30543da42859SDinh Nguyen 	if (mid_min > 0)
30553da42859SDinh Nguyen 		mid_min++;
30563da42859SDinh Nguyen 	mid_min = mid_min / 2;
30573da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d write_center: mid_min=%d\n", __func__,
30583da42859SDinh Nguyen 		   __LINE__, mid_min);
30593da42859SDinh Nguyen 
30603da42859SDinh Nguyen 	/* Determine the amount we can change DQS (which is -mid_min) */
30613da42859SDinh Nguyen 	orig_mid_min = mid_min;
30623da42859SDinh Nguyen 	new_dqs = start_dqs;
30633da42859SDinh Nguyen 	mid_min = 0;
30643da42859SDinh Nguyen 	debug_cond(DLEVEL == 1, "%s:%d write_center: start_dqs=%d new_dqs=%d \
30653da42859SDinh Nguyen 		   mid_min=%d\n", __func__, __LINE__, start_dqs, new_dqs, mid_min);
30663da42859SDinh Nguyen 	/* Initialize data for export structures */
30673da42859SDinh Nguyen 	dqs_margin = IO_IO_OUT1_DELAY_MAX + 1;
30683da42859SDinh Nguyen 	dq_margin  = IO_IO_OUT1_DELAY_MAX + 1;
30693da42859SDinh Nguyen 
30703da42859SDinh Nguyen 	/* add delay to bring centre of all DQ windows to the same "level" */
3071*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_IO_OUT1_DELAY_OFFSET;
30723da42859SDinh Nguyen 	for (i = 0, p = test_bgn; i < RW_MGR_MEM_DQ_PER_WRITE_DQS; i++, p++) {
30733da42859SDinh Nguyen 		/* Use values before divide by 2 to reduce round off error */
30743da42859SDinh Nguyen 		shift_dq = (left_edge[i] - right_edge[i] -
30753da42859SDinh Nguyen 			(left_edge[min_index] - right_edge[min_index]))/2  +
30763da42859SDinh Nguyen 		(orig_mid_min - mid_min);
30773da42859SDinh Nguyen 
30783da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "%s:%d write_center: before: shift_dq \
30793da42859SDinh Nguyen 			   [%u]=%d\n", __func__, __LINE__, i, shift_dq);
30803da42859SDinh Nguyen 
30813da42859SDinh Nguyen 		temp_dq_out1_delay = readl(SOCFPGA_SDR_ADDRESS + addr + (i << 2));
30823da42859SDinh Nguyen 		if (shift_dq + (int32_t)temp_dq_out1_delay >
30833da42859SDinh Nguyen 			(int32_t)IO_IO_OUT1_DELAY_MAX) {
30843da42859SDinh Nguyen 			shift_dq = (int32_t)IO_IO_OUT1_DELAY_MAX - temp_dq_out1_delay;
30853da42859SDinh Nguyen 		} else if (shift_dq + (int32_t)temp_dq_out1_delay < 0) {
30863da42859SDinh Nguyen 			shift_dq = -(int32_t)temp_dq_out1_delay;
30873da42859SDinh Nguyen 		}
30883da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center: after: shift_dq[%u]=%d\n",
30893da42859SDinh Nguyen 			   i, shift_dq);
30903da42859SDinh Nguyen 		scc_mgr_set_dq_out1_delay(write_group, i, temp_dq_out1_delay +
30913da42859SDinh Nguyen 					  shift_dq);
30923da42859SDinh Nguyen 		scc_mgr_load_dq(i);
30933da42859SDinh Nguyen 
30943da42859SDinh Nguyen 		debug_cond(DLEVEL == 2, "write_center: margin[%u]=[%d,%d]\n", i,
30953da42859SDinh Nguyen 			   left_edge[i] - shift_dq + (-mid_min),
30963da42859SDinh Nguyen 			   right_edge[i] + shift_dq - (-mid_min));
30973da42859SDinh Nguyen 		/* To determine values for export structures */
30983da42859SDinh Nguyen 		if (left_edge[i] - shift_dq + (-mid_min) < dq_margin)
30993da42859SDinh Nguyen 			dq_margin = left_edge[i] - shift_dq + (-mid_min);
31003da42859SDinh Nguyen 
31013da42859SDinh Nguyen 		if (right_edge[i] + shift_dq - (-mid_min) < dqs_margin)
31023da42859SDinh Nguyen 			dqs_margin = right_edge[i] + shift_dq - (-mid_min);
31033da42859SDinh Nguyen 	}
31043da42859SDinh Nguyen 
31053da42859SDinh Nguyen 	/* Move DQS */
31063da42859SDinh Nguyen 	scc_mgr_apply_group_dqs_io_and_oct_out1(write_group, new_dqs);
3107e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
31083da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
31093da42859SDinh Nguyen 
31103da42859SDinh Nguyen 	/* Centre DM */
31113da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d write_center: DM\n", __func__, __LINE__);
31123da42859SDinh Nguyen 
31133da42859SDinh Nguyen 	/*
31143da42859SDinh Nguyen 	 * set the left and right edge of each bit to an illegal value,
31153da42859SDinh Nguyen 	 * use (IO_IO_OUT1_DELAY_MAX + 1) as an illegal value,
31163da42859SDinh Nguyen 	 */
31173da42859SDinh Nguyen 	left_edge[0]  = IO_IO_OUT1_DELAY_MAX + 1;
31183da42859SDinh Nguyen 	right_edge[0] = IO_IO_OUT1_DELAY_MAX + 1;
31193da42859SDinh Nguyen 	int32_t bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
31203da42859SDinh Nguyen 	int32_t end_curr = IO_IO_OUT1_DELAY_MAX + 1;
31213da42859SDinh Nguyen 	int32_t bgn_best = IO_IO_OUT1_DELAY_MAX + 1;
31223da42859SDinh Nguyen 	int32_t end_best = IO_IO_OUT1_DELAY_MAX + 1;
31233da42859SDinh Nguyen 	int32_t win_best = 0;
31243da42859SDinh Nguyen 
31253da42859SDinh Nguyen 	/* Search for the/part of the window with DM shift */
3126e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
31273da42859SDinh Nguyen 	for (d = IO_IO_OUT1_DELAY_MAX; d >= 0; d -= DELTA_D) {
31283da42859SDinh Nguyen 		scc_mgr_apply_group_dm_out1_delay(write_group, d);
31293da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
31303da42859SDinh Nguyen 
31313da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_write_test(rank_bgn, write_group, 1,
31323da42859SDinh Nguyen 						    PASS_ALL_BITS, &bit_chk,
31333da42859SDinh Nguyen 						    0)) {
31343da42859SDinh Nguyen 			/* USE Set current end of the window */
31353da42859SDinh Nguyen 			end_curr = -d;
31363da42859SDinh Nguyen 			/*
31373da42859SDinh Nguyen 			 * If a starting edge of our window has not been seen
31383da42859SDinh Nguyen 			 * this is our current start of the DM window.
31393da42859SDinh Nguyen 			 */
31403da42859SDinh Nguyen 			if (bgn_curr == IO_IO_OUT1_DELAY_MAX + 1)
31413da42859SDinh Nguyen 				bgn_curr = -d;
31423da42859SDinh Nguyen 
31433da42859SDinh Nguyen 			/*
31443da42859SDinh Nguyen 			 * If current window is bigger than best seen.
31453da42859SDinh Nguyen 			 * Set best seen to be current window.
31463da42859SDinh Nguyen 			 */
31473da42859SDinh Nguyen 			if ((end_curr-bgn_curr+1) > win_best) {
31483da42859SDinh Nguyen 				win_best = end_curr-bgn_curr+1;
31493da42859SDinh Nguyen 				bgn_best = bgn_curr;
31503da42859SDinh Nguyen 				end_best = end_curr;
31513da42859SDinh Nguyen 			}
31523da42859SDinh Nguyen 		} else {
31533da42859SDinh Nguyen 			/* We just saw a failing test. Reset temp edge */
31543da42859SDinh Nguyen 			bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
31553da42859SDinh Nguyen 			end_curr = IO_IO_OUT1_DELAY_MAX + 1;
31563da42859SDinh Nguyen 			}
31573da42859SDinh Nguyen 		}
31583da42859SDinh Nguyen 
31593da42859SDinh Nguyen 
31603da42859SDinh Nguyen 	/* Reset DM delay chains to 0 */
31613da42859SDinh Nguyen 	scc_mgr_apply_group_dm_out1_delay(write_group, 0);
31623da42859SDinh Nguyen 
31633da42859SDinh Nguyen 	/*
31643da42859SDinh Nguyen 	 * Check to see if the current window nudges up aganist 0 delay.
31653da42859SDinh Nguyen 	 * If so we need to continue the search by shifting DQS otherwise DQS
31663da42859SDinh Nguyen 	 * search begins as a new search. */
31673da42859SDinh Nguyen 	if (end_curr != 0) {
31683da42859SDinh Nguyen 		bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
31693da42859SDinh Nguyen 		end_curr = IO_IO_OUT1_DELAY_MAX + 1;
31703da42859SDinh Nguyen 	}
31713da42859SDinh Nguyen 
31723da42859SDinh Nguyen 	/* Search for the/part of the window with DQS shifts */
3173e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
31743da42859SDinh Nguyen 	for (d = 0; d <= IO_IO_OUT1_DELAY_MAX - new_dqs; d += DELTA_D) {
31753da42859SDinh Nguyen 		/*
31763da42859SDinh Nguyen 		 * Note: This only shifts DQS, so are we limiting ourselve to
31773da42859SDinh Nguyen 		 * width of DQ unnecessarily.
31783da42859SDinh Nguyen 		 */
31793da42859SDinh Nguyen 		scc_mgr_apply_group_dqs_io_and_oct_out1(write_group,
31803da42859SDinh Nguyen 							d + new_dqs);
31813da42859SDinh Nguyen 
31823da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
31833da42859SDinh Nguyen 		if (rw_mgr_mem_calibrate_write_test(rank_bgn, write_group, 1,
31843da42859SDinh Nguyen 						    PASS_ALL_BITS, &bit_chk,
31853da42859SDinh Nguyen 						    0)) {
31863da42859SDinh Nguyen 			/* USE Set current end of the window */
31873da42859SDinh Nguyen 			end_curr = d;
31883da42859SDinh Nguyen 			/*
31893da42859SDinh Nguyen 			 * If a beginning edge of our window has not been seen
31903da42859SDinh Nguyen 			 * this is our current begin of the DM window.
31913da42859SDinh Nguyen 			 */
31923da42859SDinh Nguyen 			if (bgn_curr == IO_IO_OUT1_DELAY_MAX + 1)
31933da42859SDinh Nguyen 				bgn_curr = d;
31943da42859SDinh Nguyen 
31953da42859SDinh Nguyen 			/*
31963da42859SDinh Nguyen 			 * If current window is bigger than best seen. Set best
31973da42859SDinh Nguyen 			 * seen to be current window.
31983da42859SDinh Nguyen 			 */
31993da42859SDinh Nguyen 			if ((end_curr-bgn_curr+1) > win_best) {
32003da42859SDinh Nguyen 				win_best = end_curr-bgn_curr+1;
32013da42859SDinh Nguyen 				bgn_best = bgn_curr;
32023da42859SDinh Nguyen 				end_best = end_curr;
32033da42859SDinh Nguyen 			}
32043da42859SDinh Nguyen 		} else {
32053da42859SDinh Nguyen 			/* We just saw a failing test. Reset temp edge */
32063da42859SDinh Nguyen 			bgn_curr = IO_IO_OUT1_DELAY_MAX + 1;
32073da42859SDinh Nguyen 			end_curr = IO_IO_OUT1_DELAY_MAX + 1;
32083da42859SDinh Nguyen 
32093da42859SDinh Nguyen 			/* Early exit optimization: if ther remaining delay
32103da42859SDinh Nguyen 			chain space is less than already seen largest window
32113da42859SDinh Nguyen 			we can exit */
32123da42859SDinh Nguyen 			if ((win_best-1) >
32133da42859SDinh Nguyen 				(IO_IO_OUT1_DELAY_MAX - new_dqs - d)) {
32143da42859SDinh Nguyen 					break;
32153da42859SDinh Nguyen 				}
32163da42859SDinh Nguyen 			}
32173da42859SDinh Nguyen 		}
32183da42859SDinh Nguyen 
32193da42859SDinh Nguyen 	/* assign left and right edge for cal and reporting; */
32203da42859SDinh Nguyen 	left_edge[0] = -1*bgn_best;
32213da42859SDinh Nguyen 	right_edge[0] = end_best;
32223da42859SDinh Nguyen 
32233da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d dm_calib: left=%d right=%d\n", __func__,
32243da42859SDinh Nguyen 		   __LINE__, left_edge[0], right_edge[0]);
32253da42859SDinh Nguyen 
32263da42859SDinh Nguyen 	/* Move DQS (back to orig) */
32273da42859SDinh Nguyen 	scc_mgr_apply_group_dqs_io_and_oct_out1(write_group, new_dqs);
32283da42859SDinh Nguyen 
32293da42859SDinh Nguyen 	/* Move DM */
32303da42859SDinh Nguyen 
32313da42859SDinh Nguyen 	/* Find middle of window for the DM bit */
32323da42859SDinh Nguyen 	mid = (left_edge[0] - right_edge[0]) / 2;
32333da42859SDinh Nguyen 
32343da42859SDinh Nguyen 	/* only move right, since we are not moving DQS/DQ */
32353da42859SDinh Nguyen 	if (mid < 0)
32363da42859SDinh Nguyen 		mid = 0;
32373da42859SDinh Nguyen 
32383da42859SDinh Nguyen 	/* dm_marign should fail if we never find a window */
32393da42859SDinh Nguyen 	if (win_best == 0)
32403da42859SDinh Nguyen 		dm_margin = -1;
32413da42859SDinh Nguyen 	else
32423da42859SDinh Nguyen 		dm_margin = left_edge[0] - mid;
32433da42859SDinh Nguyen 
32443da42859SDinh Nguyen 	scc_mgr_apply_group_dm_out1_delay(write_group, mid);
3245e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
32463da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
32473da42859SDinh Nguyen 
32483da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d dm_calib: left=%d right=%d mid=%d \
32493da42859SDinh Nguyen 		   dm_margin=%d\n", __func__, __LINE__, left_edge[0],
32503da42859SDinh Nguyen 		   right_edge[0], mid, dm_margin);
32513da42859SDinh Nguyen 	/* Export values */
32523da42859SDinh Nguyen 	gbl->fom_out += dq_margin + dqs_margin;
32533da42859SDinh Nguyen 
32543da42859SDinh Nguyen 	debug_cond(DLEVEL == 2, "%s:%d write_center: dq_margin=%d \
32553da42859SDinh Nguyen 		   dqs_margin=%d dm_margin=%d\n", __func__, __LINE__,
32563da42859SDinh Nguyen 		   dq_margin, dqs_margin, dm_margin);
32573da42859SDinh Nguyen 
32583da42859SDinh Nguyen 	/*
32593da42859SDinh Nguyen 	 * Do not remove this line as it makes sure all of our
32603da42859SDinh Nguyen 	 * decisions have been applied.
32613da42859SDinh Nguyen 	 */
3262e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
32633da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
32643da42859SDinh Nguyen 	return (dq_margin >= 0) && (dqs_margin >= 0) && (dm_margin >= 0);
32653da42859SDinh Nguyen }
32663da42859SDinh Nguyen 
32673da42859SDinh Nguyen /* calibrate the write operations */
32683da42859SDinh Nguyen static uint32_t rw_mgr_mem_calibrate_writes(uint32_t rank_bgn, uint32_t g,
32693da42859SDinh Nguyen 	uint32_t test_bgn)
32703da42859SDinh Nguyen {
32713da42859SDinh Nguyen 	/* update info for sims */
32723da42859SDinh Nguyen 	debug("%s:%d %u %u\n", __func__, __LINE__, g, test_bgn);
32733da42859SDinh Nguyen 
32743da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_WRITES);
32753da42859SDinh Nguyen 	reg_file_set_sub_stage(CAL_SUBSTAGE_WRITES_CENTER);
32763da42859SDinh Nguyen 
32773da42859SDinh Nguyen 	reg_file_set_group(g);
32783da42859SDinh Nguyen 
32793da42859SDinh Nguyen 	if (!rw_mgr_mem_calibrate_writes_center(rank_bgn, g, test_bgn)) {
32803da42859SDinh Nguyen 		set_failing_group_stage(g, CAL_STAGE_WRITES,
32813da42859SDinh Nguyen 					CAL_SUBSTAGE_WRITES_CENTER);
32823da42859SDinh Nguyen 		return 0;
32833da42859SDinh Nguyen 	}
32843da42859SDinh Nguyen 
32853da42859SDinh Nguyen 	return 1;
32863da42859SDinh Nguyen }
32873da42859SDinh Nguyen 
32883da42859SDinh Nguyen /* precharge all banks and activate row 0 in bank "000..." and bank "111..." */
32893da42859SDinh Nguyen static void mem_precharge_and_activate(void)
32903da42859SDinh Nguyen {
32913da42859SDinh Nguyen 	uint32_t r;
32923da42859SDinh Nguyen 	uint32_t addr;
32933da42859SDinh Nguyen 
32943da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS; r++) {
32953da42859SDinh Nguyen 		if (param->skip_ranks[r]) {
32963da42859SDinh Nguyen 			/* request to skip the rank */
32973da42859SDinh Nguyen 			continue;
32983da42859SDinh Nguyen 		}
32993da42859SDinh Nguyen 
33003da42859SDinh Nguyen 		/* set rank */
33013da42859SDinh Nguyen 		set_rank_and_odt_mask(r, RW_MGR_ODT_MODE_OFF);
33023da42859SDinh Nguyen 
33033da42859SDinh Nguyen 		/* precharge all banks ... */
3304*c4815f76SMarek Vasut 		addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
33053da42859SDinh Nguyen 		writel(RW_MGR_PRECHARGE_ALL, SOCFPGA_SDR_ADDRESS + addr);
33063da42859SDinh Nguyen 
33076afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr0;
33083da42859SDinh Nguyen 		writel(0x0F, SOCFPGA_SDR_ADDRESS + addr);
33096afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add0;
33103da42859SDinh Nguyen 		writel(RW_MGR_ACTIVATE_0_AND_1_WAIT1, SOCFPGA_SDR_ADDRESS + addr);
33113da42859SDinh Nguyen 
33126afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_mgr_regs->load_cntr1;
33133da42859SDinh Nguyen 		writel(0x0F, SOCFPGA_SDR_ADDRESS + addr);
33146afb4fe2SMarek Vasut 		addr = (u32)&sdr_rw_load_jump_mgr_regs->load_jump_add1;
33153da42859SDinh Nguyen 		writel(RW_MGR_ACTIVATE_0_AND_1_WAIT2, SOCFPGA_SDR_ADDRESS + addr);
33163da42859SDinh Nguyen 
33173da42859SDinh Nguyen 		/* activate rows */
3318*c4815f76SMarek Vasut 		addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_RUN_SINGLE_GROUP_OFFSET;
33193da42859SDinh Nguyen 		writel(RW_MGR_ACTIVATE_0_AND_1, SOCFPGA_SDR_ADDRESS + addr);
33203da42859SDinh Nguyen 	}
33213da42859SDinh Nguyen }
33223da42859SDinh Nguyen 
33233da42859SDinh Nguyen /* Configure various memory related parameters. */
33243da42859SDinh Nguyen static void mem_config(void)
33253da42859SDinh Nguyen {
33263da42859SDinh Nguyen 	uint32_t rlat, wlat;
33273da42859SDinh Nguyen 	uint32_t rw_wl_nop_cycles;
33283da42859SDinh Nguyen 	uint32_t max_latency;
33293da42859SDinh Nguyen 	uint32_t addr;
33303da42859SDinh Nguyen 
33313da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
33323da42859SDinh Nguyen 	/* read in write and read latency */
3333*c4815f76SMarek Vasut 	addr = (u32)&data_mgr->t_wl_add;
33343da42859SDinh Nguyen 	wlat = readl(SOCFPGA_SDR_ADDRESS + addr);
33353da42859SDinh Nguyen 
3336*c4815f76SMarek Vasut 	addr = (u32)&data_mgr->mem_t_add;
33373da42859SDinh Nguyen 	wlat += readl(SOCFPGA_SDR_ADDRESS + addr);
33383da42859SDinh Nguyen 	/* WL for hard phy does not include additive latency */
33393da42859SDinh Nguyen 
33403da42859SDinh Nguyen 	/*
33413da42859SDinh Nguyen 	 * add addtional write latency to offset the address/command extra
33423da42859SDinh Nguyen 	 * clock cycle. We change the AC mux setting causing AC to be delayed
33433da42859SDinh Nguyen 	 * by one mem clock cycle. Only do this for DDR3
33443da42859SDinh Nguyen 	 */
33453da42859SDinh Nguyen 	wlat = wlat + 1;
33463da42859SDinh Nguyen 
3347*c4815f76SMarek Vasut 	addr = (u32)&data_mgr->t_rl_add;
33483da42859SDinh Nguyen 	rlat = readl(SOCFPGA_SDR_ADDRESS + addr);
33493da42859SDinh Nguyen 
33503da42859SDinh Nguyen 	rw_wl_nop_cycles = wlat - 2;
33513da42859SDinh Nguyen 	gbl->rw_wl_nop_cycles = rw_wl_nop_cycles;
33523da42859SDinh Nguyen 
33533da42859SDinh Nguyen 	/*
33543da42859SDinh Nguyen 	 * For AV/CV, lfifo is hardened and always runs at full rate so
33553da42859SDinh Nguyen 	 * max latency in AFI clocks, used here, is correspondingly smaller.
33563da42859SDinh Nguyen 	 */
33573da42859SDinh Nguyen 	max_latency = (1<<MAX_LATENCY_COUNT_WIDTH)/1 - 1;
33583da42859SDinh Nguyen 	/* configure for a burst length of 8 */
33593da42859SDinh Nguyen 
33603da42859SDinh Nguyen 	/* write latency */
33613da42859SDinh Nguyen 	/* Adjust Write Latency for Hard PHY */
33623da42859SDinh Nguyen 	wlat = wlat + 1;
33633da42859SDinh Nguyen 
33643da42859SDinh Nguyen 	/* set a pretty high read latency initially */
33653da42859SDinh Nguyen 	gbl->curr_read_lat = rlat + 16;
33663da42859SDinh Nguyen 
33673da42859SDinh Nguyen 	if (gbl->curr_read_lat > max_latency)
33683da42859SDinh Nguyen 		gbl->curr_read_lat = max_latency;
33693da42859SDinh Nguyen 
33701bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cfg->phy_rlat;
33713da42859SDinh Nguyen 	writel(gbl->curr_read_lat, SOCFPGA_SDR_ADDRESS + addr);
33723da42859SDinh Nguyen 
33733da42859SDinh Nguyen 	/* advertise write latency */
33743da42859SDinh Nguyen 	gbl->curr_write_lat = wlat;
33751bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cfg->afi_wlat;
33763da42859SDinh Nguyen 	writel(wlat - 2, SOCFPGA_SDR_ADDRESS + addr);
33773da42859SDinh Nguyen 
33783da42859SDinh Nguyen 	/* initialize bit slips */
33793da42859SDinh Nguyen 	mem_precharge_and_activate();
33803da42859SDinh Nguyen }
33813da42859SDinh Nguyen 
33823da42859SDinh Nguyen /* Set VFIFO and LFIFO to instant-on settings in skip calibration mode */
33833da42859SDinh Nguyen static void mem_skip_calibrate(void)
33843da42859SDinh Nguyen {
33853da42859SDinh Nguyen 	uint32_t vfifo_offset;
33863da42859SDinh Nguyen 	uint32_t i, j, r;
33873da42859SDinh Nguyen 	uint32_t addr;
33883da42859SDinh Nguyen 
33893da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
33903da42859SDinh Nguyen 	/* Need to update every shadow register set used by the interface */
33913da42859SDinh Nguyen 	for (r = 0; r < RW_MGR_MEM_NUMBER_OF_RANKS;
33923da42859SDinh Nguyen 		r += NUM_RANKS_PER_SHADOW_REG) {
33933da42859SDinh Nguyen 		/*
33943da42859SDinh Nguyen 		 * Set output phase alignment settings appropriate for
33953da42859SDinh Nguyen 		 * skip calibration.
33963da42859SDinh Nguyen 		 */
33973da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
33983da42859SDinh Nguyen 			scc_mgr_set_dqs_en_phase(i, 0);
33993da42859SDinh Nguyen #if IO_DLL_CHAIN_LENGTH == 6
34003da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, 6);
34013da42859SDinh Nguyen #else
34023da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, 7);
34033da42859SDinh Nguyen #endif
34043da42859SDinh Nguyen 			/*
34053da42859SDinh Nguyen 			 * Case:33398
34063da42859SDinh Nguyen 			 *
34073da42859SDinh Nguyen 			 * Write data arrives to the I/O two cycles before write
34083da42859SDinh Nguyen 			 * latency is reached (720 deg).
34093da42859SDinh Nguyen 			 *   -> due to bit-slip in a/c bus
34103da42859SDinh Nguyen 			 *   -> to allow board skew where dqs is longer than ck
34113da42859SDinh Nguyen 			 *      -> how often can this happen!?
34123da42859SDinh Nguyen 			 *      -> can claim back some ptaps for high freq
34133da42859SDinh Nguyen 			 *       support if we can relax this, but i digress...
34143da42859SDinh Nguyen 			 *
34153da42859SDinh Nguyen 			 * The write_clk leads mem_ck by 90 deg
34163da42859SDinh Nguyen 			 * The minimum ptap of the OPA is 180 deg
34173da42859SDinh Nguyen 			 * Each ptap has (360 / IO_DLL_CHAIN_LENGH) deg of delay
34183da42859SDinh Nguyen 			 * The write_clk is always delayed by 2 ptaps
34193da42859SDinh Nguyen 			 *
34203da42859SDinh Nguyen 			 * Hence, to make DQS aligned to CK, we need to delay
34213da42859SDinh Nguyen 			 * DQS by:
34223da42859SDinh Nguyen 			 *    (720 - 90 - 180 - 2 * (360 / IO_DLL_CHAIN_LENGTH))
34233da42859SDinh Nguyen 			 *
34243da42859SDinh Nguyen 			 * Dividing the above by (360 / IO_DLL_CHAIN_LENGTH)
34253da42859SDinh Nguyen 			 * gives us the number of ptaps, which simplies to:
34263da42859SDinh Nguyen 			 *
34273da42859SDinh Nguyen 			 *    (1.25 * IO_DLL_CHAIN_LENGTH - 2)
34283da42859SDinh Nguyen 			 */
34293da42859SDinh Nguyen 			scc_mgr_set_dqdqs_output_phase(i, (1.25 *
34303da42859SDinh Nguyen 				IO_DLL_CHAIN_LENGTH - 2));
34313da42859SDinh Nguyen 		}
3432e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->dqs_ena;
34333da42859SDinh Nguyen 		writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
3434e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->dqs_io_ena;
34353da42859SDinh Nguyen 		writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
34363da42859SDinh Nguyen 
3437*c4815f76SMarek Vasut 		addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_GROUP_COUNTER_OFFSET;
34383da42859SDinh Nguyen 		for (i = 0; i < RW_MGR_MEM_IF_WRITE_DQS_WIDTH; i++) {
34393da42859SDinh Nguyen 			writel(i, SOCFPGA_SDR_ADDRESS + addr);
34403da42859SDinh Nguyen 		}
3441e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->dq_ena;
34423da42859SDinh Nguyen 		writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
3443e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->dm_ena;
34443da42859SDinh Nguyen 		writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
3445e79025a7SMarek Vasut 		addr = (u32)&sdr_scc_mgr->update;
34463da42859SDinh Nguyen 		writel(0, SOCFPGA_SDR_ADDRESS + addr);
34473da42859SDinh Nguyen 	}
34483da42859SDinh Nguyen 
34493da42859SDinh Nguyen 	/* Compensate for simulation model behaviour */
34503da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
34513da42859SDinh Nguyen 		scc_mgr_set_dqs_bus_in_delay(i, 10);
34523da42859SDinh Nguyen 		scc_mgr_load_dqs(i);
34533da42859SDinh Nguyen 	}
3454e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
34553da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
34563da42859SDinh Nguyen 
34573da42859SDinh Nguyen 	/*
34583da42859SDinh Nguyen 	 * ArriaV has hard FIFOs that can only be initialized by incrementing
34593da42859SDinh Nguyen 	 * in sequencer.
34603da42859SDinh Nguyen 	 */
34613da42859SDinh Nguyen 	vfifo_offset = CALIB_VFIFO_OFFSET;
34621bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cmd->inc_vfifo_hard_phy;
34633da42859SDinh Nguyen 	for (j = 0; j < vfifo_offset; j++) {
34643da42859SDinh Nguyen 		writel(0xff, SOCFPGA_SDR_ADDRESS + addr);
34653da42859SDinh Nguyen 	}
34661bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cmd->fifo_reset;
34673da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
34683da42859SDinh Nguyen 
34693da42859SDinh Nguyen 	/*
34703da42859SDinh Nguyen 	 * For ACV with hard lfifo, we get the skip-cal setting from
34713da42859SDinh Nguyen 	 * generation-time constant.
34723da42859SDinh Nguyen 	 */
34733da42859SDinh Nguyen 	gbl->curr_read_lat = CALIB_LFIFO_OFFSET;
34741bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cfg->phy_rlat;
34753da42859SDinh Nguyen 	writel(gbl->curr_read_lat, SOCFPGA_SDR_ADDRESS + addr);
34763da42859SDinh Nguyen }
34773da42859SDinh Nguyen 
34783da42859SDinh Nguyen /* Memory calibration entry point */
34793da42859SDinh Nguyen static uint32_t mem_calibrate(void)
34803da42859SDinh Nguyen {
34813da42859SDinh Nguyen 	uint32_t i;
34823da42859SDinh Nguyen 	uint32_t rank_bgn, sr;
34833da42859SDinh Nguyen 	uint32_t write_group, write_test_bgn;
34843da42859SDinh Nguyen 	uint32_t read_group, read_test_bgn;
34853da42859SDinh Nguyen 	uint32_t run_groups, current_run;
34863da42859SDinh Nguyen 	uint32_t failing_groups = 0;
34873da42859SDinh Nguyen 	uint32_t group_failed = 0;
34883da42859SDinh Nguyen 	uint32_t sr_failed = 0;
34893da42859SDinh Nguyen 	uint32_t addr;
34903da42859SDinh Nguyen 
34913da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
34923da42859SDinh Nguyen 	/* Initialize the data settings */
34933da42859SDinh Nguyen 
34943da42859SDinh Nguyen 	gbl->error_substage = CAL_SUBSTAGE_NIL;
34953da42859SDinh Nguyen 	gbl->error_stage = CAL_STAGE_NIL;
34963da42859SDinh Nguyen 	gbl->error_group = 0xff;
34973da42859SDinh Nguyen 	gbl->fom_in = 0;
34983da42859SDinh Nguyen 	gbl->fom_out = 0;
34993da42859SDinh Nguyen 
35003da42859SDinh Nguyen 	mem_config();
35013da42859SDinh Nguyen 
35023da42859SDinh Nguyen 	uint32_t bypass_mode = 0x1;
3503*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_GROUP_COUNTER_OFFSET;
35043da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_IF_READ_DQS_WIDTH; i++) {
35053da42859SDinh Nguyen 		writel(i, SOCFPGA_SDR_ADDRESS + addr);
35063da42859SDinh Nguyen 		scc_set_bypass_mode(i, bypass_mode);
35073da42859SDinh Nguyen 	}
35083da42859SDinh Nguyen 
35093da42859SDinh Nguyen 	if ((dyn_calib_steps & CALIB_SKIP_ALL) == CALIB_SKIP_ALL) {
35103da42859SDinh Nguyen 		/*
35113da42859SDinh Nguyen 		 * Set VFIFO and LFIFO to instant-on settings in skip
35123da42859SDinh Nguyen 		 * calibration mode.
35133da42859SDinh Nguyen 		 */
35143da42859SDinh Nguyen 		mem_skip_calibrate();
35153da42859SDinh Nguyen 	} else {
35163da42859SDinh Nguyen 		for (i = 0; i < NUM_CALIB_REPEAT; i++) {
35173da42859SDinh Nguyen 			/*
35183da42859SDinh Nguyen 			 * Zero all delay chain/phase settings for all
35193da42859SDinh Nguyen 			 * groups and all shadow register sets.
35203da42859SDinh Nguyen 			 */
35213da42859SDinh Nguyen 			scc_mgr_zero_all();
35223da42859SDinh Nguyen 
35233da42859SDinh Nguyen 			run_groups = ~param->skip_groups;
35243da42859SDinh Nguyen 
35253da42859SDinh Nguyen 			for (write_group = 0, write_test_bgn = 0; write_group
35263da42859SDinh Nguyen 				< RW_MGR_MEM_IF_WRITE_DQS_WIDTH; write_group++,
35273da42859SDinh Nguyen 				write_test_bgn += RW_MGR_MEM_DQ_PER_WRITE_DQS) {
35283da42859SDinh Nguyen 				/* Initialized the group failure */
35293da42859SDinh Nguyen 				group_failed = 0;
35303da42859SDinh Nguyen 
35313da42859SDinh Nguyen 				current_run = run_groups & ((1 <<
35323da42859SDinh Nguyen 					RW_MGR_NUM_DQS_PER_WRITE_GROUP) - 1);
35333da42859SDinh Nguyen 				run_groups = run_groups >>
35343da42859SDinh Nguyen 					RW_MGR_NUM_DQS_PER_WRITE_GROUP;
35353da42859SDinh Nguyen 
35363da42859SDinh Nguyen 				if (current_run == 0)
35373da42859SDinh Nguyen 					continue;
35383da42859SDinh Nguyen 
3539*c4815f76SMarek Vasut 				addr = SDR_PHYGRP_SCCGRP_ADDRESS | SCC_MGR_GROUP_COUNTER_OFFSET;
35403da42859SDinh Nguyen 				writel(write_group, SOCFPGA_SDR_ADDRESS + addr);
35413da42859SDinh Nguyen 				scc_mgr_zero_group(write_group, write_test_bgn,
35423da42859SDinh Nguyen 						   0);
35433da42859SDinh Nguyen 
35443da42859SDinh Nguyen 				for (read_group = write_group *
35453da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
35463da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH,
35473da42859SDinh Nguyen 					read_test_bgn = 0;
35483da42859SDinh Nguyen 					read_group < (write_group + 1) *
35493da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
35503da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH &&
35513da42859SDinh Nguyen 					group_failed == 0;
35523da42859SDinh Nguyen 					read_group++, read_test_bgn +=
35533da42859SDinh Nguyen 					RW_MGR_MEM_DQ_PER_READ_DQS) {
35543da42859SDinh Nguyen 					/* Calibrate the VFIFO */
35553da42859SDinh Nguyen 					if (!((STATIC_CALIB_STEPS) &
35563da42859SDinh Nguyen 						CALIB_SKIP_VFIFO)) {
35573da42859SDinh Nguyen 						if (!rw_mgr_mem_calibrate_vfifo
35583da42859SDinh Nguyen 							(read_group,
35593da42859SDinh Nguyen 							read_test_bgn)) {
35603da42859SDinh Nguyen 							group_failed = 1;
35613da42859SDinh Nguyen 
35623da42859SDinh Nguyen 							if (!(gbl->
35633da42859SDinh Nguyen 							phy_debug_mode_flags &
35643da42859SDinh Nguyen 						PHY_DEBUG_SWEEP_ALL_GROUPS)) {
35653da42859SDinh Nguyen 								return 0;
35663da42859SDinh Nguyen 							}
35673da42859SDinh Nguyen 						}
35683da42859SDinh Nguyen 					}
35693da42859SDinh Nguyen 				}
35703da42859SDinh Nguyen 
35713da42859SDinh Nguyen 				/* Calibrate the output side */
35723da42859SDinh Nguyen 				if (group_failed == 0)	{
35733da42859SDinh Nguyen 					for (rank_bgn = 0, sr = 0; rank_bgn
35743da42859SDinh Nguyen 						< RW_MGR_MEM_NUMBER_OF_RANKS;
35753da42859SDinh Nguyen 						rank_bgn +=
35763da42859SDinh Nguyen 						NUM_RANKS_PER_SHADOW_REG,
35773da42859SDinh Nguyen 						++sr) {
35783da42859SDinh Nguyen 						sr_failed = 0;
35793da42859SDinh Nguyen 						if (!((STATIC_CALIB_STEPS) &
35803da42859SDinh Nguyen 						CALIB_SKIP_WRITES)) {
35813da42859SDinh Nguyen 							if ((STATIC_CALIB_STEPS)
35823da42859SDinh Nguyen 						& CALIB_SKIP_DELAY_SWEEPS) {
35833da42859SDinh Nguyen 						/* not needed in quick mode! */
35843da42859SDinh Nguyen 							} else {
35853da42859SDinh Nguyen 						/*
35863da42859SDinh Nguyen 						 * Determine if this set of
35873da42859SDinh Nguyen 						 * ranks should be skipped
35883da42859SDinh Nguyen 						 * entirely.
35893da42859SDinh Nguyen 						 */
35903da42859SDinh Nguyen 					if (!param->skip_shadow_regs[sr]) {
35913da42859SDinh Nguyen 						if (!rw_mgr_mem_calibrate_writes
35923da42859SDinh Nguyen 						(rank_bgn, write_group,
35933da42859SDinh Nguyen 						write_test_bgn)) {
35943da42859SDinh Nguyen 							sr_failed = 1;
35953da42859SDinh Nguyen 							if (!(gbl->
35963da42859SDinh Nguyen 							phy_debug_mode_flags &
35973da42859SDinh Nguyen 						PHY_DEBUG_SWEEP_ALL_GROUPS)) {
35983da42859SDinh Nguyen 								return 0;
35993da42859SDinh Nguyen 									}
36003da42859SDinh Nguyen 									}
36013da42859SDinh Nguyen 								}
36023da42859SDinh Nguyen 							}
36033da42859SDinh Nguyen 						}
36043da42859SDinh Nguyen 						if (sr_failed != 0)
36053da42859SDinh Nguyen 							group_failed = 1;
36063da42859SDinh Nguyen 					}
36073da42859SDinh Nguyen 				}
36083da42859SDinh Nguyen 
36093da42859SDinh Nguyen 				if (group_failed == 0) {
36103da42859SDinh Nguyen 					for (read_group = write_group *
36113da42859SDinh Nguyen 					RW_MGR_MEM_IF_READ_DQS_WIDTH /
36123da42859SDinh Nguyen 					RW_MGR_MEM_IF_WRITE_DQS_WIDTH,
36133da42859SDinh Nguyen 					read_test_bgn = 0;
36143da42859SDinh Nguyen 						read_group < (write_group + 1)
36153da42859SDinh Nguyen 						* RW_MGR_MEM_IF_READ_DQS_WIDTH
36163da42859SDinh Nguyen 						/ RW_MGR_MEM_IF_WRITE_DQS_WIDTH &&
36173da42859SDinh Nguyen 						group_failed == 0;
36183da42859SDinh Nguyen 						read_group++, read_test_bgn +=
36193da42859SDinh Nguyen 						RW_MGR_MEM_DQ_PER_READ_DQS) {
36203da42859SDinh Nguyen 						if (!((STATIC_CALIB_STEPS) &
36213da42859SDinh Nguyen 							CALIB_SKIP_WRITES)) {
36223da42859SDinh Nguyen 					if (!rw_mgr_mem_calibrate_vfifo_end
36233da42859SDinh Nguyen 						(read_group, read_test_bgn)) {
36243da42859SDinh Nguyen 							group_failed = 1;
36253da42859SDinh Nguyen 
36263da42859SDinh Nguyen 						if (!(gbl->phy_debug_mode_flags
36273da42859SDinh Nguyen 						& PHY_DEBUG_SWEEP_ALL_GROUPS)) {
36283da42859SDinh Nguyen 								return 0;
36293da42859SDinh Nguyen 								}
36303da42859SDinh Nguyen 							}
36313da42859SDinh Nguyen 						}
36323da42859SDinh Nguyen 					}
36333da42859SDinh Nguyen 				}
36343da42859SDinh Nguyen 
36353da42859SDinh Nguyen 				if (group_failed != 0)
36363da42859SDinh Nguyen 					failing_groups++;
36373da42859SDinh Nguyen 			}
36383da42859SDinh Nguyen 
36393da42859SDinh Nguyen 			/*
36403da42859SDinh Nguyen 			 * USER If there are any failing groups then report
36413da42859SDinh Nguyen 			 * the failure.
36423da42859SDinh Nguyen 			 */
36433da42859SDinh Nguyen 			if (failing_groups != 0)
36443da42859SDinh Nguyen 				return 0;
36453da42859SDinh Nguyen 
36463da42859SDinh Nguyen 			/* Calibrate the LFIFO */
36473da42859SDinh Nguyen 			if (!((STATIC_CALIB_STEPS) & CALIB_SKIP_LFIFO)) {
36483da42859SDinh Nguyen 				/*
36493da42859SDinh Nguyen 				 * If we're skipping groups as part of debug,
36503da42859SDinh Nguyen 				 * don't calibrate LFIFO.
36513da42859SDinh Nguyen 				 */
36523da42859SDinh Nguyen 				if (param->skip_groups == 0) {
36533da42859SDinh Nguyen 					if (!rw_mgr_mem_calibrate_lfifo())
36543da42859SDinh Nguyen 						return 0;
36553da42859SDinh Nguyen 				}
36563da42859SDinh Nguyen 			}
36573da42859SDinh Nguyen 		}
36583da42859SDinh Nguyen 	}
36593da42859SDinh Nguyen 
36603da42859SDinh Nguyen 	/*
36613da42859SDinh Nguyen 	 * Do not remove this line as it makes sure all of our decisions
36623da42859SDinh Nguyen 	 * have been applied.
36633da42859SDinh Nguyen 	 */
3664e79025a7SMarek Vasut 	addr = (u32)&sdr_scc_mgr->update;
36653da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
36663da42859SDinh Nguyen 	return 1;
36673da42859SDinh Nguyen }
36683da42859SDinh Nguyen 
36693da42859SDinh Nguyen static uint32_t run_mem_calibrate(void)
36703da42859SDinh Nguyen {
36713da42859SDinh Nguyen 	uint32_t pass;
36723da42859SDinh Nguyen 	uint32_t debug_info;
36733da42859SDinh Nguyen 	uint32_t addr;
36743da42859SDinh Nguyen 
36753da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
36763da42859SDinh Nguyen 
36773da42859SDinh Nguyen 	/* Reset pass/fail status shown on afi_cal_success/fail */
36781bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cfg->cal_status;
36793da42859SDinh Nguyen 	writel(PHY_MGR_CAL_RESET, SOCFPGA_SDR_ADDRESS + addr);
36803da42859SDinh Nguyen 
3681*c4815f76SMarek Vasut 	addr = SDR_CTRLGRP_ADDRESS;
36823da42859SDinh Nguyen 	/* stop tracking manger */
36833da42859SDinh Nguyen 	uint32_t ctrlcfg = readl(SOCFPGA_SDR_ADDRESS + addr);
36843da42859SDinh Nguyen 
3685*c4815f76SMarek Vasut 	addr = SDR_CTRLGRP_ADDRESS;
36863da42859SDinh Nguyen 	writel(ctrlcfg & 0xFFBFFFFF, SOCFPGA_SDR_ADDRESS + addr);
36873da42859SDinh Nguyen 
36883da42859SDinh Nguyen 	initialize();
36893da42859SDinh Nguyen 	rw_mgr_mem_initialize();
36903da42859SDinh Nguyen 
36913da42859SDinh Nguyen 	pass = mem_calibrate();
36923da42859SDinh Nguyen 
36933da42859SDinh Nguyen 	mem_precharge_and_activate();
36941bc6f14aSMarek Vasut 	addr = (u32)&phy_mgr_cmd->fifo_reset;
36953da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
36963da42859SDinh Nguyen 
36973da42859SDinh Nguyen 	/*
36983da42859SDinh Nguyen 	 * Handoff:
36993da42859SDinh Nguyen 	 * Don't return control of the PHY back to AFI when in debug mode.
37003da42859SDinh Nguyen 	 */
37013da42859SDinh Nguyen 	if ((gbl->phy_debug_mode_flags & PHY_DEBUG_IN_DEBUG_MODE) == 0) {
37023da42859SDinh Nguyen 		rw_mgr_mem_handoff();
37033da42859SDinh Nguyen 		/*
37043da42859SDinh Nguyen 		 * In Hard PHY this is a 2-bit control:
37053da42859SDinh Nguyen 		 * 0: AFI Mux Select
37063da42859SDinh Nguyen 		 * 1: DDIO Mux Select
37073da42859SDinh Nguyen 		 */
37081bc6f14aSMarek Vasut 		addr = (u32)&phy_mgr_cfg->mux_sel;
37093da42859SDinh Nguyen 		writel(0x2, SOCFPGA_SDR_ADDRESS + addr);
37103da42859SDinh Nguyen 	}
37113da42859SDinh Nguyen 
3712*c4815f76SMarek Vasut 	addr = SDR_CTRLGRP_ADDRESS;
37133da42859SDinh Nguyen 	writel(ctrlcfg, SOCFPGA_SDR_ADDRESS + addr);
37143da42859SDinh Nguyen 
37153da42859SDinh Nguyen 	if (pass) {
37163da42859SDinh Nguyen 		printf("%s: CALIBRATION PASSED\n", __FILE__);
37173da42859SDinh Nguyen 
37183da42859SDinh Nguyen 		gbl->fom_in /= 2;
37193da42859SDinh Nguyen 		gbl->fom_out /= 2;
37203da42859SDinh Nguyen 
37213da42859SDinh Nguyen 		if (gbl->fom_in > 0xff)
37223da42859SDinh Nguyen 			gbl->fom_in = 0xff;
37233da42859SDinh Nguyen 
37243da42859SDinh Nguyen 		if (gbl->fom_out > 0xff)
37253da42859SDinh Nguyen 			gbl->fom_out = 0xff;
37263da42859SDinh Nguyen 
37273da42859SDinh Nguyen 		/* Update the FOM in the register file */
37283da42859SDinh Nguyen 		debug_info = gbl->fom_in;
37293da42859SDinh Nguyen 		debug_info |= gbl->fom_out << 8;
3730a1c654a8SMarek Vasut 		addr = (u32)&sdr_reg_file->fom;
37313da42859SDinh Nguyen 		writel(debug_info, SOCFPGA_SDR_ADDRESS + addr);
37323da42859SDinh Nguyen 
37331bc6f14aSMarek Vasut 		addr = (u32)&phy_mgr_cfg->cal_debug_info;
37343da42859SDinh Nguyen 		writel(debug_info, SOCFPGA_SDR_ADDRESS + addr);
37351bc6f14aSMarek Vasut 		addr = (u32)&phy_mgr_cfg->cal_status;
37363da42859SDinh Nguyen 		writel(PHY_MGR_CAL_SUCCESS, SOCFPGA_SDR_ADDRESS + addr);
37373da42859SDinh Nguyen 	} else {
37383da42859SDinh Nguyen 		printf("%s: CALIBRATION FAILED\n", __FILE__);
37393da42859SDinh Nguyen 
37403da42859SDinh Nguyen 		debug_info = gbl->error_stage;
37413da42859SDinh Nguyen 		debug_info |= gbl->error_substage << 8;
37423da42859SDinh Nguyen 		debug_info |= gbl->error_group << 16;
37433da42859SDinh Nguyen 
3744a1c654a8SMarek Vasut 		addr = (u32)&sdr_reg_file->failing_stage;
37453da42859SDinh Nguyen 		writel(debug_info, SOCFPGA_SDR_ADDRESS + addr);
37461bc6f14aSMarek Vasut 		addr = (u32)&phy_mgr_cfg->cal_debug_info;
37473da42859SDinh Nguyen 		writel(debug_info, SOCFPGA_SDR_ADDRESS + addr);
37481bc6f14aSMarek Vasut 		addr = (u32)&phy_mgr_cfg->cal_status;
37493da42859SDinh Nguyen 		writel(PHY_MGR_CAL_FAIL, SOCFPGA_SDR_ADDRESS + addr);
37503da42859SDinh Nguyen 
37513da42859SDinh Nguyen 		/* Update the failing group/stage in the register file */
37523da42859SDinh Nguyen 		debug_info = gbl->error_stage;
37533da42859SDinh Nguyen 		debug_info |= gbl->error_substage << 8;
37543da42859SDinh Nguyen 		debug_info |= gbl->error_group << 16;
3755a1c654a8SMarek Vasut 		addr = (u32)&sdr_reg_file->failing_stage;
37563da42859SDinh Nguyen 		writel(debug_info, SOCFPGA_SDR_ADDRESS + addr);
37573da42859SDinh Nguyen 	}
37583da42859SDinh Nguyen 
37593da42859SDinh Nguyen 	return pass;
37603da42859SDinh Nguyen }
37613da42859SDinh Nguyen 
37623da42859SDinh Nguyen static void hc_initialize_rom_data(void)
37633da42859SDinh Nguyen {
37643da42859SDinh Nguyen 	uint32_t i;
37653da42859SDinh Nguyen 	uint32_t addr;
37663da42859SDinh Nguyen 
3767*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_INST_ROM_WRITE_OFFSET;
37683da42859SDinh Nguyen 	for (i = 0; i < ARRAY_SIZE(inst_rom_init); i++) {
37693da42859SDinh Nguyen 		uint32_t data = inst_rom_init[i];
37703da42859SDinh Nguyen 		writel(data, SOCFPGA_SDR_ADDRESS + addr + (i << 2));
37713da42859SDinh Nguyen 	}
37723da42859SDinh Nguyen 
3773*c4815f76SMarek Vasut 	addr = SDR_PHYGRP_RWMGRGRP_ADDRESS | RW_MGR_AC_ROM_WRITE_OFFSET;
37743da42859SDinh Nguyen 	for (i = 0; i < ARRAY_SIZE(ac_rom_init); i++) {
37753da42859SDinh Nguyen 		uint32_t data = ac_rom_init[i];
37763da42859SDinh Nguyen 		writel(data, SOCFPGA_SDR_ADDRESS + addr + (i << 2));
37773da42859SDinh Nguyen 	}
37783da42859SDinh Nguyen }
37793da42859SDinh Nguyen 
37803da42859SDinh Nguyen static void initialize_reg_file(void)
37813da42859SDinh Nguyen {
37823da42859SDinh Nguyen 	uint32_t addr;
37833da42859SDinh Nguyen 
37843da42859SDinh Nguyen 	/* Initialize the register file with the correct data */
3785a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->signature;
37863da42859SDinh Nguyen 	writel(REG_FILE_INIT_SEQ_SIGNATURE, SOCFPGA_SDR_ADDRESS + addr);
37873da42859SDinh Nguyen 
3788a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->debug_data_addr;
37893da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
37903da42859SDinh Nguyen 
3791a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->cur_stage;
37923da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
37933da42859SDinh Nguyen 
3794a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->fom;
37953da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
37963da42859SDinh Nguyen 
3797a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->failing_stage;
37983da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
37993da42859SDinh Nguyen 
3800a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->debug1;
38013da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
38023da42859SDinh Nguyen 
3803a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->debug2;
38043da42859SDinh Nguyen 	writel(0, SOCFPGA_SDR_ADDRESS + addr);
38053da42859SDinh Nguyen }
38063da42859SDinh Nguyen 
38073da42859SDinh Nguyen static void initialize_hps_phy(void)
38083da42859SDinh Nguyen {
38093da42859SDinh Nguyen 	uint32_t reg;
38103da42859SDinh Nguyen 	uint32_t addr;
38113da42859SDinh Nguyen 	/*
38123da42859SDinh Nguyen 	 * Tracking also gets configured here because it's in the
38133da42859SDinh Nguyen 	 * same register.
38143da42859SDinh Nguyen 	 */
38153da42859SDinh Nguyen 	uint32_t trk_sample_count = 7500;
38163da42859SDinh Nguyen 	uint32_t trk_long_idle_sample_count = (10 << 16) | 100;
38173da42859SDinh Nguyen 	/*
38183da42859SDinh Nguyen 	 * Format is number of outer loops in the 16 MSB, sample
38193da42859SDinh Nguyen 	 * count in 16 LSB.
38203da42859SDinh Nguyen 	 */
38213da42859SDinh Nguyen 
38223da42859SDinh Nguyen 	reg = 0;
38233da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_ACDELAYEN_SET(2);
38243da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_DQDELAYEN_SET(1);
38253da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_DQSDELAYEN_SET(1);
38263da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_DQSLOGICDELAYEN_SET(1);
38273da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_RESETDELAYEN_SET(0);
38283da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_LPDDRDIS_SET(1);
38293da42859SDinh Nguyen 	/*
38303da42859SDinh Nguyen 	 * This field selects the intrinsic latency to RDATA_EN/FULL path.
38313da42859SDinh Nguyen 	 * 00-bypass, 01- add 5 cycles, 10- add 10 cycles, 11- add 15 cycles.
38323da42859SDinh Nguyen 	 */
38333da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_ADDLATSEL_SET(0);
38343da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_SAMPLECOUNT_19_0_SET(
38353da42859SDinh Nguyen 		trk_sample_count);
3836*c4815f76SMarek Vasut 	addr = SDR_CTRLGRP_ADDRESS;
38373da42859SDinh Nguyen 	writel(reg, SOCFPGA_SDR_ADDRESS + addr + SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_OFFSET);
38383da42859SDinh Nguyen 
38393da42859SDinh Nguyen 	reg = 0;
38403da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_SAMPLECOUNT_31_20_SET(
38413da42859SDinh Nguyen 		trk_sample_count >>
38423da42859SDinh Nguyen 		SDR_CTRLGRP_PHYCTRL_PHYCTRL_0_SAMPLECOUNT_19_0_WIDTH);
38433da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_LONGIDLESAMPLECOUNT_19_0_SET(
38443da42859SDinh Nguyen 		trk_long_idle_sample_count);
38453da42859SDinh Nguyen 	writel(reg, SOCFPGA_SDR_ADDRESS + addr + SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_OFFSET);
38463da42859SDinh Nguyen 
38473da42859SDinh Nguyen 	reg = 0;
38483da42859SDinh Nguyen 	reg |= SDR_CTRLGRP_PHYCTRL_PHYCTRL_2_LONGIDLESAMPLECOUNT_31_20_SET(
38493da42859SDinh Nguyen 		trk_long_idle_sample_count >>
38503da42859SDinh Nguyen 		SDR_CTRLGRP_PHYCTRL_PHYCTRL_1_LONGIDLESAMPLECOUNT_19_0_WIDTH);
38513da42859SDinh Nguyen 	writel(reg, SOCFPGA_SDR_ADDRESS + addr + SDR_CTRLGRP_PHYCTRL_PHYCTRL_2_OFFSET);
38523da42859SDinh Nguyen }
38533da42859SDinh Nguyen 
38543da42859SDinh Nguyen static void initialize_tracking(void)
38553da42859SDinh Nguyen {
38563da42859SDinh Nguyen 	uint32_t concatenated_longidle = 0x0;
38573da42859SDinh Nguyen 	uint32_t concatenated_delays = 0x0;
38583da42859SDinh Nguyen 	uint32_t concatenated_rw_addr = 0x0;
38593da42859SDinh Nguyen 	uint32_t concatenated_refresh = 0x0;
38603da42859SDinh Nguyen 	uint32_t trk_sample_count = 7500;
38613da42859SDinh Nguyen 	uint32_t dtaps_per_ptap;
38623da42859SDinh Nguyen 	uint32_t tmp_delay;
38633da42859SDinh Nguyen 	uint32_t addr;
38643da42859SDinh Nguyen 
38653da42859SDinh Nguyen 	/*
38663da42859SDinh Nguyen 	 * compute usable version of value in case we skip full
38673da42859SDinh Nguyen 	 * computation later
38683da42859SDinh Nguyen 	 */
38693da42859SDinh Nguyen 	dtaps_per_ptap = 0;
38703da42859SDinh Nguyen 	tmp_delay = 0;
38713da42859SDinh Nguyen 	while (tmp_delay < IO_DELAY_PER_OPA_TAP) {
38723da42859SDinh Nguyen 		dtaps_per_ptap++;
38733da42859SDinh Nguyen 		tmp_delay += IO_DELAY_PER_DCHAIN_TAP;
38743da42859SDinh Nguyen 	}
38753da42859SDinh Nguyen 	dtaps_per_ptap--;
38763da42859SDinh Nguyen 
38773da42859SDinh Nguyen 	concatenated_longidle = concatenated_longidle ^ 10;
38783da42859SDinh Nguyen 		/*longidle outer loop */
38793da42859SDinh Nguyen 	concatenated_longidle = concatenated_longidle << 16;
38803da42859SDinh Nguyen 	concatenated_longidle = concatenated_longidle ^ 100;
38813da42859SDinh Nguyen 		/*longidle sample count */
38823da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 243;
38833da42859SDinh Nguyen 		/* trfc, worst case of 933Mhz 4Gb */
38843da42859SDinh Nguyen 	concatenated_delays = concatenated_delays << 8;
38853da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 14;
38863da42859SDinh Nguyen 		/* trcd, worst case */
38873da42859SDinh Nguyen 	concatenated_delays = concatenated_delays << 8;
38883da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 10;
38893da42859SDinh Nguyen 		/* vfifo wait */
38903da42859SDinh Nguyen 	concatenated_delays = concatenated_delays << 8;
38913da42859SDinh Nguyen 	concatenated_delays = concatenated_delays ^ 4;
38923da42859SDinh Nguyen 		/* mux delay */
38933da42859SDinh Nguyen 
38943da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_IDLE;
38953da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr << 8;
38963da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_ACTIVATE_1;
38973da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr << 8;
38983da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_SGLE_READ;
38993da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr << 8;
39003da42859SDinh Nguyen 	concatenated_rw_addr = concatenated_rw_addr ^ RW_MGR_PRECHARGE_ALL;
39013da42859SDinh Nguyen 
39023da42859SDinh Nguyen 	concatenated_refresh = concatenated_refresh ^ RW_MGR_REFRESH_ALL;
39033da42859SDinh Nguyen 	concatenated_refresh = concatenated_refresh << 24;
39043da42859SDinh Nguyen 	concatenated_refresh = concatenated_refresh ^ 1000; /* trefi */
39053da42859SDinh Nguyen 
39063da42859SDinh Nguyen 	/* Initialize the register file with the correct data */
3907a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->dtaps_per_ptap;
39083da42859SDinh Nguyen 	writel(dtaps_per_ptap, SOCFPGA_SDR_ADDRESS + addr);
39093da42859SDinh Nguyen 
3910a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->trk_sample_count;
39113da42859SDinh Nguyen 	writel(trk_sample_count, SOCFPGA_SDR_ADDRESS + addr);
39123da42859SDinh Nguyen 
3913a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->trk_longidle;
39143da42859SDinh Nguyen 	writel(concatenated_longidle, SOCFPGA_SDR_ADDRESS + addr);
39153da42859SDinh Nguyen 
3916a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->delays;
39173da42859SDinh Nguyen 	writel(concatenated_delays, SOCFPGA_SDR_ADDRESS + addr);
39183da42859SDinh Nguyen 
3919a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->trk_rw_mgr_addr;
39203da42859SDinh Nguyen 	writel(concatenated_rw_addr, SOCFPGA_SDR_ADDRESS + addr);
39213da42859SDinh Nguyen 
3922a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->trk_read_dqs_width;
39233da42859SDinh Nguyen 	writel(RW_MGR_MEM_IF_READ_DQS_WIDTH, SOCFPGA_SDR_ADDRESS + addr);
39243da42859SDinh Nguyen 
3925a1c654a8SMarek Vasut 	addr = (u32)&sdr_reg_file->trk_rfsh;
39263da42859SDinh Nguyen 	writel(concatenated_refresh, SOCFPGA_SDR_ADDRESS + addr);
39273da42859SDinh Nguyen }
39283da42859SDinh Nguyen 
39293da42859SDinh Nguyen int sdram_calibration_full(void)
39303da42859SDinh Nguyen {
39313da42859SDinh Nguyen 	struct param_type my_param;
39323da42859SDinh Nguyen 	struct gbl_type my_gbl;
39333da42859SDinh Nguyen 	uint32_t pass;
39343da42859SDinh Nguyen 	uint32_t i;
39353da42859SDinh Nguyen 
39363da42859SDinh Nguyen 	param = &my_param;
39373da42859SDinh Nguyen 	gbl = &my_gbl;
39383da42859SDinh Nguyen 
39393da42859SDinh Nguyen 	/* Initialize the debug mode flags */
39403da42859SDinh Nguyen 	gbl->phy_debug_mode_flags = 0;
39413da42859SDinh Nguyen 	/* Set the calibration enabled by default */
39423da42859SDinh Nguyen 	gbl->phy_debug_mode_flags |= PHY_DEBUG_ENABLE_CAL_RPT;
39433da42859SDinh Nguyen 	/*
39443da42859SDinh Nguyen 	 * Only sweep all groups (regardless of fail state) by default
39453da42859SDinh Nguyen 	 * Set enabled read test by default.
39463da42859SDinh Nguyen 	 */
39473da42859SDinh Nguyen #if DISABLE_GUARANTEED_READ
39483da42859SDinh Nguyen 	gbl->phy_debug_mode_flags |= PHY_DEBUG_DISABLE_GUARANTEED_READ;
39493da42859SDinh Nguyen #endif
39503da42859SDinh Nguyen 	/* Initialize the register file */
39513da42859SDinh Nguyen 	initialize_reg_file();
39523da42859SDinh Nguyen 
39533da42859SDinh Nguyen 	/* Initialize any PHY CSR */
39543da42859SDinh Nguyen 	initialize_hps_phy();
39553da42859SDinh Nguyen 
39563da42859SDinh Nguyen 	scc_mgr_initialize();
39573da42859SDinh Nguyen 
39583da42859SDinh Nguyen 	initialize_tracking();
39593da42859SDinh Nguyen 
39603da42859SDinh Nguyen 	/* USER Enable all ranks, groups */
39613da42859SDinh Nguyen 	for (i = 0; i < RW_MGR_MEM_NUMBER_OF_RANKS; i++)
39623da42859SDinh Nguyen 		param->skip_ranks[i] = 0;
39633da42859SDinh Nguyen 	for (i = 0; i < NUM_SHADOW_REGS; ++i)
39643da42859SDinh Nguyen 		param->skip_shadow_regs[i] = 0;
39653da42859SDinh Nguyen 	param->skip_groups = 0;
39663da42859SDinh Nguyen 
39673da42859SDinh Nguyen 	printf("%s: Preparing to start memory calibration\n", __FILE__);
39683da42859SDinh Nguyen 
39693da42859SDinh Nguyen 	debug("%s:%d\n", __func__, __LINE__);
397023f62b36SMarek Vasut 	debug_cond(DLEVEL == 1,
397123f62b36SMarek Vasut 		   "DDR3 FULL_RATE ranks=%u cs/dimm=%u dq/dqs=%u,%u vg/dqs=%u,%u ",
397223f62b36SMarek Vasut 		   RW_MGR_MEM_NUMBER_OF_RANKS, RW_MGR_MEM_NUMBER_OF_CS_PER_DIMM,
397323f62b36SMarek Vasut 		   RW_MGR_MEM_DQ_PER_READ_DQS, RW_MGR_MEM_DQ_PER_WRITE_DQS,
397423f62b36SMarek Vasut 		   RW_MGR_MEM_VIRTUAL_GROUPS_PER_READ_DQS,
397523f62b36SMarek Vasut 		   RW_MGR_MEM_VIRTUAL_GROUPS_PER_WRITE_DQS);
397623f62b36SMarek Vasut 	debug_cond(DLEVEL == 1,
397723f62b36SMarek Vasut 		   "dqs=%u,%u dq=%u dm=%u ptap_delay=%u dtap_delay=%u ",
397823f62b36SMarek Vasut 		   RW_MGR_MEM_IF_READ_DQS_WIDTH, RW_MGR_MEM_IF_WRITE_DQS_WIDTH,
397923f62b36SMarek Vasut 		   RW_MGR_MEM_DATA_WIDTH, RW_MGR_MEM_DATA_MASK_WIDTH,
398023f62b36SMarek Vasut 		   IO_DELAY_PER_OPA_TAP, IO_DELAY_PER_DCHAIN_TAP);
398123f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "dtap_dqsen_delay=%u, dll=%u",
398223f62b36SMarek Vasut 		   IO_DELAY_PER_DQS_EN_DCHAIN_TAP, IO_DLL_CHAIN_LENGTH);
398323f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "max values: en_p=%u dqdqs_p=%u en_d=%u dqs_in_d=%u ",
398423f62b36SMarek Vasut 		   IO_DQS_EN_PHASE_MAX, IO_DQDQS_OUT_PHASE_MAX,
398523f62b36SMarek Vasut 		   IO_DQS_EN_DELAY_MAX, IO_DQS_IN_DELAY_MAX);
398623f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "io_in_d=%u io_out1_d=%u io_out2_d=%u ",
398723f62b36SMarek Vasut 		   IO_IO_IN_DELAY_MAX, IO_IO_OUT1_DELAY_MAX,
398823f62b36SMarek Vasut 		   IO_IO_OUT2_DELAY_MAX);
398923f62b36SMarek Vasut 	debug_cond(DLEVEL == 1, "dqs_in_reserve=%u dqs_out_reserve=%u\n",
399023f62b36SMarek Vasut 		   IO_DQS_IN_RESERVE, IO_DQS_OUT_RESERVE);
39913da42859SDinh Nguyen 
39923da42859SDinh Nguyen 	hc_initialize_rom_data();
39933da42859SDinh Nguyen 
39943da42859SDinh Nguyen 	/* update info for sims */
39953da42859SDinh Nguyen 	reg_file_set_stage(CAL_STAGE_NIL);
39963da42859SDinh Nguyen 	reg_file_set_group(0);
39973da42859SDinh Nguyen 
39983da42859SDinh Nguyen 	/*
39993da42859SDinh Nguyen 	 * Load global needed for those actions that require
40003da42859SDinh Nguyen 	 * some dynamic calibration support.
40013da42859SDinh Nguyen 	 */
40023da42859SDinh Nguyen 	dyn_calib_steps = STATIC_CALIB_STEPS;
40033da42859SDinh Nguyen 	/*
40043da42859SDinh Nguyen 	 * Load global to allow dynamic selection of delay loop settings
40053da42859SDinh Nguyen 	 * based on calibration mode.
40063da42859SDinh Nguyen 	 */
40073da42859SDinh Nguyen 	if (!(dyn_calib_steps & CALIB_SKIP_DELAY_LOOPS))
40083da42859SDinh Nguyen 		skip_delay_mask = 0xff;
40093da42859SDinh Nguyen 	else
40103da42859SDinh Nguyen 		skip_delay_mask = 0x0;
40113da42859SDinh Nguyen 
40123da42859SDinh Nguyen 	pass = run_mem_calibrate();
40133da42859SDinh Nguyen 
40143da42859SDinh Nguyen 	printf("%s: Calibration complete\n", __FILE__);
40153da42859SDinh Nguyen 	return pass;
40163da42859SDinh Nguyen }
4017