xref: /OK3568_Linux_fs/u-boot/board/xes/xpedite537x/ddr.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * Copyright 2008 Extreme Engineering Solutions, Inc.
3*4882a593Smuzhiyun  * Copyright 2008 Freescale Semiconductor, Inc.
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * SPDX-License-Identifier:	GPL-2.0+
6*4882a593Smuzhiyun  */
7*4882a593Smuzhiyun 
8*4882a593Smuzhiyun #include <common.h>
9*4882a593Smuzhiyun #include <i2c.h>
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun #include <fsl_ddr_sdram.h>
12*4882a593Smuzhiyun #include <fsl_ddr_dimm_params.h>
13*4882a593Smuzhiyun 
get_spd(ddr2_spd_eeprom_t * spd,u8 i2c_address)14*4882a593Smuzhiyun void get_spd(ddr2_spd_eeprom_t *spd, u8 i2c_address)
15*4882a593Smuzhiyun {
16*4882a593Smuzhiyun 	i2c_read(i2c_address, SPD_EEPROM_OFFSET, 2, (uchar *)spd,
17*4882a593Smuzhiyun 		 sizeof(ddr2_spd_eeprom_t));
18*4882a593Smuzhiyun }
19*4882a593Smuzhiyun 
20*4882a593Smuzhiyun /*
21*4882a593Smuzhiyun  * There are four board-specific SDRAM timing parameters which must be
22*4882a593Smuzhiyun  * calculated based on the particular PCB artwork.  These are:
23*4882a593Smuzhiyun  *   1.) CPO (Read Capture Delay)
24*4882a593Smuzhiyun  *           - TIMING_CFG_2 register
25*4882a593Smuzhiyun  *           Source: Calculation based on board trace lengths and
26*4882a593Smuzhiyun  *                   chip-specific internal delays.
27*4882a593Smuzhiyun  *   2.) WR_DATA_DELAY (Write Command to Data Strobe Delay)
28*4882a593Smuzhiyun  *           - TIMING_CFG_2 register
29*4882a593Smuzhiyun  *           Source: Calculation based on board trace lengths.
30*4882a593Smuzhiyun  *                   Unless clock and DQ lanes are very different
31*4882a593Smuzhiyun  *                   lengths (>2"), this should be set to the nominal value
32*4882a593Smuzhiyun  *                   of 1/2 clock delay.
33*4882a593Smuzhiyun  *   3.) CLK_ADJUST (Clock and Addr/Cmd alignment control)
34*4882a593Smuzhiyun  *           - DDR_SDRAM_CLK_CNTL register
35*4882a593Smuzhiyun  *           Source: Signal Integrity Simulations
36*4882a593Smuzhiyun  *   4.) 2T Timing on Addr/Ctl
37*4882a593Smuzhiyun  *           - TIMING_CFG_2 register
38*4882a593Smuzhiyun  *           Source: Signal Integrity Simulations
39*4882a593Smuzhiyun  *           Usually only needed with heavy load/very high speed (>DDR2-800)
40*4882a593Smuzhiyun  *
41*4882a593Smuzhiyun  *     ====== XPedite5370 DDR2-600 read delay calculations ======
42*4882a593Smuzhiyun  *
43*4882a593Smuzhiyun  *     See Freescale's App Note AN2583 as refrence.  This document also
44*4882a593Smuzhiyun  *     contains the chip-specific delays for 8548E, 8572, etc.
45*4882a593Smuzhiyun  *
46*4882a593Smuzhiyun  *     For MPC8572E
47*4882a593Smuzhiyun  *     Minimum chip delay (Ch 0): 1.372ns
48*4882a593Smuzhiyun  *     Maximum chip delay (Ch 0): 2.914ns
49*4882a593Smuzhiyun  *     Minimum chip delay (Ch 1): 1.220ns
50*4882a593Smuzhiyun  *     Maximum chip delay (Ch 1): 2.595ns
51*4882a593Smuzhiyun  *
52*4882a593Smuzhiyun  *     CLK adjust = 5 (from simulations) = 5/8* 3.33ns = 2080ps
53*4882a593Smuzhiyun  *
54*4882a593Smuzhiyun  *     Minimum delay calc (Ch 0):
55*4882a593Smuzhiyun  *     clock prop - dram skew + min dqs prop delay + clk_adjust + min chip dly
56*4882a593Smuzhiyun  *     2.3" * 180 - 400ps     + 1.9" * 180         + 2080ps     + 1372ps
57*4882a593Smuzhiyun  *                                                 = 3808ps
58*4882a593Smuzhiyun  *                                                 = 3.808ns
59*4882a593Smuzhiyun  *
60*4882a593Smuzhiyun  *     Maximum delay calc (Ch 0):
61*4882a593Smuzhiyun  *     clock prop + dram skew + max dqs prop delay + clk_adjust + max chip dly
62*4882a593Smuzhiyun  *     2.3" * 180 + 400ps     + 2.4" * 180         + 2080ps     + 2914ps
63*4882a593Smuzhiyun  *                                                 = 6240ps
64*4882a593Smuzhiyun  *                                                 = 6.240ns
65*4882a593Smuzhiyun  *
66*4882a593Smuzhiyun  *     Minimum delay calc (Ch 1):
67*4882a593Smuzhiyun  *     clock prop - dram skew + min dqs prop delay + clk_adjust + min chip dly
68*4882a593Smuzhiyun  *     1.46" * 180- 400ps     + 0.7" * 180         + 2080ps     + 1220ps
69*4882a593Smuzhiyun  *                                                 = 3288ps
70*4882a593Smuzhiyun  *                                                 = 3.288ns
71*4882a593Smuzhiyun  *
72*4882a593Smuzhiyun  *     Maximum delay calc (Ch 1):
73*4882a593Smuzhiyun  *     clock prop + dram skew + max dqs prop delay + clk_adjust + min chip dly
74*4882a593Smuzhiyun  *     1.46" * 180+ 400ps     + 1.1" * 180         + 2080ps     + 2595ps
75*4882a593Smuzhiyun  *                                                 = 5536ps
76*4882a593Smuzhiyun  *                                                 = 5.536ns
77*4882a593Smuzhiyun  *
78*4882a593Smuzhiyun  *     Ch.0: 3.808ns to 6.240ns additional delay needed  (pick 5ns as target)
79*4882a593Smuzhiyun  *              This is 1.5 clock cycles, pick CPO = READ_LAT + 3/2 (0x8)
80*4882a593Smuzhiyun  *     Ch.1: 3.288ns to 5.536ns additional delay needed  (pick 4.4ns as target)
81*4882a593Smuzhiyun  *              This is 1.32 clock cycles, pick CPO = READ_LAT + 5/4 (0x7)
82*4882a593Smuzhiyun  *
83*4882a593Smuzhiyun  *
84*4882a593Smuzhiyun  *     ====== XPedite5370 DDR2-800 read delay calculations ======
85*4882a593Smuzhiyun  *
86*4882a593Smuzhiyun  *     See Freescale's App Note AN2583 as refrence.  This document also
87*4882a593Smuzhiyun  *     contains the chip-specific delays for 8548E, 8572, etc.
88*4882a593Smuzhiyun  *
89*4882a593Smuzhiyun  *     For MPC8572E
90*4882a593Smuzhiyun  *     Minimum chip delay (Ch 0): 1.372ns
91*4882a593Smuzhiyun  *     Maximum chip delay (Ch 0): 2.914ns
92*4882a593Smuzhiyun  *     Minimum chip delay (Ch 1): 1.220ns
93*4882a593Smuzhiyun  *     Maximum chip delay (Ch 1): 2.595ns
94*4882a593Smuzhiyun  *
95*4882a593Smuzhiyun  *     CLK adjust = 5 (from simulations) = 5/8* 2.5ns = 1563ps
96*4882a593Smuzhiyun  *
97*4882a593Smuzhiyun  *     Minimum delay calc (Ch 0):
98*4882a593Smuzhiyun  *     clock prop - dram skew + min dqs prop delay + clk_adjust + min chip dly
99*4882a593Smuzhiyun  *     2.3" * 180 - 350ps     + 1.9" * 180         + 1563ps     + 1372ps
100*4882a593Smuzhiyun  *                                                 = 3341ps
101*4882a593Smuzhiyun  *                                                 = 3.341ns
102*4882a593Smuzhiyun  *
103*4882a593Smuzhiyun  *     Maximum delay calc (Ch 0):
104*4882a593Smuzhiyun  *     clock prop + dram skew + max dqs prop delay + clk_adjust + max chip dly
105*4882a593Smuzhiyun  *     2.3" * 180 + 350ps     + 2.4" * 180         + 1563ps     + 2914ps
106*4882a593Smuzhiyun  *                                                 = 5673ps
107*4882a593Smuzhiyun  *                                                 = 5.673ns
108*4882a593Smuzhiyun  *
109*4882a593Smuzhiyun  *     Minimum delay calc (Ch 1):
110*4882a593Smuzhiyun  *     clock prop - dram skew + min dqs prop delay + clk_adjust + min chip dly
111*4882a593Smuzhiyun  *     1.46" * 180- 350ps     + 0.7" * 180         + 1563ps     + 1220ps
112*4882a593Smuzhiyun  *                                                 = 2822ps
113*4882a593Smuzhiyun  *                                                 = 2.822ns
114*4882a593Smuzhiyun  *
115*4882a593Smuzhiyun  *     Maximum delay calc (Ch 1):
116*4882a593Smuzhiyun  *     clock prop + dram skew + max dqs prop delay + clk_adjust + min chip dly
117*4882a593Smuzhiyun  *     1.46" * 180+ 350ps     + 1.1" * 180         + 1563ps     + 2595ps
118*4882a593Smuzhiyun  *                                                 = 4968ps
119*4882a593Smuzhiyun  *                                                 = 4.968ns
120*4882a593Smuzhiyun  *
121*4882a593Smuzhiyun  *     Ch.0: 3.341ns to 5.673ns additional delay needed  (pick 4.5ns as target)
122*4882a593Smuzhiyun  *              This is 1.8 clock cycles, pick CPO = READ_LAT + 7/4 (0x9)
123*4882a593Smuzhiyun  *     Ch.1: 2.822ns to 4.968ns additional delay needed  (pick 3.9ns as target)
124*4882a593Smuzhiyun  *              This is 1.56 clock cycles, pick CPO = READ_LAT + 3/2 (0x8)
125*4882a593Smuzhiyun  *
126*4882a593Smuzhiyun  * Write latency (WR_DATA_DELAY) is calculated by doing the following:
127*4882a593Smuzhiyun  *
128*4882a593Smuzhiyun  *      The DDR SDRAM specification requires DQS be received no sooner than
129*4882a593Smuzhiyun  *      75% of an SDRAM clock period—and no later than 125% of a clock
130*4882a593Smuzhiyun  *      period—from the capturing clock edge of the command/address at the
131*4882a593Smuzhiyun  *      SDRAM.
132*4882a593Smuzhiyun  *
133*4882a593Smuzhiyun  * Based on the above tracelengths, the following are calculated:
134*4882a593Smuzhiyun  *      Ch. 0 8572 to DRAM propagation (DQ lanes) : 1.9" * 180 =  0.342ns
135*4882a593Smuzhiyun  *      Ch. 0 8572 to DRAM propagation (CLKs) :     2.3" * 180 =  0.414ns
136*4882a593Smuzhiyun  *      Ch. 1 8572 to DRAM propagation (DQ lanes) : 0.7" * 180 =  0.126ns
137*4882a593Smuzhiyun  *      Ch. 1 8572 to DRAM propagation (CLKs   ) : 1.47" * 180 =  0.264ns
138*4882a593Smuzhiyun  *
139*4882a593Smuzhiyun  * Difference in arrival time CLK vs. DQS:
140*4882a593Smuzhiyun  *      Ch. 0 0.072ns
141*4882a593Smuzhiyun  *      Ch. 1 0.138ns
142*4882a593Smuzhiyun  *
143*4882a593Smuzhiyun  *      Both of these values are much less than 25% of the clock
144*4882a593Smuzhiyun  *      period at DDR2-600 or DDR2-800, so no additional delay is needed over
145*4882a593Smuzhiyun  *      the 1/2 cycle which normally aligns the first DQS transition
146*4882a593Smuzhiyun  *      exactly WL (CAS latency minus one cycle) after the CAS strobe.
147*4882a593Smuzhiyun  *      See Figure 9-53 in MPC8572E manual: "1/2 delay" in Freescale's
148*4882a593Smuzhiyun  *      terminology corresponds to exactly one clock period delay after
149*4882a593Smuzhiyun  *      the CAS strobe. (due to the fact that the "delay" is referenced
150*4882a593Smuzhiyun  *      from the *falling* edge of the CLK, just after the rising edge
151*4882a593Smuzhiyun  *      which the CAS strobe is latched on.
152*4882a593Smuzhiyun  */
153*4882a593Smuzhiyun 
154*4882a593Smuzhiyun typedef struct board_memctl_options {
155*4882a593Smuzhiyun 	uint16_t datarate_mhz_low;
156*4882a593Smuzhiyun 	uint16_t datarate_mhz_high;
157*4882a593Smuzhiyun 	uint8_t clk_adjust;
158*4882a593Smuzhiyun 	uint8_t cpo_override;
159*4882a593Smuzhiyun 	uint8_t write_data_delay;
160*4882a593Smuzhiyun } board_memctl_options_t;
161*4882a593Smuzhiyun 
162*4882a593Smuzhiyun static struct board_memctl_options bopts_ctrl[][2] = {
163*4882a593Smuzhiyun 	{
164*4882a593Smuzhiyun 		/* Controller 0 */
165*4882a593Smuzhiyun 		{
166*4882a593Smuzhiyun 			/* DDR2 600/667 */
167*4882a593Smuzhiyun 			.datarate_mhz_low	= 500,
168*4882a593Smuzhiyun 			.datarate_mhz_high	= 750,
169*4882a593Smuzhiyun 			.clk_adjust		= 5,
170*4882a593Smuzhiyun 			.cpo_override		= 8,
171*4882a593Smuzhiyun 			.write_data_delay	= 2,
172*4882a593Smuzhiyun 		},
173*4882a593Smuzhiyun 		{
174*4882a593Smuzhiyun 			/* DDR2 800 */
175*4882a593Smuzhiyun 			.datarate_mhz_low	= 750,
176*4882a593Smuzhiyun 			.datarate_mhz_high	= 850,
177*4882a593Smuzhiyun 			.clk_adjust		= 5,
178*4882a593Smuzhiyun 			.cpo_override		= 9,
179*4882a593Smuzhiyun 			.write_data_delay	= 2,
180*4882a593Smuzhiyun 		},
181*4882a593Smuzhiyun 	},
182*4882a593Smuzhiyun 	{
183*4882a593Smuzhiyun 		/* Controller 1 */
184*4882a593Smuzhiyun 		{
185*4882a593Smuzhiyun 			/* DDR2 600/667 */
186*4882a593Smuzhiyun 			.datarate_mhz_low	= 500,
187*4882a593Smuzhiyun 			.datarate_mhz_high	= 750,
188*4882a593Smuzhiyun 			.clk_adjust		= 5,
189*4882a593Smuzhiyun 			.cpo_override		= 7,
190*4882a593Smuzhiyun 			.write_data_delay	= 2,
191*4882a593Smuzhiyun 		},
192*4882a593Smuzhiyun 		{
193*4882a593Smuzhiyun 			/* DDR2 800 */
194*4882a593Smuzhiyun 			.datarate_mhz_low	= 750,
195*4882a593Smuzhiyun 			.datarate_mhz_high	= 850,
196*4882a593Smuzhiyun 			.clk_adjust		= 5,
197*4882a593Smuzhiyun 			.cpo_override		= 8,
198*4882a593Smuzhiyun 			.write_data_delay	= 2,
199*4882a593Smuzhiyun 		},
200*4882a593Smuzhiyun 	},
201*4882a593Smuzhiyun };
202*4882a593Smuzhiyun 
fsl_ddr_board_options(memctl_options_t * popts,dimm_params_t * pdimm,unsigned int ctrl_num)203*4882a593Smuzhiyun void fsl_ddr_board_options(memctl_options_t *popts,
204*4882a593Smuzhiyun 			   dimm_params_t *pdimm,
205*4882a593Smuzhiyun 			   unsigned int ctrl_num)
206*4882a593Smuzhiyun {
207*4882a593Smuzhiyun 	struct board_memctl_options *bopts = bopts_ctrl[ctrl_num];
208*4882a593Smuzhiyun 	sys_info_t sysinfo;
209*4882a593Smuzhiyun 	int i;
210*4882a593Smuzhiyun 	unsigned int datarate;
211*4882a593Smuzhiyun 
212*4882a593Smuzhiyun 	get_sys_info(&sysinfo);
213*4882a593Smuzhiyun 	datarate = sysinfo.freq_ddrbus / 1000 / 1000;
214*4882a593Smuzhiyun 
215*4882a593Smuzhiyun 	for (i = 0; i < ARRAY_SIZE(bopts_ctrl[ctrl_num]); i++) {
216*4882a593Smuzhiyun 		if ((bopts[i].datarate_mhz_low <= datarate) &&
217*4882a593Smuzhiyun 		    (bopts[i].datarate_mhz_high >= datarate)) {
218*4882a593Smuzhiyun 			debug("controller %d:\n", ctrl_num);
219*4882a593Smuzhiyun 			debug(" clk_adjust = %d\n", bopts[i].clk_adjust);
220*4882a593Smuzhiyun 			debug(" cpo = %d\n", bopts[i].cpo_override);
221*4882a593Smuzhiyun 			debug(" write_data_delay = %d\n",
222*4882a593Smuzhiyun 			      bopts[i].write_data_delay);
223*4882a593Smuzhiyun 			popts->clk_adjust = bopts[i].clk_adjust;
224*4882a593Smuzhiyun 			popts->cpo_override = bopts[i].cpo_override;
225*4882a593Smuzhiyun 			popts->write_data_delay = bopts[i].write_data_delay;
226*4882a593Smuzhiyun 		}
227*4882a593Smuzhiyun 	}
228*4882a593Smuzhiyun 
229*4882a593Smuzhiyun 	/*
230*4882a593Smuzhiyun 	 * Factors to consider for half-strength driver enable:
231*4882a593Smuzhiyun 	 *	- number of DIMMs installed
232*4882a593Smuzhiyun 	 */
233*4882a593Smuzhiyun 	popts->half_strength_driver_enable = 0;
234*4882a593Smuzhiyun }
235