1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * Copyright 2008 Extreme Engineering Solutions, Inc.
3*4882a593Smuzhiyun * Copyright 2008 Freescale Semiconductor, Inc.
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * SPDX-License-Identifier: GPL-2.0+
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <common.h>
9*4882a593Smuzhiyun #include <i2c.h>
10*4882a593Smuzhiyun
11*4882a593Smuzhiyun #include <fsl_ddr_sdram.h>
12*4882a593Smuzhiyun #include <fsl_ddr_dimm_params.h>
13*4882a593Smuzhiyun
get_spd(ddr2_spd_eeprom_t * spd,u8 i2c_address)14*4882a593Smuzhiyun void get_spd(ddr2_spd_eeprom_t *spd, u8 i2c_address)
15*4882a593Smuzhiyun {
16*4882a593Smuzhiyun i2c_read(i2c_address, SPD_EEPROM_OFFSET, 2, (uchar *)spd,
17*4882a593Smuzhiyun sizeof(ddr2_spd_eeprom_t));
18*4882a593Smuzhiyun }
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun /*
21*4882a593Smuzhiyun * There are four board-specific SDRAM timing parameters which must be
22*4882a593Smuzhiyun * calculated based on the particular PCB artwork. These are:
23*4882a593Smuzhiyun * 1.) CPO (Read Capture Delay)
24*4882a593Smuzhiyun * - TIMING_CFG_2 register
25*4882a593Smuzhiyun * Source: Calculation based on board trace lengths and
26*4882a593Smuzhiyun * chip-specific internal delays.
27*4882a593Smuzhiyun * 2.) WR_DATA_DELAY (Write Command to Data Strobe Delay)
28*4882a593Smuzhiyun * - TIMING_CFG_2 register
29*4882a593Smuzhiyun * Source: Calculation based on board trace lengths.
30*4882a593Smuzhiyun * Unless clock and DQ lanes are very different
31*4882a593Smuzhiyun * lengths (>2"), this should be set to the nominal value
32*4882a593Smuzhiyun * of 1/2 clock delay.
33*4882a593Smuzhiyun * 3.) CLK_ADJUST (Clock and Addr/Cmd alignment control)
34*4882a593Smuzhiyun * - DDR_SDRAM_CLK_CNTL register
35*4882a593Smuzhiyun * Source: Signal Integrity Simulations
36*4882a593Smuzhiyun * 4.) 2T Timing on Addr/Ctl
37*4882a593Smuzhiyun * - TIMING_CFG_2 register
38*4882a593Smuzhiyun * Source: Signal Integrity Simulations
39*4882a593Smuzhiyun * Usually only needed with heavy load/very high speed (>DDR2-800)
40*4882a593Smuzhiyun *
41*4882a593Smuzhiyun * ====== XPedite5370 DDR2-600 read delay calculations ======
42*4882a593Smuzhiyun *
43*4882a593Smuzhiyun * See Freescale's App Note AN2583 as refrence. This document also
44*4882a593Smuzhiyun * contains the chip-specific delays for 8548E, 8572, etc.
45*4882a593Smuzhiyun *
46*4882a593Smuzhiyun * For MPC8572E
47*4882a593Smuzhiyun * Minimum chip delay (Ch 0): 1.372ns
48*4882a593Smuzhiyun * Maximum chip delay (Ch 0): 2.914ns
49*4882a593Smuzhiyun * Minimum chip delay (Ch 1): 1.220ns
50*4882a593Smuzhiyun * Maximum chip delay (Ch 1): 2.595ns
51*4882a593Smuzhiyun *
52*4882a593Smuzhiyun * CLK adjust = 5 (from simulations) = 5/8* 3.33ns = 2080ps
53*4882a593Smuzhiyun *
54*4882a593Smuzhiyun * Minimum delay calc (Ch 0):
55*4882a593Smuzhiyun * clock prop - dram skew + min dqs prop delay + clk_adjust + min chip dly
56*4882a593Smuzhiyun * 2.3" * 180 - 400ps + 1.9" * 180 + 2080ps + 1372ps
57*4882a593Smuzhiyun * = 3808ps
58*4882a593Smuzhiyun * = 3.808ns
59*4882a593Smuzhiyun *
60*4882a593Smuzhiyun * Maximum delay calc (Ch 0):
61*4882a593Smuzhiyun * clock prop + dram skew + max dqs prop delay + clk_adjust + max chip dly
62*4882a593Smuzhiyun * 2.3" * 180 + 400ps + 2.4" * 180 + 2080ps + 2914ps
63*4882a593Smuzhiyun * = 6240ps
64*4882a593Smuzhiyun * = 6.240ns
65*4882a593Smuzhiyun *
66*4882a593Smuzhiyun * Minimum delay calc (Ch 1):
67*4882a593Smuzhiyun * clock prop - dram skew + min dqs prop delay + clk_adjust + min chip dly
68*4882a593Smuzhiyun * 1.46" * 180- 400ps + 0.7" * 180 + 2080ps + 1220ps
69*4882a593Smuzhiyun * = 3288ps
70*4882a593Smuzhiyun * = 3.288ns
71*4882a593Smuzhiyun *
72*4882a593Smuzhiyun * Maximum delay calc (Ch 1):
73*4882a593Smuzhiyun * clock prop + dram skew + max dqs prop delay + clk_adjust + min chip dly
74*4882a593Smuzhiyun * 1.46" * 180+ 400ps + 1.1" * 180 + 2080ps + 2595ps
75*4882a593Smuzhiyun * = 5536ps
76*4882a593Smuzhiyun * = 5.536ns
77*4882a593Smuzhiyun *
78*4882a593Smuzhiyun * Ch.0: 3.808ns to 6.240ns additional delay needed (pick 5ns as target)
79*4882a593Smuzhiyun * This is 1.5 clock cycles, pick CPO = READ_LAT + 3/2 (0x8)
80*4882a593Smuzhiyun * Ch.1: 3.288ns to 5.536ns additional delay needed (pick 4.4ns as target)
81*4882a593Smuzhiyun * This is 1.32 clock cycles, pick CPO = READ_LAT + 5/4 (0x7)
82*4882a593Smuzhiyun *
83*4882a593Smuzhiyun *
84*4882a593Smuzhiyun * ====== XPedite5370 DDR2-800 read delay calculations ======
85*4882a593Smuzhiyun *
86*4882a593Smuzhiyun * See Freescale's App Note AN2583 as refrence. This document also
87*4882a593Smuzhiyun * contains the chip-specific delays for 8548E, 8572, etc.
88*4882a593Smuzhiyun *
89*4882a593Smuzhiyun * For MPC8572E
90*4882a593Smuzhiyun * Minimum chip delay (Ch 0): 1.372ns
91*4882a593Smuzhiyun * Maximum chip delay (Ch 0): 2.914ns
92*4882a593Smuzhiyun * Minimum chip delay (Ch 1): 1.220ns
93*4882a593Smuzhiyun * Maximum chip delay (Ch 1): 2.595ns
94*4882a593Smuzhiyun *
95*4882a593Smuzhiyun * CLK adjust = 5 (from simulations) = 5/8* 2.5ns = 1563ps
96*4882a593Smuzhiyun *
97*4882a593Smuzhiyun * Minimum delay calc (Ch 0):
98*4882a593Smuzhiyun * clock prop - dram skew + min dqs prop delay + clk_adjust + min chip dly
99*4882a593Smuzhiyun * 2.3" * 180 - 350ps + 1.9" * 180 + 1563ps + 1372ps
100*4882a593Smuzhiyun * = 3341ps
101*4882a593Smuzhiyun * = 3.341ns
102*4882a593Smuzhiyun *
103*4882a593Smuzhiyun * Maximum delay calc (Ch 0):
104*4882a593Smuzhiyun * clock prop + dram skew + max dqs prop delay + clk_adjust + max chip dly
105*4882a593Smuzhiyun * 2.3" * 180 + 350ps + 2.4" * 180 + 1563ps + 2914ps
106*4882a593Smuzhiyun * = 5673ps
107*4882a593Smuzhiyun * = 5.673ns
108*4882a593Smuzhiyun *
109*4882a593Smuzhiyun * Minimum delay calc (Ch 1):
110*4882a593Smuzhiyun * clock prop - dram skew + min dqs prop delay + clk_adjust + min chip dly
111*4882a593Smuzhiyun * 1.46" * 180- 350ps + 0.7" * 180 + 1563ps + 1220ps
112*4882a593Smuzhiyun * = 2822ps
113*4882a593Smuzhiyun * = 2.822ns
114*4882a593Smuzhiyun *
115*4882a593Smuzhiyun * Maximum delay calc (Ch 1):
116*4882a593Smuzhiyun * clock prop + dram skew + max dqs prop delay + clk_adjust + min chip dly
117*4882a593Smuzhiyun * 1.46" * 180+ 350ps + 1.1" * 180 + 1563ps + 2595ps
118*4882a593Smuzhiyun * = 4968ps
119*4882a593Smuzhiyun * = 4.968ns
120*4882a593Smuzhiyun *
121*4882a593Smuzhiyun * Ch.0: 3.341ns to 5.673ns additional delay needed (pick 4.5ns as target)
122*4882a593Smuzhiyun * This is 1.8 clock cycles, pick CPO = READ_LAT + 7/4 (0x9)
123*4882a593Smuzhiyun * Ch.1: 2.822ns to 4.968ns additional delay needed (pick 3.9ns as target)
124*4882a593Smuzhiyun * This is 1.56 clock cycles, pick CPO = READ_LAT + 3/2 (0x8)
125*4882a593Smuzhiyun *
126*4882a593Smuzhiyun * Write latency (WR_DATA_DELAY) is calculated by doing the following:
127*4882a593Smuzhiyun *
128*4882a593Smuzhiyun * The DDR SDRAM specification requires DQS be received no sooner than
129*4882a593Smuzhiyun * 75% of an SDRAM clock period—and no later than 125% of a clock
130*4882a593Smuzhiyun * period—from the capturing clock edge of the command/address at the
131*4882a593Smuzhiyun * SDRAM.
132*4882a593Smuzhiyun *
133*4882a593Smuzhiyun * Based on the above tracelengths, the following are calculated:
134*4882a593Smuzhiyun * Ch. 0 8572 to DRAM propagation (DQ lanes) : 1.9" * 180 = 0.342ns
135*4882a593Smuzhiyun * Ch. 0 8572 to DRAM propagation (CLKs) : 2.3" * 180 = 0.414ns
136*4882a593Smuzhiyun * Ch. 1 8572 to DRAM propagation (DQ lanes) : 0.7" * 180 = 0.126ns
137*4882a593Smuzhiyun * Ch. 1 8572 to DRAM propagation (CLKs ) : 1.47" * 180 = 0.264ns
138*4882a593Smuzhiyun *
139*4882a593Smuzhiyun * Difference in arrival time CLK vs. DQS:
140*4882a593Smuzhiyun * Ch. 0 0.072ns
141*4882a593Smuzhiyun * Ch. 1 0.138ns
142*4882a593Smuzhiyun *
143*4882a593Smuzhiyun * Both of these values are much less than 25% of the clock
144*4882a593Smuzhiyun * period at DDR2-600 or DDR2-800, so no additional delay is needed over
145*4882a593Smuzhiyun * the 1/2 cycle which normally aligns the first DQS transition
146*4882a593Smuzhiyun * exactly WL (CAS latency minus one cycle) after the CAS strobe.
147*4882a593Smuzhiyun * See Figure 9-53 in MPC8572E manual: "1/2 delay" in Freescale's
148*4882a593Smuzhiyun * terminology corresponds to exactly one clock period delay after
149*4882a593Smuzhiyun * the CAS strobe. (due to the fact that the "delay" is referenced
150*4882a593Smuzhiyun * from the *falling* edge of the CLK, just after the rising edge
151*4882a593Smuzhiyun * which the CAS strobe is latched on.
152*4882a593Smuzhiyun */
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun typedef struct board_memctl_options {
155*4882a593Smuzhiyun uint16_t datarate_mhz_low;
156*4882a593Smuzhiyun uint16_t datarate_mhz_high;
157*4882a593Smuzhiyun uint8_t clk_adjust;
158*4882a593Smuzhiyun uint8_t cpo_override;
159*4882a593Smuzhiyun uint8_t write_data_delay;
160*4882a593Smuzhiyun } board_memctl_options_t;
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun static struct board_memctl_options bopts_ctrl[][2] = {
163*4882a593Smuzhiyun {
164*4882a593Smuzhiyun /* Controller 0 */
165*4882a593Smuzhiyun {
166*4882a593Smuzhiyun /* DDR2 600/667 */
167*4882a593Smuzhiyun .datarate_mhz_low = 500,
168*4882a593Smuzhiyun .datarate_mhz_high = 750,
169*4882a593Smuzhiyun .clk_adjust = 5,
170*4882a593Smuzhiyun .cpo_override = 8,
171*4882a593Smuzhiyun .write_data_delay = 2,
172*4882a593Smuzhiyun },
173*4882a593Smuzhiyun {
174*4882a593Smuzhiyun /* DDR2 800 */
175*4882a593Smuzhiyun .datarate_mhz_low = 750,
176*4882a593Smuzhiyun .datarate_mhz_high = 850,
177*4882a593Smuzhiyun .clk_adjust = 5,
178*4882a593Smuzhiyun .cpo_override = 9,
179*4882a593Smuzhiyun .write_data_delay = 2,
180*4882a593Smuzhiyun },
181*4882a593Smuzhiyun },
182*4882a593Smuzhiyun {
183*4882a593Smuzhiyun /* Controller 1 */
184*4882a593Smuzhiyun {
185*4882a593Smuzhiyun /* DDR2 600/667 */
186*4882a593Smuzhiyun .datarate_mhz_low = 500,
187*4882a593Smuzhiyun .datarate_mhz_high = 750,
188*4882a593Smuzhiyun .clk_adjust = 5,
189*4882a593Smuzhiyun .cpo_override = 7,
190*4882a593Smuzhiyun .write_data_delay = 2,
191*4882a593Smuzhiyun },
192*4882a593Smuzhiyun {
193*4882a593Smuzhiyun /* DDR2 800 */
194*4882a593Smuzhiyun .datarate_mhz_low = 750,
195*4882a593Smuzhiyun .datarate_mhz_high = 850,
196*4882a593Smuzhiyun .clk_adjust = 5,
197*4882a593Smuzhiyun .cpo_override = 8,
198*4882a593Smuzhiyun .write_data_delay = 2,
199*4882a593Smuzhiyun },
200*4882a593Smuzhiyun },
201*4882a593Smuzhiyun };
202*4882a593Smuzhiyun
fsl_ddr_board_options(memctl_options_t * popts,dimm_params_t * pdimm,unsigned int ctrl_num)203*4882a593Smuzhiyun void fsl_ddr_board_options(memctl_options_t *popts,
204*4882a593Smuzhiyun dimm_params_t *pdimm,
205*4882a593Smuzhiyun unsigned int ctrl_num)
206*4882a593Smuzhiyun {
207*4882a593Smuzhiyun struct board_memctl_options *bopts = bopts_ctrl[ctrl_num];
208*4882a593Smuzhiyun sys_info_t sysinfo;
209*4882a593Smuzhiyun int i;
210*4882a593Smuzhiyun unsigned int datarate;
211*4882a593Smuzhiyun
212*4882a593Smuzhiyun get_sys_info(&sysinfo);
213*4882a593Smuzhiyun datarate = sysinfo.freq_ddrbus / 1000 / 1000;
214*4882a593Smuzhiyun
215*4882a593Smuzhiyun for (i = 0; i < ARRAY_SIZE(bopts_ctrl[ctrl_num]); i++) {
216*4882a593Smuzhiyun if ((bopts[i].datarate_mhz_low <= datarate) &&
217*4882a593Smuzhiyun (bopts[i].datarate_mhz_high >= datarate)) {
218*4882a593Smuzhiyun debug("controller %d:\n", ctrl_num);
219*4882a593Smuzhiyun debug(" clk_adjust = %d\n", bopts[i].clk_adjust);
220*4882a593Smuzhiyun debug(" cpo = %d\n", bopts[i].cpo_override);
221*4882a593Smuzhiyun debug(" write_data_delay = %d\n",
222*4882a593Smuzhiyun bopts[i].write_data_delay);
223*4882a593Smuzhiyun popts->clk_adjust = bopts[i].clk_adjust;
224*4882a593Smuzhiyun popts->cpo_override = bopts[i].cpo_override;
225*4882a593Smuzhiyun popts->write_data_delay = bopts[i].write_data_delay;
226*4882a593Smuzhiyun }
227*4882a593Smuzhiyun }
228*4882a593Smuzhiyun
229*4882a593Smuzhiyun /*
230*4882a593Smuzhiyun * Factors to consider for half-strength driver enable:
231*4882a593Smuzhiyun * - number of DIMMs installed
232*4882a593Smuzhiyun */
233*4882a593Smuzhiyun popts->half_strength_driver_enable = 0;
234*4882a593Smuzhiyun }
235