1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * linux/arch/arm/mach-sa1100/cpu-sa1110.c
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright (C) 2001 Russell King
6*4882a593Smuzhiyun *
7*4882a593Smuzhiyun * Note: there are two erratas that apply to the SA1110 here:
8*4882a593Smuzhiyun * 7 - SDRAM auto-power-up failure (rev A0)
9*4882a593Smuzhiyun * 13 - Corruption of internal register reads/writes following
10*4882a593Smuzhiyun * SDRAM reads (rev A0, B0, B1)
11*4882a593Smuzhiyun *
12*4882a593Smuzhiyun * We ignore rev. A0 and B0 devices; I don't think they're worth supporting.
13*4882a593Smuzhiyun *
14*4882a593Smuzhiyun * The SDRAM type can be passed on the command line as cpu_sa1110.sdram=type
15*4882a593Smuzhiyun */
16*4882a593Smuzhiyun #include <linux/cpufreq.h>
17*4882a593Smuzhiyun #include <linux/delay.h>
18*4882a593Smuzhiyun #include <linux/init.h>
19*4882a593Smuzhiyun #include <linux/io.h>
20*4882a593Smuzhiyun #include <linux/kernel.h>
21*4882a593Smuzhiyun #include <linux/moduleparam.h>
22*4882a593Smuzhiyun #include <linux/types.h>
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun #include <asm/cputype.h>
25*4882a593Smuzhiyun #include <asm/mach-types.h>
26*4882a593Smuzhiyun
27*4882a593Smuzhiyun #include <mach/generic.h>
28*4882a593Smuzhiyun #include <mach/hardware.h>
29*4882a593Smuzhiyun
30*4882a593Smuzhiyun #undef DEBUG
31*4882a593Smuzhiyun
32*4882a593Smuzhiyun struct sdram_params {
33*4882a593Smuzhiyun const char name[20];
34*4882a593Smuzhiyun u_char rows; /* bits */
35*4882a593Smuzhiyun u_char cas_latency; /* cycles */
36*4882a593Smuzhiyun u_char tck; /* clock cycle time (ns) */
37*4882a593Smuzhiyun u_char trcd; /* activate to r/w (ns) */
38*4882a593Smuzhiyun u_char trp; /* precharge to activate (ns) */
39*4882a593Smuzhiyun u_char twr; /* write recovery time (ns) */
40*4882a593Smuzhiyun u_short refresh; /* refresh time for array (us) */
41*4882a593Smuzhiyun };
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun struct sdram_info {
44*4882a593Smuzhiyun u_int mdcnfg;
45*4882a593Smuzhiyun u_int mdrefr;
46*4882a593Smuzhiyun u_int mdcas[3];
47*4882a593Smuzhiyun };
48*4882a593Smuzhiyun
49*4882a593Smuzhiyun static struct sdram_params sdram_tbl[] __initdata = {
50*4882a593Smuzhiyun { /* Toshiba TC59SM716 CL2 */
51*4882a593Smuzhiyun .name = "TC59SM716-CL2",
52*4882a593Smuzhiyun .rows = 12,
53*4882a593Smuzhiyun .tck = 10,
54*4882a593Smuzhiyun .trcd = 20,
55*4882a593Smuzhiyun .trp = 20,
56*4882a593Smuzhiyun .twr = 10,
57*4882a593Smuzhiyun .refresh = 64000,
58*4882a593Smuzhiyun .cas_latency = 2,
59*4882a593Smuzhiyun }, { /* Toshiba TC59SM716 CL3 */
60*4882a593Smuzhiyun .name = "TC59SM716-CL3",
61*4882a593Smuzhiyun .rows = 12,
62*4882a593Smuzhiyun .tck = 8,
63*4882a593Smuzhiyun .trcd = 20,
64*4882a593Smuzhiyun .trp = 20,
65*4882a593Smuzhiyun .twr = 8,
66*4882a593Smuzhiyun .refresh = 64000,
67*4882a593Smuzhiyun .cas_latency = 3,
68*4882a593Smuzhiyun }, { /* Samsung K4S641632D TC75 */
69*4882a593Smuzhiyun .name = "K4S641632D",
70*4882a593Smuzhiyun .rows = 14,
71*4882a593Smuzhiyun .tck = 9,
72*4882a593Smuzhiyun .trcd = 27,
73*4882a593Smuzhiyun .trp = 20,
74*4882a593Smuzhiyun .twr = 9,
75*4882a593Smuzhiyun .refresh = 64000,
76*4882a593Smuzhiyun .cas_latency = 3,
77*4882a593Smuzhiyun }, { /* Samsung K4S281632B-1H */
78*4882a593Smuzhiyun .name = "K4S281632B-1H",
79*4882a593Smuzhiyun .rows = 12,
80*4882a593Smuzhiyun .tck = 10,
81*4882a593Smuzhiyun .trp = 20,
82*4882a593Smuzhiyun .twr = 10,
83*4882a593Smuzhiyun .refresh = 64000,
84*4882a593Smuzhiyun .cas_latency = 3,
85*4882a593Smuzhiyun }, { /* Samsung KM416S4030CT */
86*4882a593Smuzhiyun .name = "KM416S4030CT",
87*4882a593Smuzhiyun .rows = 13,
88*4882a593Smuzhiyun .tck = 8,
89*4882a593Smuzhiyun .trcd = 24, /* 3 CLKs */
90*4882a593Smuzhiyun .trp = 24, /* 3 CLKs */
91*4882a593Smuzhiyun .twr = 16, /* Trdl: 2 CLKs */
92*4882a593Smuzhiyun .refresh = 64000,
93*4882a593Smuzhiyun .cas_latency = 3,
94*4882a593Smuzhiyun }, { /* Winbond W982516AH75L CL3 */
95*4882a593Smuzhiyun .name = "W982516AH75L",
96*4882a593Smuzhiyun .rows = 16,
97*4882a593Smuzhiyun .tck = 8,
98*4882a593Smuzhiyun .trcd = 20,
99*4882a593Smuzhiyun .trp = 20,
100*4882a593Smuzhiyun .twr = 8,
101*4882a593Smuzhiyun .refresh = 64000,
102*4882a593Smuzhiyun .cas_latency = 3,
103*4882a593Smuzhiyun }, { /* Micron MT48LC8M16A2TG-75 */
104*4882a593Smuzhiyun .name = "MT48LC8M16A2TG-75",
105*4882a593Smuzhiyun .rows = 12,
106*4882a593Smuzhiyun .tck = 8,
107*4882a593Smuzhiyun .trcd = 20,
108*4882a593Smuzhiyun .trp = 20,
109*4882a593Smuzhiyun .twr = 8,
110*4882a593Smuzhiyun .refresh = 64000,
111*4882a593Smuzhiyun .cas_latency = 3,
112*4882a593Smuzhiyun },
113*4882a593Smuzhiyun };
114*4882a593Smuzhiyun
115*4882a593Smuzhiyun static struct sdram_params sdram_params;
116*4882a593Smuzhiyun
117*4882a593Smuzhiyun /*
118*4882a593Smuzhiyun * Given a period in ns and frequency in khz, calculate the number of
119*4882a593Smuzhiyun * cycles of frequency in period. Note that we round up to the next
120*4882a593Smuzhiyun * cycle, even if we are only slightly over.
121*4882a593Smuzhiyun */
ns_to_cycles(u_int ns,u_int khz)122*4882a593Smuzhiyun static inline u_int ns_to_cycles(u_int ns, u_int khz)
123*4882a593Smuzhiyun {
124*4882a593Smuzhiyun return (ns * khz + 999999) / 1000000;
125*4882a593Smuzhiyun }
126*4882a593Smuzhiyun
127*4882a593Smuzhiyun /*
128*4882a593Smuzhiyun * Create the MDCAS register bit pattern.
129*4882a593Smuzhiyun */
set_mdcas(u_int * mdcas,int delayed,u_int rcd)130*4882a593Smuzhiyun static inline void set_mdcas(u_int *mdcas, int delayed, u_int rcd)
131*4882a593Smuzhiyun {
132*4882a593Smuzhiyun u_int shift;
133*4882a593Smuzhiyun
134*4882a593Smuzhiyun rcd = 2 * rcd - 1;
135*4882a593Smuzhiyun shift = delayed + 1 + rcd;
136*4882a593Smuzhiyun
137*4882a593Smuzhiyun mdcas[0] = (1 << rcd) - 1;
138*4882a593Smuzhiyun mdcas[0] |= 0x55555555 << shift;
139*4882a593Smuzhiyun mdcas[1] = mdcas[2] = 0x55555555 << (shift & 1);
140*4882a593Smuzhiyun }
141*4882a593Smuzhiyun
142*4882a593Smuzhiyun static void
sdram_calculate_timing(struct sdram_info * sd,u_int cpu_khz,struct sdram_params * sdram)143*4882a593Smuzhiyun sdram_calculate_timing(struct sdram_info *sd, u_int cpu_khz,
144*4882a593Smuzhiyun struct sdram_params *sdram)
145*4882a593Smuzhiyun {
146*4882a593Smuzhiyun u_int mem_khz, sd_khz, trp, twr;
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun mem_khz = cpu_khz / 2;
149*4882a593Smuzhiyun sd_khz = mem_khz;
150*4882a593Smuzhiyun
151*4882a593Smuzhiyun /*
152*4882a593Smuzhiyun * If SDCLK would invalidate the SDRAM timings,
153*4882a593Smuzhiyun * run SDCLK at half speed.
154*4882a593Smuzhiyun *
155*4882a593Smuzhiyun * CPU steppings prior to B2 must either run the memory at
156*4882a593Smuzhiyun * half speed or use delayed read latching (errata 13).
157*4882a593Smuzhiyun */
158*4882a593Smuzhiyun if ((ns_to_cycles(sdram->tck, sd_khz) > 1) ||
159*4882a593Smuzhiyun (read_cpuid_revision() < ARM_CPU_REV_SA1110_B2 && sd_khz < 62000))
160*4882a593Smuzhiyun sd_khz /= 2;
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun sd->mdcnfg = MDCNFG & 0x007f007f;
163*4882a593Smuzhiyun
164*4882a593Smuzhiyun twr = ns_to_cycles(sdram->twr, mem_khz);
165*4882a593Smuzhiyun
166*4882a593Smuzhiyun /* trp should always be >1 */
167*4882a593Smuzhiyun trp = ns_to_cycles(sdram->trp, mem_khz) - 1;
168*4882a593Smuzhiyun if (trp < 1)
169*4882a593Smuzhiyun trp = 1;
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun sd->mdcnfg |= trp << 8;
172*4882a593Smuzhiyun sd->mdcnfg |= trp << 24;
173*4882a593Smuzhiyun sd->mdcnfg |= sdram->cas_latency << 12;
174*4882a593Smuzhiyun sd->mdcnfg |= sdram->cas_latency << 28;
175*4882a593Smuzhiyun sd->mdcnfg |= twr << 14;
176*4882a593Smuzhiyun sd->mdcnfg |= twr << 30;
177*4882a593Smuzhiyun
178*4882a593Smuzhiyun sd->mdrefr = MDREFR & 0xffbffff0;
179*4882a593Smuzhiyun sd->mdrefr |= 7;
180*4882a593Smuzhiyun
181*4882a593Smuzhiyun if (sd_khz != mem_khz)
182*4882a593Smuzhiyun sd->mdrefr |= MDREFR_K1DB2;
183*4882a593Smuzhiyun
184*4882a593Smuzhiyun /* initial number of '1's in MDCAS + 1 */
185*4882a593Smuzhiyun set_mdcas(sd->mdcas, sd_khz >= 62000,
186*4882a593Smuzhiyun ns_to_cycles(sdram->trcd, mem_khz));
187*4882a593Smuzhiyun
188*4882a593Smuzhiyun #ifdef DEBUG
189*4882a593Smuzhiyun printk(KERN_DEBUG "MDCNFG: %08x MDREFR: %08x MDCAS0: %08x MDCAS1: %08x MDCAS2: %08x\n",
190*4882a593Smuzhiyun sd->mdcnfg, sd->mdrefr, sd->mdcas[0], sd->mdcas[1],
191*4882a593Smuzhiyun sd->mdcas[2]);
192*4882a593Smuzhiyun #endif
193*4882a593Smuzhiyun }
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun /*
196*4882a593Smuzhiyun * Set the SDRAM refresh rate.
197*4882a593Smuzhiyun */
sdram_set_refresh(u_int dri)198*4882a593Smuzhiyun static inline void sdram_set_refresh(u_int dri)
199*4882a593Smuzhiyun {
200*4882a593Smuzhiyun MDREFR = (MDREFR & 0xffff000f) | (dri << 4);
201*4882a593Smuzhiyun (void) MDREFR;
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun
204*4882a593Smuzhiyun /*
205*4882a593Smuzhiyun * Update the refresh period. We do this such that we always refresh
206*4882a593Smuzhiyun * the SDRAMs within their permissible period. The refresh period is
207*4882a593Smuzhiyun * always a multiple of the memory clock (fixed at cpu_clock / 2).
208*4882a593Smuzhiyun *
209*4882a593Smuzhiyun * FIXME: we don't currently take account of burst accesses here,
210*4882a593Smuzhiyun * but neither do Intels DM nor Angel.
211*4882a593Smuzhiyun */
212*4882a593Smuzhiyun static void
sdram_update_refresh(u_int cpu_khz,struct sdram_params * sdram)213*4882a593Smuzhiyun sdram_update_refresh(u_int cpu_khz, struct sdram_params *sdram)
214*4882a593Smuzhiyun {
215*4882a593Smuzhiyun u_int ns_row = (sdram->refresh * 1000) >> sdram->rows;
216*4882a593Smuzhiyun u_int dri = ns_to_cycles(ns_row, cpu_khz / 2) / 32;
217*4882a593Smuzhiyun
218*4882a593Smuzhiyun #ifdef DEBUG
219*4882a593Smuzhiyun mdelay(250);
220*4882a593Smuzhiyun printk(KERN_DEBUG "new dri value = %d\n", dri);
221*4882a593Smuzhiyun #endif
222*4882a593Smuzhiyun
223*4882a593Smuzhiyun sdram_set_refresh(dri);
224*4882a593Smuzhiyun }
225*4882a593Smuzhiyun
226*4882a593Smuzhiyun /*
227*4882a593Smuzhiyun * Ok, set the CPU frequency.
228*4882a593Smuzhiyun */
sa1110_target(struct cpufreq_policy * policy,unsigned int ppcr)229*4882a593Smuzhiyun static int sa1110_target(struct cpufreq_policy *policy, unsigned int ppcr)
230*4882a593Smuzhiyun {
231*4882a593Smuzhiyun struct sdram_params *sdram = &sdram_params;
232*4882a593Smuzhiyun struct sdram_info sd;
233*4882a593Smuzhiyun unsigned long flags;
234*4882a593Smuzhiyun unsigned int unused;
235*4882a593Smuzhiyun
236*4882a593Smuzhiyun sdram_calculate_timing(&sd, sa11x0_freq_table[ppcr].frequency, sdram);
237*4882a593Smuzhiyun
238*4882a593Smuzhiyun #if 0
239*4882a593Smuzhiyun /*
240*4882a593Smuzhiyun * These values are wrong according to the SA1110 documentation
241*4882a593Smuzhiyun * and errata, but they seem to work. Need to get a storage
242*4882a593Smuzhiyun * scope on to the SDRAM signals to work out why.
243*4882a593Smuzhiyun */
244*4882a593Smuzhiyun if (policy->max < 147500) {
245*4882a593Smuzhiyun sd.mdrefr |= MDREFR_K1DB2;
246*4882a593Smuzhiyun sd.mdcas[0] = 0xaaaaaa7f;
247*4882a593Smuzhiyun } else {
248*4882a593Smuzhiyun sd.mdrefr &= ~MDREFR_K1DB2;
249*4882a593Smuzhiyun sd.mdcas[0] = 0xaaaaaa9f;
250*4882a593Smuzhiyun }
251*4882a593Smuzhiyun sd.mdcas[1] = 0xaaaaaaaa;
252*4882a593Smuzhiyun sd.mdcas[2] = 0xaaaaaaaa;
253*4882a593Smuzhiyun #endif
254*4882a593Smuzhiyun
255*4882a593Smuzhiyun /*
256*4882a593Smuzhiyun * The clock could be going away for some time. Set the SDRAMs
257*4882a593Smuzhiyun * to refresh rapidly (every 64 memory clock cycles). To get
258*4882a593Smuzhiyun * through the whole array, we need to wait 262144 mclk cycles.
259*4882a593Smuzhiyun * We wait 20ms to be safe.
260*4882a593Smuzhiyun */
261*4882a593Smuzhiyun sdram_set_refresh(2);
262*4882a593Smuzhiyun if (!irqs_disabled())
263*4882a593Smuzhiyun msleep(20);
264*4882a593Smuzhiyun else
265*4882a593Smuzhiyun mdelay(20);
266*4882a593Smuzhiyun
267*4882a593Smuzhiyun /*
268*4882a593Smuzhiyun * Reprogram the DRAM timings with interrupts disabled, and
269*4882a593Smuzhiyun * ensure that we are doing this within a complete cache line.
270*4882a593Smuzhiyun * This means that we won't access SDRAM for the duration of
271*4882a593Smuzhiyun * the programming.
272*4882a593Smuzhiyun */
273*4882a593Smuzhiyun local_irq_save(flags);
274*4882a593Smuzhiyun asm("mcr p15, 0, %0, c7, c10, 4" : : "r" (0));
275*4882a593Smuzhiyun udelay(10);
276*4882a593Smuzhiyun __asm__ __volatile__("\n\
277*4882a593Smuzhiyun b 2f \n\
278*4882a593Smuzhiyun .align 5 \n\
279*4882a593Smuzhiyun 1: str %3, [%1, #0] @ MDCNFG \n\
280*4882a593Smuzhiyun str %4, [%1, #28] @ MDREFR \n\
281*4882a593Smuzhiyun str %5, [%1, #4] @ MDCAS0 \n\
282*4882a593Smuzhiyun str %6, [%1, #8] @ MDCAS1 \n\
283*4882a593Smuzhiyun str %7, [%1, #12] @ MDCAS2 \n\
284*4882a593Smuzhiyun str %8, [%2, #0] @ PPCR \n\
285*4882a593Smuzhiyun ldr %0, [%1, #0] \n\
286*4882a593Smuzhiyun b 3f \n\
287*4882a593Smuzhiyun 2: b 1b \n\
288*4882a593Smuzhiyun 3: nop \n\
289*4882a593Smuzhiyun nop"
290*4882a593Smuzhiyun : "=&r" (unused)
291*4882a593Smuzhiyun : "r" (&MDCNFG), "r" (&PPCR), "0" (sd.mdcnfg),
292*4882a593Smuzhiyun "r" (sd.mdrefr), "r" (sd.mdcas[0]),
293*4882a593Smuzhiyun "r" (sd.mdcas[1]), "r" (sd.mdcas[2]), "r" (ppcr));
294*4882a593Smuzhiyun local_irq_restore(flags);
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun /*
297*4882a593Smuzhiyun * Now, return the SDRAM refresh back to normal.
298*4882a593Smuzhiyun */
299*4882a593Smuzhiyun sdram_update_refresh(sa11x0_freq_table[ppcr].frequency, sdram);
300*4882a593Smuzhiyun
301*4882a593Smuzhiyun return 0;
302*4882a593Smuzhiyun }
303*4882a593Smuzhiyun
sa1110_cpu_init(struct cpufreq_policy * policy)304*4882a593Smuzhiyun static int __init sa1110_cpu_init(struct cpufreq_policy *policy)
305*4882a593Smuzhiyun {
306*4882a593Smuzhiyun cpufreq_generic_init(policy, sa11x0_freq_table, 0);
307*4882a593Smuzhiyun return 0;
308*4882a593Smuzhiyun }
309*4882a593Smuzhiyun
310*4882a593Smuzhiyun /* sa1110_driver needs __refdata because it must remain after init registers
311*4882a593Smuzhiyun * it with cpufreq_register_driver() */
312*4882a593Smuzhiyun static struct cpufreq_driver sa1110_driver __refdata = {
313*4882a593Smuzhiyun .flags = CPUFREQ_STICKY | CPUFREQ_NEED_INITIAL_FREQ_CHECK |
314*4882a593Smuzhiyun CPUFREQ_NO_AUTO_DYNAMIC_SWITCHING,
315*4882a593Smuzhiyun .verify = cpufreq_generic_frequency_table_verify,
316*4882a593Smuzhiyun .target_index = sa1110_target,
317*4882a593Smuzhiyun .get = sa11x0_getspeed,
318*4882a593Smuzhiyun .init = sa1110_cpu_init,
319*4882a593Smuzhiyun .name = "sa1110",
320*4882a593Smuzhiyun };
321*4882a593Smuzhiyun
sa1110_find_sdram(const char * name)322*4882a593Smuzhiyun static struct sdram_params *sa1110_find_sdram(const char *name)
323*4882a593Smuzhiyun {
324*4882a593Smuzhiyun struct sdram_params *sdram;
325*4882a593Smuzhiyun
326*4882a593Smuzhiyun for (sdram = sdram_tbl; sdram < sdram_tbl + ARRAY_SIZE(sdram_tbl);
327*4882a593Smuzhiyun sdram++)
328*4882a593Smuzhiyun if (strcmp(name, sdram->name) == 0)
329*4882a593Smuzhiyun return sdram;
330*4882a593Smuzhiyun
331*4882a593Smuzhiyun return NULL;
332*4882a593Smuzhiyun }
333*4882a593Smuzhiyun
334*4882a593Smuzhiyun static char sdram_name[16];
335*4882a593Smuzhiyun
sa1110_clk_init(void)336*4882a593Smuzhiyun static int __init sa1110_clk_init(void)
337*4882a593Smuzhiyun {
338*4882a593Smuzhiyun struct sdram_params *sdram;
339*4882a593Smuzhiyun const char *name = sdram_name;
340*4882a593Smuzhiyun
341*4882a593Smuzhiyun if (!cpu_is_sa1110())
342*4882a593Smuzhiyun return -ENODEV;
343*4882a593Smuzhiyun
344*4882a593Smuzhiyun if (!name[0]) {
345*4882a593Smuzhiyun if (machine_is_assabet())
346*4882a593Smuzhiyun name = "TC59SM716-CL3";
347*4882a593Smuzhiyun if (machine_is_pt_system3())
348*4882a593Smuzhiyun name = "K4S641632D";
349*4882a593Smuzhiyun if (machine_is_h3100())
350*4882a593Smuzhiyun name = "KM416S4030CT";
351*4882a593Smuzhiyun if (machine_is_jornada720() || machine_is_h3600())
352*4882a593Smuzhiyun name = "K4S281632B-1H";
353*4882a593Smuzhiyun if (machine_is_nanoengine())
354*4882a593Smuzhiyun name = "MT48LC8M16A2TG-75";
355*4882a593Smuzhiyun }
356*4882a593Smuzhiyun
357*4882a593Smuzhiyun sdram = sa1110_find_sdram(name);
358*4882a593Smuzhiyun if (sdram) {
359*4882a593Smuzhiyun printk(KERN_DEBUG "SDRAM: tck: %d trcd: %d trp: %d"
360*4882a593Smuzhiyun " twr: %d refresh: %d cas_latency: %d\n",
361*4882a593Smuzhiyun sdram->tck, sdram->trcd, sdram->trp,
362*4882a593Smuzhiyun sdram->twr, sdram->refresh, sdram->cas_latency);
363*4882a593Smuzhiyun
364*4882a593Smuzhiyun memcpy(&sdram_params, sdram, sizeof(sdram_params));
365*4882a593Smuzhiyun
366*4882a593Smuzhiyun return cpufreq_register_driver(&sa1110_driver);
367*4882a593Smuzhiyun }
368*4882a593Smuzhiyun
369*4882a593Smuzhiyun return 0;
370*4882a593Smuzhiyun }
371*4882a593Smuzhiyun
372*4882a593Smuzhiyun module_param_string(sdram, sdram_name, sizeof(sdram_name), 0);
373*4882a593Smuzhiyun arch_initcall(sa1110_clk_init);
374