1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Copyright (C) 2010, 2011, 2012, Lemote, Inc.
4*4882a593Smuzhiyun * Author: Chen Huacai, chenhc@lemote.com
5*4882a593Smuzhiyun */
6*4882a593Smuzhiyun
7*4882a593Smuzhiyun #include <irq.h>
8*4882a593Smuzhiyun #include <linux/init.h>
9*4882a593Smuzhiyun #include <linux/cpu.h>
10*4882a593Smuzhiyun #include <linux/sched.h>
11*4882a593Smuzhiyun #include <linux/sched/hotplug.h>
12*4882a593Smuzhiyun #include <linux/sched/task_stack.h>
13*4882a593Smuzhiyun #include <linux/smp.h>
14*4882a593Smuzhiyun #include <linux/cpufreq.h>
15*4882a593Smuzhiyun #include <linux/kexec.h>
16*4882a593Smuzhiyun #include <asm/processor.h>
17*4882a593Smuzhiyun #include <asm/time.h>
18*4882a593Smuzhiyun #include <asm/tlbflush.h>
19*4882a593Smuzhiyun #include <asm/cacheflush.h>
20*4882a593Smuzhiyun #include <loongson.h>
21*4882a593Smuzhiyun #include <loongson_regs.h>
22*4882a593Smuzhiyun #include <workarounds.h>
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun #include "smp.h"
25*4882a593Smuzhiyun
26*4882a593Smuzhiyun DEFINE_PER_CPU(int, cpu_state);
27*4882a593Smuzhiyun
28*4882a593Smuzhiyun #define LS_IPI_IRQ (MIPS_CPU_IRQ_BASE + 6)
29*4882a593Smuzhiyun
30*4882a593Smuzhiyun static void *ipi_set0_regs[16];
31*4882a593Smuzhiyun static void *ipi_clear0_regs[16];
32*4882a593Smuzhiyun static void *ipi_status0_regs[16];
33*4882a593Smuzhiyun static void *ipi_en0_regs[16];
34*4882a593Smuzhiyun static void *ipi_mailbox_buf[16];
35*4882a593Smuzhiyun static uint32_t core0_c0count[NR_CPUS];
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun /* read a 32bit value from ipi register */
38*4882a593Smuzhiyun #define loongson3_ipi_read32(addr) readl(addr)
39*4882a593Smuzhiyun /* read a 64bit value from ipi register */
40*4882a593Smuzhiyun #define loongson3_ipi_read64(addr) readq(addr)
41*4882a593Smuzhiyun /* write a 32bit value to ipi register */
42*4882a593Smuzhiyun #define loongson3_ipi_write32(action, addr) \
43*4882a593Smuzhiyun do { \
44*4882a593Smuzhiyun writel(action, addr); \
45*4882a593Smuzhiyun __wbflush(); \
46*4882a593Smuzhiyun } while (0)
47*4882a593Smuzhiyun /* write a 64bit value to ipi register */
48*4882a593Smuzhiyun #define loongson3_ipi_write64(action, addr) \
49*4882a593Smuzhiyun do { \
50*4882a593Smuzhiyun writeq(action, addr); \
51*4882a593Smuzhiyun __wbflush(); \
52*4882a593Smuzhiyun } while (0)
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun u32 (*ipi_read_clear)(int cpu);
55*4882a593Smuzhiyun void (*ipi_write_action)(int cpu, u32 action);
56*4882a593Smuzhiyun
csr_ipi_read_clear(int cpu)57*4882a593Smuzhiyun static u32 csr_ipi_read_clear(int cpu)
58*4882a593Smuzhiyun {
59*4882a593Smuzhiyun u32 action;
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun /* Load the ipi register to figure out what we're supposed to do */
62*4882a593Smuzhiyun action = csr_readl(LOONGSON_CSR_IPI_STATUS);
63*4882a593Smuzhiyun /* Clear the ipi register to clear the interrupt */
64*4882a593Smuzhiyun csr_writel(action, LOONGSON_CSR_IPI_CLEAR);
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun return action;
67*4882a593Smuzhiyun }
68*4882a593Smuzhiyun
csr_ipi_write_action(int cpu,u32 action)69*4882a593Smuzhiyun static void csr_ipi_write_action(int cpu, u32 action)
70*4882a593Smuzhiyun {
71*4882a593Smuzhiyun unsigned int irq = 0;
72*4882a593Smuzhiyun
73*4882a593Smuzhiyun while ((irq = ffs(action))) {
74*4882a593Smuzhiyun uint32_t val = CSR_IPI_SEND_BLOCK;
75*4882a593Smuzhiyun val |= (irq - 1);
76*4882a593Smuzhiyun val |= (cpu << CSR_IPI_SEND_CPU_SHIFT);
77*4882a593Smuzhiyun csr_writel(val, LOONGSON_CSR_IPI_SEND);
78*4882a593Smuzhiyun action &= ~BIT(irq - 1);
79*4882a593Smuzhiyun }
80*4882a593Smuzhiyun }
81*4882a593Smuzhiyun
legacy_ipi_read_clear(int cpu)82*4882a593Smuzhiyun static u32 legacy_ipi_read_clear(int cpu)
83*4882a593Smuzhiyun {
84*4882a593Smuzhiyun u32 action;
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun /* Load the ipi register to figure out what we're supposed to do */
87*4882a593Smuzhiyun action = loongson3_ipi_read32(ipi_status0_regs[cpu_logical_map(cpu)]);
88*4882a593Smuzhiyun /* Clear the ipi register to clear the interrupt */
89*4882a593Smuzhiyun loongson3_ipi_write32(action, ipi_clear0_regs[cpu_logical_map(cpu)]);
90*4882a593Smuzhiyun
91*4882a593Smuzhiyun return action;
92*4882a593Smuzhiyun }
93*4882a593Smuzhiyun
legacy_ipi_write_action(int cpu,u32 action)94*4882a593Smuzhiyun static void legacy_ipi_write_action(int cpu, u32 action)
95*4882a593Smuzhiyun {
96*4882a593Smuzhiyun loongson3_ipi_write32((u32)action, ipi_set0_regs[cpu]);
97*4882a593Smuzhiyun }
98*4882a593Smuzhiyun
csr_ipi_probe(void)99*4882a593Smuzhiyun static void csr_ipi_probe(void)
100*4882a593Smuzhiyun {
101*4882a593Smuzhiyun if (cpu_has_csr() && csr_readl(LOONGSON_CSR_FEATURES) & LOONGSON_CSRF_IPI) {
102*4882a593Smuzhiyun ipi_read_clear = csr_ipi_read_clear;
103*4882a593Smuzhiyun ipi_write_action = csr_ipi_write_action;
104*4882a593Smuzhiyun } else {
105*4882a593Smuzhiyun ipi_read_clear = legacy_ipi_read_clear;
106*4882a593Smuzhiyun ipi_write_action = legacy_ipi_write_action;
107*4882a593Smuzhiyun }
108*4882a593Smuzhiyun }
109*4882a593Smuzhiyun
ipi_set0_regs_init(void)110*4882a593Smuzhiyun static void ipi_set0_regs_init(void)
111*4882a593Smuzhiyun {
112*4882a593Smuzhiyun ipi_set0_regs[0] = (void *)
113*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE0_OFFSET + SET0);
114*4882a593Smuzhiyun ipi_set0_regs[1] = (void *)
115*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE1_OFFSET + SET0);
116*4882a593Smuzhiyun ipi_set0_regs[2] = (void *)
117*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE2_OFFSET + SET0);
118*4882a593Smuzhiyun ipi_set0_regs[3] = (void *)
119*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE3_OFFSET + SET0);
120*4882a593Smuzhiyun ipi_set0_regs[4] = (void *)
121*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE0_OFFSET + SET0);
122*4882a593Smuzhiyun ipi_set0_regs[5] = (void *)
123*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE1_OFFSET + SET0);
124*4882a593Smuzhiyun ipi_set0_regs[6] = (void *)
125*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE2_OFFSET + SET0);
126*4882a593Smuzhiyun ipi_set0_regs[7] = (void *)
127*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE3_OFFSET + SET0);
128*4882a593Smuzhiyun ipi_set0_regs[8] = (void *)
129*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE0_OFFSET + SET0);
130*4882a593Smuzhiyun ipi_set0_regs[9] = (void *)
131*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE1_OFFSET + SET0);
132*4882a593Smuzhiyun ipi_set0_regs[10] = (void *)
133*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE2_OFFSET + SET0);
134*4882a593Smuzhiyun ipi_set0_regs[11] = (void *)
135*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE3_OFFSET + SET0);
136*4882a593Smuzhiyun ipi_set0_regs[12] = (void *)
137*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE0_OFFSET + SET0);
138*4882a593Smuzhiyun ipi_set0_regs[13] = (void *)
139*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE1_OFFSET + SET0);
140*4882a593Smuzhiyun ipi_set0_regs[14] = (void *)
141*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE2_OFFSET + SET0);
142*4882a593Smuzhiyun ipi_set0_regs[15] = (void *)
143*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE3_OFFSET + SET0);
144*4882a593Smuzhiyun }
145*4882a593Smuzhiyun
ipi_clear0_regs_init(void)146*4882a593Smuzhiyun static void ipi_clear0_regs_init(void)
147*4882a593Smuzhiyun {
148*4882a593Smuzhiyun ipi_clear0_regs[0] = (void *)
149*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE0_OFFSET + CLEAR0);
150*4882a593Smuzhiyun ipi_clear0_regs[1] = (void *)
151*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE1_OFFSET + CLEAR0);
152*4882a593Smuzhiyun ipi_clear0_regs[2] = (void *)
153*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE2_OFFSET + CLEAR0);
154*4882a593Smuzhiyun ipi_clear0_regs[3] = (void *)
155*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE3_OFFSET + CLEAR0);
156*4882a593Smuzhiyun ipi_clear0_regs[4] = (void *)
157*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE0_OFFSET + CLEAR0);
158*4882a593Smuzhiyun ipi_clear0_regs[5] = (void *)
159*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE1_OFFSET + CLEAR0);
160*4882a593Smuzhiyun ipi_clear0_regs[6] = (void *)
161*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE2_OFFSET + CLEAR0);
162*4882a593Smuzhiyun ipi_clear0_regs[7] = (void *)
163*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE3_OFFSET + CLEAR0);
164*4882a593Smuzhiyun ipi_clear0_regs[8] = (void *)
165*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE0_OFFSET + CLEAR0);
166*4882a593Smuzhiyun ipi_clear0_regs[9] = (void *)
167*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE1_OFFSET + CLEAR0);
168*4882a593Smuzhiyun ipi_clear0_regs[10] = (void *)
169*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE2_OFFSET + CLEAR0);
170*4882a593Smuzhiyun ipi_clear0_regs[11] = (void *)
171*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE3_OFFSET + CLEAR0);
172*4882a593Smuzhiyun ipi_clear0_regs[12] = (void *)
173*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE0_OFFSET + CLEAR0);
174*4882a593Smuzhiyun ipi_clear0_regs[13] = (void *)
175*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE1_OFFSET + CLEAR0);
176*4882a593Smuzhiyun ipi_clear0_regs[14] = (void *)
177*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE2_OFFSET + CLEAR0);
178*4882a593Smuzhiyun ipi_clear0_regs[15] = (void *)
179*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE3_OFFSET + CLEAR0);
180*4882a593Smuzhiyun }
181*4882a593Smuzhiyun
ipi_status0_regs_init(void)182*4882a593Smuzhiyun static void ipi_status0_regs_init(void)
183*4882a593Smuzhiyun {
184*4882a593Smuzhiyun ipi_status0_regs[0] = (void *)
185*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE0_OFFSET + STATUS0);
186*4882a593Smuzhiyun ipi_status0_regs[1] = (void *)
187*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE1_OFFSET + STATUS0);
188*4882a593Smuzhiyun ipi_status0_regs[2] = (void *)
189*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE2_OFFSET + STATUS0);
190*4882a593Smuzhiyun ipi_status0_regs[3] = (void *)
191*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE3_OFFSET + STATUS0);
192*4882a593Smuzhiyun ipi_status0_regs[4] = (void *)
193*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE0_OFFSET + STATUS0);
194*4882a593Smuzhiyun ipi_status0_regs[5] = (void *)
195*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE1_OFFSET + STATUS0);
196*4882a593Smuzhiyun ipi_status0_regs[6] = (void *)
197*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE2_OFFSET + STATUS0);
198*4882a593Smuzhiyun ipi_status0_regs[7] = (void *)
199*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE3_OFFSET + STATUS0);
200*4882a593Smuzhiyun ipi_status0_regs[8] = (void *)
201*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE0_OFFSET + STATUS0);
202*4882a593Smuzhiyun ipi_status0_regs[9] = (void *)
203*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE1_OFFSET + STATUS0);
204*4882a593Smuzhiyun ipi_status0_regs[10] = (void *)
205*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE2_OFFSET + STATUS0);
206*4882a593Smuzhiyun ipi_status0_regs[11] = (void *)
207*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE3_OFFSET + STATUS0);
208*4882a593Smuzhiyun ipi_status0_regs[12] = (void *)
209*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE0_OFFSET + STATUS0);
210*4882a593Smuzhiyun ipi_status0_regs[13] = (void *)
211*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE1_OFFSET + STATUS0);
212*4882a593Smuzhiyun ipi_status0_regs[14] = (void *)
213*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE2_OFFSET + STATUS0);
214*4882a593Smuzhiyun ipi_status0_regs[15] = (void *)
215*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE3_OFFSET + STATUS0);
216*4882a593Smuzhiyun }
217*4882a593Smuzhiyun
ipi_en0_regs_init(void)218*4882a593Smuzhiyun static void ipi_en0_regs_init(void)
219*4882a593Smuzhiyun {
220*4882a593Smuzhiyun ipi_en0_regs[0] = (void *)
221*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE0_OFFSET + EN0);
222*4882a593Smuzhiyun ipi_en0_regs[1] = (void *)
223*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE1_OFFSET + EN0);
224*4882a593Smuzhiyun ipi_en0_regs[2] = (void *)
225*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE2_OFFSET + EN0);
226*4882a593Smuzhiyun ipi_en0_regs[3] = (void *)
227*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE3_OFFSET + EN0);
228*4882a593Smuzhiyun ipi_en0_regs[4] = (void *)
229*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE0_OFFSET + EN0);
230*4882a593Smuzhiyun ipi_en0_regs[5] = (void *)
231*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE1_OFFSET + EN0);
232*4882a593Smuzhiyun ipi_en0_regs[6] = (void *)
233*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE2_OFFSET + EN0);
234*4882a593Smuzhiyun ipi_en0_regs[7] = (void *)
235*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE3_OFFSET + EN0);
236*4882a593Smuzhiyun ipi_en0_regs[8] = (void *)
237*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE0_OFFSET + EN0);
238*4882a593Smuzhiyun ipi_en0_regs[9] = (void *)
239*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE1_OFFSET + EN0);
240*4882a593Smuzhiyun ipi_en0_regs[10] = (void *)
241*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE2_OFFSET + EN0);
242*4882a593Smuzhiyun ipi_en0_regs[11] = (void *)
243*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE3_OFFSET + EN0);
244*4882a593Smuzhiyun ipi_en0_regs[12] = (void *)
245*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE0_OFFSET + EN0);
246*4882a593Smuzhiyun ipi_en0_regs[13] = (void *)
247*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE1_OFFSET + EN0);
248*4882a593Smuzhiyun ipi_en0_regs[14] = (void *)
249*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE2_OFFSET + EN0);
250*4882a593Smuzhiyun ipi_en0_regs[15] = (void *)
251*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE3_OFFSET + EN0);
252*4882a593Smuzhiyun }
253*4882a593Smuzhiyun
ipi_mailbox_buf_init(void)254*4882a593Smuzhiyun static void ipi_mailbox_buf_init(void)
255*4882a593Smuzhiyun {
256*4882a593Smuzhiyun ipi_mailbox_buf[0] = (void *)
257*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE0_OFFSET + BUF);
258*4882a593Smuzhiyun ipi_mailbox_buf[1] = (void *)
259*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE1_OFFSET + BUF);
260*4882a593Smuzhiyun ipi_mailbox_buf[2] = (void *)
261*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE2_OFFSET + BUF);
262*4882a593Smuzhiyun ipi_mailbox_buf[3] = (void *)
263*4882a593Smuzhiyun (SMP_CORE_GROUP0_BASE + SMP_CORE3_OFFSET + BUF);
264*4882a593Smuzhiyun ipi_mailbox_buf[4] = (void *)
265*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE0_OFFSET + BUF);
266*4882a593Smuzhiyun ipi_mailbox_buf[5] = (void *)
267*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE1_OFFSET + BUF);
268*4882a593Smuzhiyun ipi_mailbox_buf[6] = (void *)
269*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE2_OFFSET + BUF);
270*4882a593Smuzhiyun ipi_mailbox_buf[7] = (void *)
271*4882a593Smuzhiyun (SMP_CORE_GROUP1_BASE + SMP_CORE3_OFFSET + BUF);
272*4882a593Smuzhiyun ipi_mailbox_buf[8] = (void *)
273*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE0_OFFSET + BUF);
274*4882a593Smuzhiyun ipi_mailbox_buf[9] = (void *)
275*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE1_OFFSET + BUF);
276*4882a593Smuzhiyun ipi_mailbox_buf[10] = (void *)
277*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE2_OFFSET + BUF);
278*4882a593Smuzhiyun ipi_mailbox_buf[11] = (void *)
279*4882a593Smuzhiyun (SMP_CORE_GROUP2_BASE + SMP_CORE3_OFFSET + BUF);
280*4882a593Smuzhiyun ipi_mailbox_buf[12] = (void *)
281*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE0_OFFSET + BUF);
282*4882a593Smuzhiyun ipi_mailbox_buf[13] = (void *)
283*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE1_OFFSET + BUF);
284*4882a593Smuzhiyun ipi_mailbox_buf[14] = (void *)
285*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE2_OFFSET + BUF);
286*4882a593Smuzhiyun ipi_mailbox_buf[15] = (void *)
287*4882a593Smuzhiyun (SMP_CORE_GROUP3_BASE + SMP_CORE3_OFFSET + BUF);
288*4882a593Smuzhiyun }
289*4882a593Smuzhiyun
290*4882a593Smuzhiyun /*
291*4882a593Smuzhiyun * Simple enough, just poke the appropriate ipi register
292*4882a593Smuzhiyun */
loongson3_send_ipi_single(int cpu,unsigned int action)293*4882a593Smuzhiyun static void loongson3_send_ipi_single(int cpu, unsigned int action)
294*4882a593Smuzhiyun {
295*4882a593Smuzhiyun ipi_write_action(cpu_logical_map(cpu), (u32)action);
296*4882a593Smuzhiyun }
297*4882a593Smuzhiyun
298*4882a593Smuzhiyun static void
loongson3_send_ipi_mask(const struct cpumask * mask,unsigned int action)299*4882a593Smuzhiyun loongson3_send_ipi_mask(const struct cpumask *mask, unsigned int action)
300*4882a593Smuzhiyun {
301*4882a593Smuzhiyun unsigned int i;
302*4882a593Smuzhiyun
303*4882a593Smuzhiyun for_each_cpu(i, mask)
304*4882a593Smuzhiyun ipi_write_action(cpu_logical_map(i), (u32)action);
305*4882a593Smuzhiyun }
306*4882a593Smuzhiyun
307*4882a593Smuzhiyun
loongson3_ipi_interrupt(int irq,void * dev_id)308*4882a593Smuzhiyun static irqreturn_t loongson3_ipi_interrupt(int irq, void *dev_id)
309*4882a593Smuzhiyun {
310*4882a593Smuzhiyun int i, cpu = smp_processor_id();
311*4882a593Smuzhiyun unsigned int action, c0count;
312*4882a593Smuzhiyun
313*4882a593Smuzhiyun action = ipi_read_clear(cpu);
314*4882a593Smuzhiyun
315*4882a593Smuzhiyun if (action & SMP_RESCHEDULE_YOURSELF)
316*4882a593Smuzhiyun scheduler_ipi();
317*4882a593Smuzhiyun
318*4882a593Smuzhiyun if (action & SMP_CALL_FUNCTION) {
319*4882a593Smuzhiyun irq_enter();
320*4882a593Smuzhiyun generic_smp_call_function_interrupt();
321*4882a593Smuzhiyun irq_exit();
322*4882a593Smuzhiyun }
323*4882a593Smuzhiyun
324*4882a593Smuzhiyun if (action & SMP_ASK_C0COUNT) {
325*4882a593Smuzhiyun BUG_ON(cpu != 0);
326*4882a593Smuzhiyun c0count = read_c0_count();
327*4882a593Smuzhiyun c0count = c0count ? c0count : 1;
328*4882a593Smuzhiyun for (i = 1; i < nr_cpu_ids; i++)
329*4882a593Smuzhiyun core0_c0count[i] = c0count;
330*4882a593Smuzhiyun __wbflush(); /* Let others see the result ASAP */
331*4882a593Smuzhiyun }
332*4882a593Smuzhiyun
333*4882a593Smuzhiyun return IRQ_HANDLED;
334*4882a593Smuzhiyun }
335*4882a593Smuzhiyun
336*4882a593Smuzhiyun #define MAX_LOOPS 800
337*4882a593Smuzhiyun /*
338*4882a593Smuzhiyun * SMP init and finish on secondary CPUs
339*4882a593Smuzhiyun */
loongson3_init_secondary(void)340*4882a593Smuzhiyun static void loongson3_init_secondary(void)
341*4882a593Smuzhiyun {
342*4882a593Smuzhiyun int i;
343*4882a593Smuzhiyun uint32_t initcount;
344*4882a593Smuzhiyun unsigned int cpu = smp_processor_id();
345*4882a593Smuzhiyun unsigned int imask = STATUSF_IP7 | STATUSF_IP6 |
346*4882a593Smuzhiyun STATUSF_IP3 | STATUSF_IP2;
347*4882a593Smuzhiyun
348*4882a593Smuzhiyun /* Set interrupt mask, but don't enable */
349*4882a593Smuzhiyun change_c0_status(ST0_IM, imask);
350*4882a593Smuzhiyun
351*4882a593Smuzhiyun for (i = 0; i < num_possible_cpus(); i++)
352*4882a593Smuzhiyun loongson3_ipi_write32(0xffffffff, ipi_en0_regs[cpu_logical_map(i)]);
353*4882a593Smuzhiyun
354*4882a593Smuzhiyun per_cpu(cpu_state, cpu) = CPU_ONLINE;
355*4882a593Smuzhiyun cpu_set_core(&cpu_data[cpu],
356*4882a593Smuzhiyun cpu_logical_map(cpu) % loongson_sysconf.cores_per_package);
357*4882a593Smuzhiyun cpu_data[cpu].package =
358*4882a593Smuzhiyun cpu_logical_map(cpu) / loongson_sysconf.cores_per_package;
359*4882a593Smuzhiyun
360*4882a593Smuzhiyun i = 0;
361*4882a593Smuzhiyun core0_c0count[cpu] = 0;
362*4882a593Smuzhiyun loongson3_send_ipi_single(0, SMP_ASK_C0COUNT);
363*4882a593Smuzhiyun while (!core0_c0count[cpu]) {
364*4882a593Smuzhiyun i++;
365*4882a593Smuzhiyun cpu_relax();
366*4882a593Smuzhiyun }
367*4882a593Smuzhiyun
368*4882a593Smuzhiyun if (i > MAX_LOOPS)
369*4882a593Smuzhiyun i = MAX_LOOPS;
370*4882a593Smuzhiyun if (cpu_data[cpu].package)
371*4882a593Smuzhiyun initcount = core0_c0count[cpu] + i;
372*4882a593Smuzhiyun else /* Local access is faster for loops */
373*4882a593Smuzhiyun initcount = core0_c0count[cpu] + i/2;
374*4882a593Smuzhiyun
375*4882a593Smuzhiyun write_c0_count(initcount);
376*4882a593Smuzhiyun }
377*4882a593Smuzhiyun
loongson3_smp_finish(void)378*4882a593Smuzhiyun static void loongson3_smp_finish(void)
379*4882a593Smuzhiyun {
380*4882a593Smuzhiyun int cpu = smp_processor_id();
381*4882a593Smuzhiyun
382*4882a593Smuzhiyun write_c0_compare(read_c0_count() + mips_hpt_frequency/HZ);
383*4882a593Smuzhiyun local_irq_enable();
384*4882a593Smuzhiyun loongson3_ipi_write64(0,
385*4882a593Smuzhiyun ipi_mailbox_buf[cpu_logical_map(cpu)] + 0x0);
386*4882a593Smuzhiyun pr_info("CPU#%d finished, CP0_ST=%x\n",
387*4882a593Smuzhiyun smp_processor_id(), read_c0_status());
388*4882a593Smuzhiyun }
389*4882a593Smuzhiyun
loongson3_smp_setup(void)390*4882a593Smuzhiyun static void __init loongson3_smp_setup(void)
391*4882a593Smuzhiyun {
392*4882a593Smuzhiyun int i = 0, num = 0; /* i: physical id, num: logical id */
393*4882a593Smuzhiyun
394*4882a593Smuzhiyun init_cpu_possible(cpu_none_mask);
395*4882a593Smuzhiyun
396*4882a593Smuzhiyun /* For unified kernel, NR_CPUS is the maximum possible value,
397*4882a593Smuzhiyun * loongson_sysconf.nr_cpus is the really present value */
398*4882a593Smuzhiyun while (i < loongson_sysconf.nr_cpus) {
399*4882a593Smuzhiyun if (loongson_sysconf.reserved_cpus_mask & (1<<i)) {
400*4882a593Smuzhiyun /* Reserved physical CPU cores */
401*4882a593Smuzhiyun __cpu_number_map[i] = -1;
402*4882a593Smuzhiyun } else {
403*4882a593Smuzhiyun __cpu_number_map[i] = num;
404*4882a593Smuzhiyun __cpu_logical_map[num] = i;
405*4882a593Smuzhiyun set_cpu_possible(num, true);
406*4882a593Smuzhiyun num++;
407*4882a593Smuzhiyun }
408*4882a593Smuzhiyun i++;
409*4882a593Smuzhiyun }
410*4882a593Smuzhiyun pr_info("Detected %i available CPU(s)\n", num);
411*4882a593Smuzhiyun
412*4882a593Smuzhiyun while (num < loongson_sysconf.nr_cpus) {
413*4882a593Smuzhiyun __cpu_logical_map[num] = -1;
414*4882a593Smuzhiyun num++;
415*4882a593Smuzhiyun }
416*4882a593Smuzhiyun
417*4882a593Smuzhiyun csr_ipi_probe();
418*4882a593Smuzhiyun ipi_set0_regs_init();
419*4882a593Smuzhiyun ipi_clear0_regs_init();
420*4882a593Smuzhiyun ipi_status0_regs_init();
421*4882a593Smuzhiyun ipi_en0_regs_init();
422*4882a593Smuzhiyun ipi_mailbox_buf_init();
423*4882a593Smuzhiyun cpu_set_core(&cpu_data[0],
424*4882a593Smuzhiyun cpu_logical_map(0) % loongson_sysconf.cores_per_package);
425*4882a593Smuzhiyun cpu_data[0].package = cpu_logical_map(0) / loongson_sysconf.cores_per_package;
426*4882a593Smuzhiyun }
427*4882a593Smuzhiyun
loongson3_prepare_cpus(unsigned int max_cpus)428*4882a593Smuzhiyun static void __init loongson3_prepare_cpus(unsigned int max_cpus)
429*4882a593Smuzhiyun {
430*4882a593Smuzhiyun if (request_irq(LS_IPI_IRQ, loongson3_ipi_interrupt,
431*4882a593Smuzhiyun IRQF_PERCPU | IRQF_NO_SUSPEND, "SMP_IPI", NULL))
432*4882a593Smuzhiyun pr_err("Failed to request IPI IRQ\n");
433*4882a593Smuzhiyun init_cpu_present(cpu_possible_mask);
434*4882a593Smuzhiyun per_cpu(cpu_state, smp_processor_id()) = CPU_ONLINE;
435*4882a593Smuzhiyun }
436*4882a593Smuzhiyun
437*4882a593Smuzhiyun /*
438*4882a593Smuzhiyun * Setup the PC, SP, and GP of a secondary processor and start it runing!
439*4882a593Smuzhiyun */
loongson3_boot_secondary(int cpu,struct task_struct * idle)440*4882a593Smuzhiyun static int loongson3_boot_secondary(int cpu, struct task_struct *idle)
441*4882a593Smuzhiyun {
442*4882a593Smuzhiyun unsigned long startargs[4];
443*4882a593Smuzhiyun
444*4882a593Smuzhiyun pr_info("Booting CPU#%d...\n", cpu);
445*4882a593Smuzhiyun
446*4882a593Smuzhiyun /* startargs[] are initial PC, SP and GP for secondary CPU */
447*4882a593Smuzhiyun startargs[0] = (unsigned long)&smp_bootstrap;
448*4882a593Smuzhiyun startargs[1] = (unsigned long)__KSTK_TOS(idle);
449*4882a593Smuzhiyun startargs[2] = (unsigned long)task_thread_info(idle);
450*4882a593Smuzhiyun startargs[3] = 0;
451*4882a593Smuzhiyun
452*4882a593Smuzhiyun pr_debug("CPU#%d, func_pc=%lx, sp=%lx, gp=%lx\n",
453*4882a593Smuzhiyun cpu, startargs[0], startargs[1], startargs[2]);
454*4882a593Smuzhiyun
455*4882a593Smuzhiyun loongson3_ipi_write64(startargs[3],
456*4882a593Smuzhiyun ipi_mailbox_buf[cpu_logical_map(cpu)] + 0x18);
457*4882a593Smuzhiyun loongson3_ipi_write64(startargs[2],
458*4882a593Smuzhiyun ipi_mailbox_buf[cpu_logical_map(cpu)] + 0x10);
459*4882a593Smuzhiyun loongson3_ipi_write64(startargs[1],
460*4882a593Smuzhiyun ipi_mailbox_buf[cpu_logical_map(cpu)] + 0x8);
461*4882a593Smuzhiyun loongson3_ipi_write64(startargs[0],
462*4882a593Smuzhiyun ipi_mailbox_buf[cpu_logical_map(cpu)] + 0x0);
463*4882a593Smuzhiyun return 0;
464*4882a593Smuzhiyun }
465*4882a593Smuzhiyun
466*4882a593Smuzhiyun #ifdef CONFIG_HOTPLUG_CPU
467*4882a593Smuzhiyun
loongson3_cpu_disable(void)468*4882a593Smuzhiyun static int loongson3_cpu_disable(void)
469*4882a593Smuzhiyun {
470*4882a593Smuzhiyun unsigned long flags;
471*4882a593Smuzhiyun unsigned int cpu = smp_processor_id();
472*4882a593Smuzhiyun
473*4882a593Smuzhiyun if (cpu == 0)
474*4882a593Smuzhiyun return -EBUSY;
475*4882a593Smuzhiyun
476*4882a593Smuzhiyun set_cpu_online(cpu, false);
477*4882a593Smuzhiyun calculate_cpu_foreign_map();
478*4882a593Smuzhiyun local_irq_save(flags);
479*4882a593Smuzhiyun irq_cpu_offline();
480*4882a593Smuzhiyun clear_c0_status(ST0_IM);
481*4882a593Smuzhiyun local_irq_restore(flags);
482*4882a593Smuzhiyun local_flush_tlb_all();
483*4882a593Smuzhiyun
484*4882a593Smuzhiyun return 0;
485*4882a593Smuzhiyun }
486*4882a593Smuzhiyun
487*4882a593Smuzhiyun
loongson3_cpu_die(unsigned int cpu)488*4882a593Smuzhiyun static void loongson3_cpu_die(unsigned int cpu)
489*4882a593Smuzhiyun {
490*4882a593Smuzhiyun while (per_cpu(cpu_state, cpu) != CPU_DEAD)
491*4882a593Smuzhiyun cpu_relax();
492*4882a593Smuzhiyun
493*4882a593Smuzhiyun mb();
494*4882a593Smuzhiyun }
495*4882a593Smuzhiyun
496*4882a593Smuzhiyun /* To shutdown a core in Loongson 3, the target core should go to CKSEG1 and
497*4882a593Smuzhiyun * flush all L1 entries at first. Then, another core (usually Core 0) can
498*4882a593Smuzhiyun * safely disable the clock of the target core. loongson3_play_dead() is
499*4882a593Smuzhiyun * called via CKSEG1 (uncached and unmmaped) */
loongson3_type1_play_dead(int * state_addr)500*4882a593Smuzhiyun static void loongson3_type1_play_dead(int *state_addr)
501*4882a593Smuzhiyun {
502*4882a593Smuzhiyun register int val;
503*4882a593Smuzhiyun register long cpuid, core, node, count;
504*4882a593Smuzhiyun register void *addr, *base, *initfunc;
505*4882a593Smuzhiyun
506*4882a593Smuzhiyun __asm__ __volatile__(
507*4882a593Smuzhiyun " .set push \n"
508*4882a593Smuzhiyun " .set noreorder \n"
509*4882a593Smuzhiyun " li %[addr], 0x80000000 \n" /* KSEG0 */
510*4882a593Smuzhiyun "1: cache 0, 0(%[addr]) \n" /* flush L1 ICache */
511*4882a593Smuzhiyun " cache 0, 1(%[addr]) \n"
512*4882a593Smuzhiyun " cache 0, 2(%[addr]) \n"
513*4882a593Smuzhiyun " cache 0, 3(%[addr]) \n"
514*4882a593Smuzhiyun " cache 1, 0(%[addr]) \n" /* flush L1 DCache */
515*4882a593Smuzhiyun " cache 1, 1(%[addr]) \n"
516*4882a593Smuzhiyun " cache 1, 2(%[addr]) \n"
517*4882a593Smuzhiyun " cache 1, 3(%[addr]) \n"
518*4882a593Smuzhiyun " addiu %[sets], %[sets], -1 \n"
519*4882a593Smuzhiyun " bnez %[sets], 1b \n"
520*4882a593Smuzhiyun " addiu %[addr], %[addr], 0x20 \n"
521*4882a593Smuzhiyun " li %[val], 0x7 \n" /* *state_addr = CPU_DEAD; */
522*4882a593Smuzhiyun " sw %[val], (%[state_addr]) \n"
523*4882a593Smuzhiyun " sync \n"
524*4882a593Smuzhiyun " cache 21, (%[state_addr]) \n" /* flush entry of *state_addr */
525*4882a593Smuzhiyun " .set pop \n"
526*4882a593Smuzhiyun : [addr] "=&r" (addr), [val] "=&r" (val)
527*4882a593Smuzhiyun : [state_addr] "r" (state_addr),
528*4882a593Smuzhiyun [sets] "r" (cpu_data[smp_processor_id()].dcache.sets));
529*4882a593Smuzhiyun
530*4882a593Smuzhiyun __asm__ __volatile__(
531*4882a593Smuzhiyun " .set push \n"
532*4882a593Smuzhiyun " .set noreorder \n"
533*4882a593Smuzhiyun " .set mips64 \n"
534*4882a593Smuzhiyun " mfc0 %[cpuid], $15, 1 \n"
535*4882a593Smuzhiyun " andi %[cpuid], 0x3ff \n"
536*4882a593Smuzhiyun " dli %[base], 0x900000003ff01000 \n"
537*4882a593Smuzhiyun " andi %[core], %[cpuid], 0x3 \n"
538*4882a593Smuzhiyun " sll %[core], 8 \n" /* get core id */
539*4882a593Smuzhiyun " or %[base], %[base], %[core] \n"
540*4882a593Smuzhiyun " andi %[node], %[cpuid], 0xc \n"
541*4882a593Smuzhiyun " dsll %[node], 42 \n" /* get node id */
542*4882a593Smuzhiyun " or %[base], %[base], %[node] \n"
543*4882a593Smuzhiyun "1: li %[count], 0x100 \n" /* wait for init loop */
544*4882a593Smuzhiyun "2: bnez %[count], 2b \n" /* limit mailbox access */
545*4882a593Smuzhiyun " addiu %[count], -1 \n"
546*4882a593Smuzhiyun " ld %[initfunc], 0x20(%[base]) \n" /* get PC via mailbox */
547*4882a593Smuzhiyun " beqz %[initfunc], 1b \n"
548*4882a593Smuzhiyun " nop \n"
549*4882a593Smuzhiyun " ld $sp, 0x28(%[base]) \n" /* get SP via mailbox */
550*4882a593Smuzhiyun " ld $gp, 0x30(%[base]) \n" /* get GP via mailbox */
551*4882a593Smuzhiyun " ld $a1, 0x38(%[base]) \n"
552*4882a593Smuzhiyun " jr %[initfunc] \n" /* jump to initial PC */
553*4882a593Smuzhiyun " nop \n"
554*4882a593Smuzhiyun " .set pop \n"
555*4882a593Smuzhiyun : [core] "=&r" (core), [node] "=&r" (node),
556*4882a593Smuzhiyun [base] "=&r" (base), [cpuid] "=&r" (cpuid),
557*4882a593Smuzhiyun [count] "=&r" (count), [initfunc] "=&r" (initfunc)
558*4882a593Smuzhiyun : /* No Input */
559*4882a593Smuzhiyun : "a1");
560*4882a593Smuzhiyun }
561*4882a593Smuzhiyun
loongson3_type2_play_dead(int * state_addr)562*4882a593Smuzhiyun static void loongson3_type2_play_dead(int *state_addr)
563*4882a593Smuzhiyun {
564*4882a593Smuzhiyun register int val;
565*4882a593Smuzhiyun register long cpuid, core, node, count;
566*4882a593Smuzhiyun register void *addr, *base, *initfunc;
567*4882a593Smuzhiyun
568*4882a593Smuzhiyun __asm__ __volatile__(
569*4882a593Smuzhiyun " .set push \n"
570*4882a593Smuzhiyun " .set noreorder \n"
571*4882a593Smuzhiyun " li %[addr], 0x80000000 \n" /* KSEG0 */
572*4882a593Smuzhiyun "1: cache 0, 0(%[addr]) \n" /* flush L1 ICache */
573*4882a593Smuzhiyun " cache 0, 1(%[addr]) \n"
574*4882a593Smuzhiyun " cache 0, 2(%[addr]) \n"
575*4882a593Smuzhiyun " cache 0, 3(%[addr]) \n"
576*4882a593Smuzhiyun " cache 1, 0(%[addr]) \n" /* flush L1 DCache */
577*4882a593Smuzhiyun " cache 1, 1(%[addr]) \n"
578*4882a593Smuzhiyun " cache 1, 2(%[addr]) \n"
579*4882a593Smuzhiyun " cache 1, 3(%[addr]) \n"
580*4882a593Smuzhiyun " addiu %[sets], %[sets], -1 \n"
581*4882a593Smuzhiyun " bnez %[sets], 1b \n"
582*4882a593Smuzhiyun " addiu %[addr], %[addr], 0x20 \n"
583*4882a593Smuzhiyun " li %[val], 0x7 \n" /* *state_addr = CPU_DEAD; */
584*4882a593Smuzhiyun " sw %[val], (%[state_addr]) \n"
585*4882a593Smuzhiyun " sync \n"
586*4882a593Smuzhiyun " cache 21, (%[state_addr]) \n" /* flush entry of *state_addr */
587*4882a593Smuzhiyun " .set pop \n"
588*4882a593Smuzhiyun : [addr] "=&r" (addr), [val] "=&r" (val)
589*4882a593Smuzhiyun : [state_addr] "r" (state_addr),
590*4882a593Smuzhiyun [sets] "r" (cpu_data[smp_processor_id()].dcache.sets));
591*4882a593Smuzhiyun
592*4882a593Smuzhiyun __asm__ __volatile__(
593*4882a593Smuzhiyun " .set push \n"
594*4882a593Smuzhiyun " .set noreorder \n"
595*4882a593Smuzhiyun " .set mips64 \n"
596*4882a593Smuzhiyun " mfc0 %[cpuid], $15, 1 \n"
597*4882a593Smuzhiyun " andi %[cpuid], 0x3ff \n"
598*4882a593Smuzhiyun " dli %[base], 0x900000003ff01000 \n"
599*4882a593Smuzhiyun " andi %[core], %[cpuid], 0x3 \n"
600*4882a593Smuzhiyun " sll %[core], 8 \n" /* get core id */
601*4882a593Smuzhiyun " or %[base], %[base], %[core] \n"
602*4882a593Smuzhiyun " andi %[node], %[cpuid], 0xc \n"
603*4882a593Smuzhiyun " dsll %[node], 42 \n" /* get node id */
604*4882a593Smuzhiyun " or %[base], %[base], %[node] \n"
605*4882a593Smuzhiyun " dsrl %[node], 30 \n" /* 15:14 */
606*4882a593Smuzhiyun " or %[base], %[base], %[node] \n"
607*4882a593Smuzhiyun "1: li %[count], 0x100 \n" /* wait for init loop */
608*4882a593Smuzhiyun "2: bnez %[count], 2b \n" /* limit mailbox access */
609*4882a593Smuzhiyun " addiu %[count], -1 \n"
610*4882a593Smuzhiyun " ld %[initfunc], 0x20(%[base]) \n" /* get PC via mailbox */
611*4882a593Smuzhiyun " beqz %[initfunc], 1b \n"
612*4882a593Smuzhiyun " nop \n"
613*4882a593Smuzhiyun " ld $sp, 0x28(%[base]) \n" /* get SP via mailbox */
614*4882a593Smuzhiyun " ld $gp, 0x30(%[base]) \n" /* get GP via mailbox */
615*4882a593Smuzhiyun " ld $a1, 0x38(%[base]) \n"
616*4882a593Smuzhiyun " jr %[initfunc] \n" /* jump to initial PC */
617*4882a593Smuzhiyun " nop \n"
618*4882a593Smuzhiyun " .set pop \n"
619*4882a593Smuzhiyun : [core] "=&r" (core), [node] "=&r" (node),
620*4882a593Smuzhiyun [base] "=&r" (base), [cpuid] "=&r" (cpuid),
621*4882a593Smuzhiyun [count] "=&r" (count), [initfunc] "=&r" (initfunc)
622*4882a593Smuzhiyun : /* No Input */
623*4882a593Smuzhiyun : "a1");
624*4882a593Smuzhiyun }
625*4882a593Smuzhiyun
loongson3_type3_play_dead(int * state_addr)626*4882a593Smuzhiyun static void loongson3_type3_play_dead(int *state_addr)
627*4882a593Smuzhiyun {
628*4882a593Smuzhiyun register int val;
629*4882a593Smuzhiyun register long cpuid, core, node, count;
630*4882a593Smuzhiyun register void *addr, *base, *initfunc;
631*4882a593Smuzhiyun
632*4882a593Smuzhiyun __asm__ __volatile__(
633*4882a593Smuzhiyun " .set push \n"
634*4882a593Smuzhiyun " .set noreorder \n"
635*4882a593Smuzhiyun " li %[addr], 0x80000000 \n" /* KSEG0 */
636*4882a593Smuzhiyun "1: cache 0, 0(%[addr]) \n" /* flush L1 ICache */
637*4882a593Smuzhiyun " cache 0, 1(%[addr]) \n"
638*4882a593Smuzhiyun " cache 0, 2(%[addr]) \n"
639*4882a593Smuzhiyun " cache 0, 3(%[addr]) \n"
640*4882a593Smuzhiyun " cache 1, 0(%[addr]) \n" /* flush L1 DCache */
641*4882a593Smuzhiyun " cache 1, 1(%[addr]) \n"
642*4882a593Smuzhiyun " cache 1, 2(%[addr]) \n"
643*4882a593Smuzhiyun " cache 1, 3(%[addr]) \n"
644*4882a593Smuzhiyun " addiu %[sets], %[sets], -1 \n"
645*4882a593Smuzhiyun " bnez %[sets], 1b \n"
646*4882a593Smuzhiyun " addiu %[addr], %[addr], 0x40 \n"
647*4882a593Smuzhiyun " li %[addr], 0x80000000 \n" /* KSEG0 */
648*4882a593Smuzhiyun "2: cache 2, 0(%[addr]) \n" /* flush L1 VCache */
649*4882a593Smuzhiyun " cache 2, 1(%[addr]) \n"
650*4882a593Smuzhiyun " cache 2, 2(%[addr]) \n"
651*4882a593Smuzhiyun " cache 2, 3(%[addr]) \n"
652*4882a593Smuzhiyun " cache 2, 4(%[addr]) \n"
653*4882a593Smuzhiyun " cache 2, 5(%[addr]) \n"
654*4882a593Smuzhiyun " cache 2, 6(%[addr]) \n"
655*4882a593Smuzhiyun " cache 2, 7(%[addr]) \n"
656*4882a593Smuzhiyun " cache 2, 8(%[addr]) \n"
657*4882a593Smuzhiyun " cache 2, 9(%[addr]) \n"
658*4882a593Smuzhiyun " cache 2, 10(%[addr]) \n"
659*4882a593Smuzhiyun " cache 2, 11(%[addr]) \n"
660*4882a593Smuzhiyun " cache 2, 12(%[addr]) \n"
661*4882a593Smuzhiyun " cache 2, 13(%[addr]) \n"
662*4882a593Smuzhiyun " cache 2, 14(%[addr]) \n"
663*4882a593Smuzhiyun " cache 2, 15(%[addr]) \n"
664*4882a593Smuzhiyun " addiu %[vsets], %[vsets], -1 \n"
665*4882a593Smuzhiyun " bnez %[vsets], 2b \n"
666*4882a593Smuzhiyun " addiu %[addr], %[addr], 0x40 \n"
667*4882a593Smuzhiyun " li %[val], 0x7 \n" /* *state_addr = CPU_DEAD; */
668*4882a593Smuzhiyun " sw %[val], (%[state_addr]) \n"
669*4882a593Smuzhiyun " sync \n"
670*4882a593Smuzhiyun " cache 21, (%[state_addr]) \n" /* flush entry of *state_addr */
671*4882a593Smuzhiyun " .set pop \n"
672*4882a593Smuzhiyun : [addr] "=&r" (addr), [val] "=&r" (val)
673*4882a593Smuzhiyun : [state_addr] "r" (state_addr),
674*4882a593Smuzhiyun [sets] "r" (cpu_data[smp_processor_id()].dcache.sets),
675*4882a593Smuzhiyun [vsets] "r" (cpu_data[smp_processor_id()].vcache.sets));
676*4882a593Smuzhiyun
677*4882a593Smuzhiyun __asm__ __volatile__(
678*4882a593Smuzhiyun " .set push \n"
679*4882a593Smuzhiyun " .set noreorder \n"
680*4882a593Smuzhiyun " .set mips64 \n"
681*4882a593Smuzhiyun " mfc0 %[cpuid], $15, 1 \n"
682*4882a593Smuzhiyun " andi %[cpuid], 0x3ff \n"
683*4882a593Smuzhiyun " dli %[base], 0x900000003ff01000 \n"
684*4882a593Smuzhiyun " andi %[core], %[cpuid], 0x3 \n"
685*4882a593Smuzhiyun " sll %[core], 8 \n" /* get core id */
686*4882a593Smuzhiyun " or %[base], %[base], %[core] \n"
687*4882a593Smuzhiyun " andi %[node], %[cpuid], 0xc \n"
688*4882a593Smuzhiyun " dsll %[node], 42 \n" /* get node id */
689*4882a593Smuzhiyun " or %[base], %[base], %[node] \n"
690*4882a593Smuzhiyun "1: li %[count], 0x100 \n" /* wait for init loop */
691*4882a593Smuzhiyun "2: bnez %[count], 2b \n" /* limit mailbox access */
692*4882a593Smuzhiyun " addiu %[count], -1 \n"
693*4882a593Smuzhiyun " ld %[initfunc], 0x20(%[base]) \n" /* get PC via mailbox */
694*4882a593Smuzhiyun " beqz %[initfunc], 1b \n"
695*4882a593Smuzhiyun " nop \n"
696*4882a593Smuzhiyun " ld $sp, 0x28(%[base]) \n" /* get SP via mailbox */
697*4882a593Smuzhiyun " ld $gp, 0x30(%[base]) \n" /* get GP via mailbox */
698*4882a593Smuzhiyun " ld $a1, 0x38(%[base]) \n"
699*4882a593Smuzhiyun " jr %[initfunc] \n" /* jump to initial PC */
700*4882a593Smuzhiyun " nop \n"
701*4882a593Smuzhiyun " .set pop \n"
702*4882a593Smuzhiyun : [core] "=&r" (core), [node] "=&r" (node),
703*4882a593Smuzhiyun [base] "=&r" (base), [cpuid] "=&r" (cpuid),
704*4882a593Smuzhiyun [count] "=&r" (count), [initfunc] "=&r" (initfunc)
705*4882a593Smuzhiyun : /* No Input */
706*4882a593Smuzhiyun : "a1");
707*4882a593Smuzhiyun }
708*4882a593Smuzhiyun
play_dead(void)709*4882a593Smuzhiyun void play_dead(void)
710*4882a593Smuzhiyun {
711*4882a593Smuzhiyun int prid_imp, prid_rev, *state_addr;
712*4882a593Smuzhiyun unsigned int cpu = smp_processor_id();
713*4882a593Smuzhiyun void (*play_dead_at_ckseg1)(int *);
714*4882a593Smuzhiyun
715*4882a593Smuzhiyun idle_task_exit();
716*4882a593Smuzhiyun
717*4882a593Smuzhiyun prid_imp = read_c0_prid() & PRID_IMP_MASK;
718*4882a593Smuzhiyun prid_rev = read_c0_prid() & PRID_REV_MASK;
719*4882a593Smuzhiyun
720*4882a593Smuzhiyun if (prid_imp == PRID_IMP_LOONGSON_64G) {
721*4882a593Smuzhiyun play_dead_at_ckseg1 =
722*4882a593Smuzhiyun (void *)CKSEG1ADDR((unsigned long)loongson3_type3_play_dead);
723*4882a593Smuzhiyun goto out;
724*4882a593Smuzhiyun }
725*4882a593Smuzhiyun
726*4882a593Smuzhiyun switch (prid_rev) {
727*4882a593Smuzhiyun case PRID_REV_LOONGSON3A_R1:
728*4882a593Smuzhiyun default:
729*4882a593Smuzhiyun play_dead_at_ckseg1 =
730*4882a593Smuzhiyun (void *)CKSEG1ADDR((unsigned long)loongson3_type1_play_dead);
731*4882a593Smuzhiyun break;
732*4882a593Smuzhiyun case PRID_REV_LOONGSON3B_R1:
733*4882a593Smuzhiyun case PRID_REV_LOONGSON3B_R2:
734*4882a593Smuzhiyun play_dead_at_ckseg1 =
735*4882a593Smuzhiyun (void *)CKSEG1ADDR((unsigned long)loongson3_type2_play_dead);
736*4882a593Smuzhiyun break;
737*4882a593Smuzhiyun case PRID_REV_LOONGSON3A_R2_0:
738*4882a593Smuzhiyun case PRID_REV_LOONGSON3A_R2_1:
739*4882a593Smuzhiyun case PRID_REV_LOONGSON3A_R3_0:
740*4882a593Smuzhiyun case PRID_REV_LOONGSON3A_R3_1:
741*4882a593Smuzhiyun play_dead_at_ckseg1 =
742*4882a593Smuzhiyun (void *)CKSEG1ADDR((unsigned long)loongson3_type3_play_dead);
743*4882a593Smuzhiyun break;
744*4882a593Smuzhiyun }
745*4882a593Smuzhiyun
746*4882a593Smuzhiyun out:
747*4882a593Smuzhiyun state_addr = &per_cpu(cpu_state, cpu);
748*4882a593Smuzhiyun mb();
749*4882a593Smuzhiyun play_dead_at_ckseg1(state_addr);
750*4882a593Smuzhiyun }
751*4882a593Smuzhiyun
loongson3_disable_clock(unsigned int cpu)752*4882a593Smuzhiyun static int loongson3_disable_clock(unsigned int cpu)
753*4882a593Smuzhiyun {
754*4882a593Smuzhiyun uint64_t core_id = cpu_core(&cpu_data[cpu]);
755*4882a593Smuzhiyun uint64_t package_id = cpu_data[cpu].package;
756*4882a593Smuzhiyun
757*4882a593Smuzhiyun if ((read_c0_prid() & PRID_REV_MASK) == PRID_REV_LOONGSON3A_R1) {
758*4882a593Smuzhiyun LOONGSON_CHIPCFG(package_id) &= ~(1 << (12 + core_id));
759*4882a593Smuzhiyun } else {
760*4882a593Smuzhiyun if (!(loongson_sysconf.workarounds & WORKAROUND_CPUHOTPLUG))
761*4882a593Smuzhiyun LOONGSON_FREQCTRL(package_id) &= ~(1 << (core_id * 4 + 3));
762*4882a593Smuzhiyun }
763*4882a593Smuzhiyun return 0;
764*4882a593Smuzhiyun }
765*4882a593Smuzhiyun
loongson3_enable_clock(unsigned int cpu)766*4882a593Smuzhiyun static int loongson3_enable_clock(unsigned int cpu)
767*4882a593Smuzhiyun {
768*4882a593Smuzhiyun uint64_t core_id = cpu_core(&cpu_data[cpu]);
769*4882a593Smuzhiyun uint64_t package_id = cpu_data[cpu].package;
770*4882a593Smuzhiyun
771*4882a593Smuzhiyun if ((read_c0_prid() & PRID_REV_MASK) == PRID_REV_LOONGSON3A_R1) {
772*4882a593Smuzhiyun LOONGSON_CHIPCFG(package_id) |= 1 << (12 + core_id);
773*4882a593Smuzhiyun } else {
774*4882a593Smuzhiyun if (!(loongson_sysconf.workarounds & WORKAROUND_CPUHOTPLUG))
775*4882a593Smuzhiyun LOONGSON_FREQCTRL(package_id) |= 1 << (core_id * 4 + 3);
776*4882a593Smuzhiyun }
777*4882a593Smuzhiyun return 0;
778*4882a593Smuzhiyun }
779*4882a593Smuzhiyun
register_loongson3_notifier(void)780*4882a593Smuzhiyun static int register_loongson3_notifier(void)
781*4882a593Smuzhiyun {
782*4882a593Smuzhiyun return cpuhp_setup_state_nocalls(CPUHP_MIPS_SOC_PREPARE,
783*4882a593Smuzhiyun "mips/loongson:prepare",
784*4882a593Smuzhiyun loongson3_enable_clock,
785*4882a593Smuzhiyun loongson3_disable_clock);
786*4882a593Smuzhiyun }
787*4882a593Smuzhiyun early_initcall(register_loongson3_notifier);
788*4882a593Smuzhiyun
789*4882a593Smuzhiyun #endif
790*4882a593Smuzhiyun
791*4882a593Smuzhiyun const struct plat_smp_ops loongson3_smp_ops = {
792*4882a593Smuzhiyun .send_ipi_single = loongson3_send_ipi_single,
793*4882a593Smuzhiyun .send_ipi_mask = loongson3_send_ipi_mask,
794*4882a593Smuzhiyun .init_secondary = loongson3_init_secondary,
795*4882a593Smuzhiyun .smp_finish = loongson3_smp_finish,
796*4882a593Smuzhiyun .boot_secondary = loongson3_boot_secondary,
797*4882a593Smuzhiyun .smp_setup = loongson3_smp_setup,
798*4882a593Smuzhiyun .prepare_cpus = loongson3_prepare_cpus,
799*4882a593Smuzhiyun #ifdef CONFIG_HOTPLUG_CPU
800*4882a593Smuzhiyun .cpu_disable = loongson3_cpu_disable,
801*4882a593Smuzhiyun .cpu_die = loongson3_cpu_die,
802*4882a593Smuzhiyun #endif
803*4882a593Smuzhiyun #ifdef CONFIG_KEXEC
804*4882a593Smuzhiyun .kexec_nonboot_cpu = kexec_nonboot_cpu_jump,
805*4882a593Smuzhiyun #endif
806*4882a593Smuzhiyun };
807