1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun // Copyright (C) 2018 Hangzhou C-SKY Microsystems co.,ltd.
3*4882a593Smuzhiyun
4*4882a593Smuzhiyun #include <linux/ptrace.h>
5*4882a593Smuzhiyun #include <linux/uaccess.h>
6*4882a593Smuzhiyun #include <abi/reg_ops.h>
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #define MTCR_MASK 0xFC00FFE0
9*4882a593Smuzhiyun #define MFCR_MASK 0xFC00FFE0
10*4882a593Smuzhiyun #define MTCR_DIST 0xC0006420
11*4882a593Smuzhiyun #define MFCR_DIST 0xC0006020
12*4882a593Smuzhiyun
13*4882a593Smuzhiyun /*
14*4882a593Smuzhiyun * fpu_libc_helper() is to help libc to excute:
15*4882a593Smuzhiyun * - mfcr %a, cr<1, 2>
16*4882a593Smuzhiyun * - mfcr %a, cr<2, 2>
17*4882a593Smuzhiyun * - mtcr %a, cr<1, 2>
18*4882a593Smuzhiyun * - mtcr %a, cr<2, 2>
19*4882a593Smuzhiyun */
fpu_libc_helper(struct pt_regs * regs)20*4882a593Smuzhiyun int fpu_libc_helper(struct pt_regs *regs)
21*4882a593Smuzhiyun {
22*4882a593Smuzhiyun int fault;
23*4882a593Smuzhiyun unsigned long instrptr, regx = 0;
24*4882a593Smuzhiyun unsigned long index = 0, tmp = 0;
25*4882a593Smuzhiyun unsigned long tinstr = 0;
26*4882a593Smuzhiyun u16 instr_hi, instr_low;
27*4882a593Smuzhiyun
28*4882a593Smuzhiyun instrptr = instruction_pointer(regs);
29*4882a593Smuzhiyun if (instrptr & 1)
30*4882a593Smuzhiyun return 0;
31*4882a593Smuzhiyun
32*4882a593Smuzhiyun fault = __get_user(instr_low, (u16 *)instrptr);
33*4882a593Smuzhiyun if (fault)
34*4882a593Smuzhiyun return 0;
35*4882a593Smuzhiyun
36*4882a593Smuzhiyun fault = __get_user(instr_hi, (u16 *)(instrptr + 2));
37*4882a593Smuzhiyun if (fault)
38*4882a593Smuzhiyun return 0;
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun tinstr = instr_hi | ((unsigned long)instr_low << 16);
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun if (((tinstr >> 21) & 0x1F) != 2)
43*4882a593Smuzhiyun return 0;
44*4882a593Smuzhiyun
45*4882a593Smuzhiyun if ((tinstr & MTCR_MASK) == MTCR_DIST) {
46*4882a593Smuzhiyun index = (tinstr >> 16) & 0x1F;
47*4882a593Smuzhiyun if (index > 13)
48*4882a593Smuzhiyun return 0;
49*4882a593Smuzhiyun
50*4882a593Smuzhiyun tmp = tinstr & 0x1F;
51*4882a593Smuzhiyun if (tmp > 2)
52*4882a593Smuzhiyun return 0;
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun regx = *(®s->a0 + index);
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun if (tmp == 1)
57*4882a593Smuzhiyun mtcr("cr<1, 2>", regx);
58*4882a593Smuzhiyun else if (tmp == 2)
59*4882a593Smuzhiyun mtcr("cr<2, 2>", regx);
60*4882a593Smuzhiyun else
61*4882a593Smuzhiyun return 0;
62*4882a593Smuzhiyun
63*4882a593Smuzhiyun regs->pc += 4;
64*4882a593Smuzhiyun return 1;
65*4882a593Smuzhiyun }
66*4882a593Smuzhiyun
67*4882a593Smuzhiyun if ((tinstr & MFCR_MASK) == MFCR_DIST) {
68*4882a593Smuzhiyun index = tinstr & 0x1F;
69*4882a593Smuzhiyun if (index > 13)
70*4882a593Smuzhiyun return 0;
71*4882a593Smuzhiyun
72*4882a593Smuzhiyun tmp = ((tinstr >> 16) & 0x1F);
73*4882a593Smuzhiyun if (tmp > 2)
74*4882a593Smuzhiyun return 0;
75*4882a593Smuzhiyun
76*4882a593Smuzhiyun if (tmp == 1)
77*4882a593Smuzhiyun regx = mfcr("cr<1, 2>");
78*4882a593Smuzhiyun else if (tmp == 2)
79*4882a593Smuzhiyun regx = mfcr("cr<2, 2>");
80*4882a593Smuzhiyun else
81*4882a593Smuzhiyun return 0;
82*4882a593Smuzhiyun
83*4882a593Smuzhiyun *(®s->a0 + index) = regx;
84*4882a593Smuzhiyun
85*4882a593Smuzhiyun regs->pc += 4;
86*4882a593Smuzhiyun return 1;
87*4882a593Smuzhiyun }
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun return 0;
90*4882a593Smuzhiyun }
91*4882a593Smuzhiyun
fpu_fpe(struct pt_regs * regs)92*4882a593Smuzhiyun void fpu_fpe(struct pt_regs *regs)
93*4882a593Smuzhiyun {
94*4882a593Smuzhiyun int sig, code;
95*4882a593Smuzhiyun unsigned int fesr;
96*4882a593Smuzhiyun
97*4882a593Smuzhiyun fesr = mfcr("cr<2, 2>");
98*4882a593Smuzhiyun
99*4882a593Smuzhiyun sig = SIGFPE;
100*4882a593Smuzhiyun code = FPE_FLTUNK;
101*4882a593Smuzhiyun
102*4882a593Smuzhiyun if (fesr & FPE_ILLE) {
103*4882a593Smuzhiyun sig = SIGILL;
104*4882a593Smuzhiyun code = ILL_ILLOPC;
105*4882a593Smuzhiyun } else if (fesr & FPE_IDC) {
106*4882a593Smuzhiyun sig = SIGILL;
107*4882a593Smuzhiyun code = ILL_ILLOPN;
108*4882a593Smuzhiyun } else if (fesr & FPE_FEC) {
109*4882a593Smuzhiyun sig = SIGFPE;
110*4882a593Smuzhiyun if (fesr & FPE_IOC)
111*4882a593Smuzhiyun code = FPE_FLTINV;
112*4882a593Smuzhiyun else if (fesr & FPE_DZC)
113*4882a593Smuzhiyun code = FPE_FLTDIV;
114*4882a593Smuzhiyun else if (fesr & FPE_UFC)
115*4882a593Smuzhiyun code = FPE_FLTUND;
116*4882a593Smuzhiyun else if (fesr & FPE_OFC)
117*4882a593Smuzhiyun code = FPE_FLTOVF;
118*4882a593Smuzhiyun else if (fesr & FPE_IXC)
119*4882a593Smuzhiyun code = FPE_FLTRES;
120*4882a593Smuzhiyun }
121*4882a593Smuzhiyun
122*4882a593Smuzhiyun force_sig_fault(sig, code, (void __user *)regs->pc);
123*4882a593Smuzhiyun }
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun #define FMFVR_FPU_REGS(vrx, vry) \
126*4882a593Smuzhiyun "fmfvrl %0, "#vrx"\n" \
127*4882a593Smuzhiyun "fmfvrh %1, "#vrx"\n" \
128*4882a593Smuzhiyun "fmfvrl %2, "#vry"\n" \
129*4882a593Smuzhiyun "fmfvrh %3, "#vry"\n"
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun #define FMTVR_FPU_REGS(vrx, vry) \
132*4882a593Smuzhiyun "fmtvrl "#vrx", %0\n" \
133*4882a593Smuzhiyun "fmtvrh "#vrx", %1\n" \
134*4882a593Smuzhiyun "fmtvrl "#vry", %2\n" \
135*4882a593Smuzhiyun "fmtvrh "#vry", %3\n"
136*4882a593Smuzhiyun
137*4882a593Smuzhiyun #define STW_FPU_REGS(a, b, c, d) \
138*4882a593Smuzhiyun "stw %0, (%4, "#a")\n" \
139*4882a593Smuzhiyun "stw %1, (%4, "#b")\n" \
140*4882a593Smuzhiyun "stw %2, (%4, "#c")\n" \
141*4882a593Smuzhiyun "stw %3, (%4, "#d")\n"
142*4882a593Smuzhiyun
143*4882a593Smuzhiyun #define LDW_FPU_REGS(a, b, c, d) \
144*4882a593Smuzhiyun "ldw %0, (%4, "#a")\n" \
145*4882a593Smuzhiyun "ldw %1, (%4, "#b")\n" \
146*4882a593Smuzhiyun "ldw %2, (%4, "#c")\n" \
147*4882a593Smuzhiyun "ldw %3, (%4, "#d")\n"
148*4882a593Smuzhiyun
save_to_user_fp(struct user_fp * user_fp)149*4882a593Smuzhiyun void save_to_user_fp(struct user_fp *user_fp)
150*4882a593Smuzhiyun {
151*4882a593Smuzhiyun unsigned long flg;
152*4882a593Smuzhiyun unsigned long tmp1, tmp2;
153*4882a593Smuzhiyun unsigned long *fpregs;
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun local_irq_save(flg);
156*4882a593Smuzhiyun
157*4882a593Smuzhiyun tmp1 = mfcr("cr<1, 2>");
158*4882a593Smuzhiyun tmp2 = mfcr("cr<2, 2>");
159*4882a593Smuzhiyun
160*4882a593Smuzhiyun user_fp->fcr = tmp1;
161*4882a593Smuzhiyun user_fp->fesr = tmp2;
162*4882a593Smuzhiyun
163*4882a593Smuzhiyun fpregs = &user_fp->vr[0];
164*4882a593Smuzhiyun #ifdef CONFIG_CPU_HAS_FPUV2
165*4882a593Smuzhiyun #ifdef CONFIG_CPU_HAS_VDSP
166*4882a593Smuzhiyun asm volatile(
167*4882a593Smuzhiyun "vstmu.32 vr0-vr3, (%0)\n"
168*4882a593Smuzhiyun "vstmu.32 vr4-vr7, (%0)\n"
169*4882a593Smuzhiyun "vstmu.32 vr8-vr11, (%0)\n"
170*4882a593Smuzhiyun "vstmu.32 vr12-vr15, (%0)\n"
171*4882a593Smuzhiyun "fstmu.64 vr16-vr31, (%0)\n"
172*4882a593Smuzhiyun : "+a"(fpregs)
173*4882a593Smuzhiyun ::"memory");
174*4882a593Smuzhiyun #else
175*4882a593Smuzhiyun asm volatile(
176*4882a593Smuzhiyun "fstmu.64 vr0-vr31, (%0)\n"
177*4882a593Smuzhiyun : "+a"(fpregs)
178*4882a593Smuzhiyun ::"memory");
179*4882a593Smuzhiyun #endif
180*4882a593Smuzhiyun #else
181*4882a593Smuzhiyun {
182*4882a593Smuzhiyun unsigned long tmp3, tmp4;
183*4882a593Smuzhiyun
184*4882a593Smuzhiyun asm volatile(
185*4882a593Smuzhiyun FMFVR_FPU_REGS(vr0, vr1)
186*4882a593Smuzhiyun STW_FPU_REGS(0, 4, 16, 20)
187*4882a593Smuzhiyun FMFVR_FPU_REGS(vr2, vr3)
188*4882a593Smuzhiyun STW_FPU_REGS(32, 36, 48, 52)
189*4882a593Smuzhiyun FMFVR_FPU_REGS(vr4, vr5)
190*4882a593Smuzhiyun STW_FPU_REGS(64, 68, 80, 84)
191*4882a593Smuzhiyun FMFVR_FPU_REGS(vr6, vr7)
192*4882a593Smuzhiyun STW_FPU_REGS(96, 100, 112, 116)
193*4882a593Smuzhiyun "addi %4, 128\n"
194*4882a593Smuzhiyun FMFVR_FPU_REGS(vr8, vr9)
195*4882a593Smuzhiyun STW_FPU_REGS(0, 4, 16, 20)
196*4882a593Smuzhiyun FMFVR_FPU_REGS(vr10, vr11)
197*4882a593Smuzhiyun STW_FPU_REGS(32, 36, 48, 52)
198*4882a593Smuzhiyun FMFVR_FPU_REGS(vr12, vr13)
199*4882a593Smuzhiyun STW_FPU_REGS(64, 68, 80, 84)
200*4882a593Smuzhiyun FMFVR_FPU_REGS(vr14, vr15)
201*4882a593Smuzhiyun STW_FPU_REGS(96, 100, 112, 116)
202*4882a593Smuzhiyun : "=a"(tmp1), "=a"(tmp2), "=a"(tmp3),
203*4882a593Smuzhiyun "=a"(tmp4), "+a"(fpregs)
204*4882a593Smuzhiyun ::"memory");
205*4882a593Smuzhiyun }
206*4882a593Smuzhiyun #endif
207*4882a593Smuzhiyun
208*4882a593Smuzhiyun local_irq_restore(flg);
209*4882a593Smuzhiyun }
210*4882a593Smuzhiyun
restore_from_user_fp(struct user_fp * user_fp)211*4882a593Smuzhiyun void restore_from_user_fp(struct user_fp *user_fp)
212*4882a593Smuzhiyun {
213*4882a593Smuzhiyun unsigned long flg;
214*4882a593Smuzhiyun unsigned long tmp1, tmp2;
215*4882a593Smuzhiyun unsigned long *fpregs;
216*4882a593Smuzhiyun
217*4882a593Smuzhiyun local_irq_save(flg);
218*4882a593Smuzhiyun
219*4882a593Smuzhiyun tmp1 = user_fp->fcr;
220*4882a593Smuzhiyun tmp2 = user_fp->fesr;
221*4882a593Smuzhiyun
222*4882a593Smuzhiyun mtcr("cr<1, 2>", tmp1);
223*4882a593Smuzhiyun mtcr("cr<2, 2>", tmp2);
224*4882a593Smuzhiyun
225*4882a593Smuzhiyun fpregs = &user_fp->vr[0];
226*4882a593Smuzhiyun #ifdef CONFIG_CPU_HAS_FPUV2
227*4882a593Smuzhiyun #ifdef CONFIG_CPU_HAS_VDSP
228*4882a593Smuzhiyun asm volatile(
229*4882a593Smuzhiyun "vldmu.32 vr0-vr3, (%0)\n"
230*4882a593Smuzhiyun "vldmu.32 vr4-vr7, (%0)\n"
231*4882a593Smuzhiyun "vldmu.32 vr8-vr11, (%0)\n"
232*4882a593Smuzhiyun "vldmu.32 vr12-vr15, (%0)\n"
233*4882a593Smuzhiyun "fldmu.64 vr16-vr31, (%0)\n"
234*4882a593Smuzhiyun : "+a"(fpregs)
235*4882a593Smuzhiyun ::"memory");
236*4882a593Smuzhiyun #else
237*4882a593Smuzhiyun asm volatile(
238*4882a593Smuzhiyun "fldmu.64 vr0-vr31, (%0)\n"
239*4882a593Smuzhiyun : "+a"(fpregs)
240*4882a593Smuzhiyun ::"memory");
241*4882a593Smuzhiyun #endif
242*4882a593Smuzhiyun #else
243*4882a593Smuzhiyun {
244*4882a593Smuzhiyun unsigned long tmp3, tmp4;
245*4882a593Smuzhiyun
246*4882a593Smuzhiyun asm volatile(
247*4882a593Smuzhiyun LDW_FPU_REGS(0, 4, 16, 20)
248*4882a593Smuzhiyun FMTVR_FPU_REGS(vr0, vr1)
249*4882a593Smuzhiyun LDW_FPU_REGS(32, 36, 48, 52)
250*4882a593Smuzhiyun FMTVR_FPU_REGS(vr2, vr3)
251*4882a593Smuzhiyun LDW_FPU_REGS(64, 68, 80, 84)
252*4882a593Smuzhiyun FMTVR_FPU_REGS(vr4, vr5)
253*4882a593Smuzhiyun LDW_FPU_REGS(96, 100, 112, 116)
254*4882a593Smuzhiyun FMTVR_FPU_REGS(vr6, vr7)
255*4882a593Smuzhiyun "addi %4, 128\n"
256*4882a593Smuzhiyun LDW_FPU_REGS(0, 4, 16, 20)
257*4882a593Smuzhiyun FMTVR_FPU_REGS(vr8, vr9)
258*4882a593Smuzhiyun LDW_FPU_REGS(32, 36, 48, 52)
259*4882a593Smuzhiyun FMTVR_FPU_REGS(vr10, vr11)
260*4882a593Smuzhiyun LDW_FPU_REGS(64, 68, 80, 84)
261*4882a593Smuzhiyun FMTVR_FPU_REGS(vr12, vr13)
262*4882a593Smuzhiyun LDW_FPU_REGS(96, 100, 112, 116)
263*4882a593Smuzhiyun FMTVR_FPU_REGS(vr14, vr15)
264*4882a593Smuzhiyun : "=a"(tmp1), "=a"(tmp2), "=a"(tmp3),
265*4882a593Smuzhiyun "=a"(tmp4), "+a"(fpregs)
266*4882a593Smuzhiyun ::"memory");
267*4882a593Smuzhiyun }
268*4882a593Smuzhiyun #endif
269*4882a593Smuzhiyun local_irq_restore(flg);
270*4882a593Smuzhiyun }
271