xref: /OK3568_Linux_fs/kernel/arch/mips/math-emu/cp1emu.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * cp1emu.c: a MIPS coprocessor 1 (FPU) instruction emulator
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * MIPS floating point support
6*4882a593Smuzhiyun  * Copyright (C) 1994-2000 Algorithmics Ltd.
7*4882a593Smuzhiyun  *
8*4882a593Smuzhiyun  * Kevin D. Kissell, kevink@mips.com and Carsten Langgaard, carstenl@mips.com
9*4882a593Smuzhiyun  * Copyright (C) 2000  MIPS Technologies, Inc.
10*4882a593Smuzhiyun  *
11*4882a593Smuzhiyun  * A complete emulator for MIPS coprocessor 1 instructions.  This is
12*4882a593Smuzhiyun  * required for #float(switch) or #float(trap), where it catches all
13*4882a593Smuzhiyun  * COP1 instructions via the "CoProcessor Unusable" exception.
14*4882a593Smuzhiyun  *
15*4882a593Smuzhiyun  * More surprisingly it is also required for #float(ieee), to help out
16*4882a593Smuzhiyun  * the hardware FPU at the boundaries of the IEEE-754 representation
17*4882a593Smuzhiyun  * (denormalised values, infinities, underflow, etc).  It is made
18*4882a593Smuzhiyun  * quite nasty because emulation of some non-COP1 instructions is
19*4882a593Smuzhiyun  * required, e.g. in branch delay slots.
20*4882a593Smuzhiyun  *
21*4882a593Smuzhiyun  * Note if you know that you won't have an FPU, then you'll get much
22*4882a593Smuzhiyun  * better performance by compiling with -msoft-float!
23*4882a593Smuzhiyun  */
24*4882a593Smuzhiyun #include <linux/sched.h>
25*4882a593Smuzhiyun #include <linux/debugfs.h>
26*4882a593Smuzhiyun #include <linux/percpu-defs.h>
27*4882a593Smuzhiyun #include <linux/perf_event.h>
28*4882a593Smuzhiyun 
29*4882a593Smuzhiyun #include <asm/branch.h>
30*4882a593Smuzhiyun #include <asm/inst.h>
31*4882a593Smuzhiyun #include <asm/ptrace.h>
32*4882a593Smuzhiyun #include <asm/signal.h>
33*4882a593Smuzhiyun #include <linux/uaccess.h>
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun #include <asm/cpu-info.h>
36*4882a593Smuzhiyun #include <asm/processor.h>
37*4882a593Smuzhiyun #include <asm/fpu_emulator.h>
38*4882a593Smuzhiyun #include <asm/fpu.h>
39*4882a593Smuzhiyun #include <asm/mips-r2-to-r6-emul.h>
40*4882a593Smuzhiyun 
41*4882a593Smuzhiyun #include "ieee754.h"
42*4882a593Smuzhiyun 
43*4882a593Smuzhiyun /* Function which emulates a floating point instruction. */
44*4882a593Smuzhiyun 
45*4882a593Smuzhiyun static int fpu_emu(struct pt_regs *, struct mips_fpu_struct *,
46*4882a593Smuzhiyun 	mips_instruction);
47*4882a593Smuzhiyun 
48*4882a593Smuzhiyun static int fpux_emu(struct pt_regs *,
49*4882a593Smuzhiyun 	struct mips_fpu_struct *, mips_instruction, void __user **);
50*4882a593Smuzhiyun 
51*4882a593Smuzhiyun /* Control registers */
52*4882a593Smuzhiyun 
53*4882a593Smuzhiyun #define FPCREG_RID	0	/* $0  = revision id */
54*4882a593Smuzhiyun #define FPCREG_FCCR	25	/* $25 = fccr */
55*4882a593Smuzhiyun #define FPCREG_FEXR	26	/* $26 = fexr */
56*4882a593Smuzhiyun #define FPCREG_FENR	28	/* $28 = fenr */
57*4882a593Smuzhiyun #define FPCREG_CSR	31	/* $31 = csr */
58*4882a593Smuzhiyun 
59*4882a593Smuzhiyun /* convert condition code register number to csr bit */
60*4882a593Smuzhiyun const unsigned int fpucondbit[8] = {
61*4882a593Smuzhiyun 	FPU_CSR_COND,
62*4882a593Smuzhiyun 	FPU_CSR_COND1,
63*4882a593Smuzhiyun 	FPU_CSR_COND2,
64*4882a593Smuzhiyun 	FPU_CSR_COND3,
65*4882a593Smuzhiyun 	FPU_CSR_COND4,
66*4882a593Smuzhiyun 	FPU_CSR_COND5,
67*4882a593Smuzhiyun 	FPU_CSR_COND6,
68*4882a593Smuzhiyun 	FPU_CSR_COND7
69*4882a593Smuzhiyun };
70*4882a593Smuzhiyun 
71*4882a593Smuzhiyun /* (microMIPS) Convert certain microMIPS instructions to MIPS32 format. */
72*4882a593Smuzhiyun static const int sd_format[] = {16, 17, 0, 0, 0, 0, 0, 0};
73*4882a593Smuzhiyun static const int sdps_format[] = {16, 17, 22, 0, 0, 0, 0, 0};
74*4882a593Smuzhiyun static const int dwl_format[] = {17, 20, 21, 0, 0, 0, 0, 0};
75*4882a593Smuzhiyun static const int swl_format[] = {16, 20, 21, 0, 0, 0, 0, 0};
76*4882a593Smuzhiyun 
77*4882a593Smuzhiyun /*
78*4882a593Smuzhiyun  * This functions translates a 32-bit microMIPS instruction
79*4882a593Smuzhiyun  * into a 32-bit MIPS32 instruction. Returns 0 on success
80*4882a593Smuzhiyun  * and SIGILL otherwise.
81*4882a593Smuzhiyun  */
microMIPS32_to_MIPS32(union mips_instruction * insn_ptr)82*4882a593Smuzhiyun static int microMIPS32_to_MIPS32(union mips_instruction *insn_ptr)
83*4882a593Smuzhiyun {
84*4882a593Smuzhiyun 	union mips_instruction insn = *insn_ptr;
85*4882a593Smuzhiyun 	union mips_instruction mips32_insn = insn;
86*4882a593Smuzhiyun 	int func, fmt, op;
87*4882a593Smuzhiyun 
88*4882a593Smuzhiyun 	switch (insn.mm_i_format.opcode) {
89*4882a593Smuzhiyun 	case mm_ldc132_op:
90*4882a593Smuzhiyun 		mips32_insn.mm_i_format.opcode = ldc1_op;
91*4882a593Smuzhiyun 		mips32_insn.mm_i_format.rt = insn.mm_i_format.rs;
92*4882a593Smuzhiyun 		mips32_insn.mm_i_format.rs = insn.mm_i_format.rt;
93*4882a593Smuzhiyun 		break;
94*4882a593Smuzhiyun 	case mm_lwc132_op:
95*4882a593Smuzhiyun 		mips32_insn.mm_i_format.opcode = lwc1_op;
96*4882a593Smuzhiyun 		mips32_insn.mm_i_format.rt = insn.mm_i_format.rs;
97*4882a593Smuzhiyun 		mips32_insn.mm_i_format.rs = insn.mm_i_format.rt;
98*4882a593Smuzhiyun 		break;
99*4882a593Smuzhiyun 	case mm_sdc132_op:
100*4882a593Smuzhiyun 		mips32_insn.mm_i_format.opcode = sdc1_op;
101*4882a593Smuzhiyun 		mips32_insn.mm_i_format.rt = insn.mm_i_format.rs;
102*4882a593Smuzhiyun 		mips32_insn.mm_i_format.rs = insn.mm_i_format.rt;
103*4882a593Smuzhiyun 		break;
104*4882a593Smuzhiyun 	case mm_swc132_op:
105*4882a593Smuzhiyun 		mips32_insn.mm_i_format.opcode = swc1_op;
106*4882a593Smuzhiyun 		mips32_insn.mm_i_format.rt = insn.mm_i_format.rs;
107*4882a593Smuzhiyun 		mips32_insn.mm_i_format.rs = insn.mm_i_format.rt;
108*4882a593Smuzhiyun 		break;
109*4882a593Smuzhiyun 	case mm_pool32i_op:
110*4882a593Smuzhiyun 		/* NOTE: offset is << by 1 if in microMIPS mode. */
111*4882a593Smuzhiyun 		if ((insn.mm_i_format.rt == mm_bc1f_op) ||
112*4882a593Smuzhiyun 		    (insn.mm_i_format.rt == mm_bc1t_op)) {
113*4882a593Smuzhiyun 			mips32_insn.fb_format.opcode = cop1_op;
114*4882a593Smuzhiyun 			mips32_insn.fb_format.bc = bc_op;
115*4882a593Smuzhiyun 			mips32_insn.fb_format.flag =
116*4882a593Smuzhiyun 				(insn.mm_i_format.rt == mm_bc1t_op) ? 1 : 0;
117*4882a593Smuzhiyun 		} else
118*4882a593Smuzhiyun 			return SIGILL;
119*4882a593Smuzhiyun 		break;
120*4882a593Smuzhiyun 	case mm_pool32f_op:
121*4882a593Smuzhiyun 		switch (insn.mm_fp0_format.func) {
122*4882a593Smuzhiyun 		case mm_32f_01_op:
123*4882a593Smuzhiyun 		case mm_32f_11_op:
124*4882a593Smuzhiyun 		case mm_32f_02_op:
125*4882a593Smuzhiyun 		case mm_32f_12_op:
126*4882a593Smuzhiyun 		case mm_32f_41_op:
127*4882a593Smuzhiyun 		case mm_32f_51_op:
128*4882a593Smuzhiyun 		case mm_32f_42_op:
129*4882a593Smuzhiyun 		case mm_32f_52_op:
130*4882a593Smuzhiyun 			op = insn.mm_fp0_format.func;
131*4882a593Smuzhiyun 			if (op == mm_32f_01_op)
132*4882a593Smuzhiyun 				func = madd_s_op;
133*4882a593Smuzhiyun 			else if (op == mm_32f_11_op)
134*4882a593Smuzhiyun 				func = madd_d_op;
135*4882a593Smuzhiyun 			else if (op == mm_32f_02_op)
136*4882a593Smuzhiyun 				func = nmadd_s_op;
137*4882a593Smuzhiyun 			else if (op == mm_32f_12_op)
138*4882a593Smuzhiyun 				func = nmadd_d_op;
139*4882a593Smuzhiyun 			else if (op == mm_32f_41_op)
140*4882a593Smuzhiyun 				func = msub_s_op;
141*4882a593Smuzhiyun 			else if (op == mm_32f_51_op)
142*4882a593Smuzhiyun 				func = msub_d_op;
143*4882a593Smuzhiyun 			else if (op == mm_32f_42_op)
144*4882a593Smuzhiyun 				func = nmsub_s_op;
145*4882a593Smuzhiyun 			else
146*4882a593Smuzhiyun 				func = nmsub_d_op;
147*4882a593Smuzhiyun 			mips32_insn.fp6_format.opcode = cop1x_op;
148*4882a593Smuzhiyun 			mips32_insn.fp6_format.fr = insn.mm_fp6_format.fr;
149*4882a593Smuzhiyun 			mips32_insn.fp6_format.ft = insn.mm_fp6_format.ft;
150*4882a593Smuzhiyun 			mips32_insn.fp6_format.fs = insn.mm_fp6_format.fs;
151*4882a593Smuzhiyun 			mips32_insn.fp6_format.fd = insn.mm_fp6_format.fd;
152*4882a593Smuzhiyun 			mips32_insn.fp6_format.func = func;
153*4882a593Smuzhiyun 			break;
154*4882a593Smuzhiyun 		case mm_32f_10_op:
155*4882a593Smuzhiyun 			func = -1;	/* Invalid */
156*4882a593Smuzhiyun 			op = insn.mm_fp5_format.op & 0x7;
157*4882a593Smuzhiyun 			if (op == mm_ldxc1_op)
158*4882a593Smuzhiyun 				func = ldxc1_op;
159*4882a593Smuzhiyun 			else if (op == mm_sdxc1_op)
160*4882a593Smuzhiyun 				func = sdxc1_op;
161*4882a593Smuzhiyun 			else if (op == mm_lwxc1_op)
162*4882a593Smuzhiyun 				func = lwxc1_op;
163*4882a593Smuzhiyun 			else if (op == mm_swxc1_op)
164*4882a593Smuzhiyun 				func = swxc1_op;
165*4882a593Smuzhiyun 
166*4882a593Smuzhiyun 			if (func != -1) {
167*4882a593Smuzhiyun 				mips32_insn.r_format.opcode = cop1x_op;
168*4882a593Smuzhiyun 				mips32_insn.r_format.rs =
169*4882a593Smuzhiyun 					insn.mm_fp5_format.base;
170*4882a593Smuzhiyun 				mips32_insn.r_format.rt =
171*4882a593Smuzhiyun 					insn.mm_fp5_format.index;
172*4882a593Smuzhiyun 				mips32_insn.r_format.rd = 0;
173*4882a593Smuzhiyun 				mips32_insn.r_format.re = insn.mm_fp5_format.fd;
174*4882a593Smuzhiyun 				mips32_insn.r_format.func = func;
175*4882a593Smuzhiyun 			} else
176*4882a593Smuzhiyun 				return SIGILL;
177*4882a593Smuzhiyun 			break;
178*4882a593Smuzhiyun 		case mm_32f_40_op:
179*4882a593Smuzhiyun 			op = -1;	/* Invalid */
180*4882a593Smuzhiyun 			if (insn.mm_fp2_format.op == mm_fmovt_op)
181*4882a593Smuzhiyun 				op = 1;
182*4882a593Smuzhiyun 			else if (insn.mm_fp2_format.op == mm_fmovf_op)
183*4882a593Smuzhiyun 				op = 0;
184*4882a593Smuzhiyun 			if (op != -1) {
185*4882a593Smuzhiyun 				mips32_insn.fp0_format.opcode = cop1_op;
186*4882a593Smuzhiyun 				mips32_insn.fp0_format.fmt =
187*4882a593Smuzhiyun 					sdps_format[insn.mm_fp2_format.fmt];
188*4882a593Smuzhiyun 				mips32_insn.fp0_format.ft =
189*4882a593Smuzhiyun 					(insn.mm_fp2_format.cc<<2) + op;
190*4882a593Smuzhiyun 				mips32_insn.fp0_format.fs =
191*4882a593Smuzhiyun 					insn.mm_fp2_format.fs;
192*4882a593Smuzhiyun 				mips32_insn.fp0_format.fd =
193*4882a593Smuzhiyun 					insn.mm_fp2_format.fd;
194*4882a593Smuzhiyun 				mips32_insn.fp0_format.func = fmovc_op;
195*4882a593Smuzhiyun 			} else
196*4882a593Smuzhiyun 				return SIGILL;
197*4882a593Smuzhiyun 			break;
198*4882a593Smuzhiyun 		case mm_32f_60_op:
199*4882a593Smuzhiyun 			func = -1;	/* Invalid */
200*4882a593Smuzhiyun 			if (insn.mm_fp0_format.op == mm_fadd_op)
201*4882a593Smuzhiyun 				func = fadd_op;
202*4882a593Smuzhiyun 			else if (insn.mm_fp0_format.op == mm_fsub_op)
203*4882a593Smuzhiyun 				func = fsub_op;
204*4882a593Smuzhiyun 			else if (insn.mm_fp0_format.op == mm_fmul_op)
205*4882a593Smuzhiyun 				func = fmul_op;
206*4882a593Smuzhiyun 			else if (insn.mm_fp0_format.op == mm_fdiv_op)
207*4882a593Smuzhiyun 				func = fdiv_op;
208*4882a593Smuzhiyun 			if (func != -1) {
209*4882a593Smuzhiyun 				mips32_insn.fp0_format.opcode = cop1_op;
210*4882a593Smuzhiyun 				mips32_insn.fp0_format.fmt =
211*4882a593Smuzhiyun 					sdps_format[insn.mm_fp0_format.fmt];
212*4882a593Smuzhiyun 				mips32_insn.fp0_format.ft =
213*4882a593Smuzhiyun 					insn.mm_fp0_format.ft;
214*4882a593Smuzhiyun 				mips32_insn.fp0_format.fs =
215*4882a593Smuzhiyun 					insn.mm_fp0_format.fs;
216*4882a593Smuzhiyun 				mips32_insn.fp0_format.fd =
217*4882a593Smuzhiyun 					insn.mm_fp0_format.fd;
218*4882a593Smuzhiyun 				mips32_insn.fp0_format.func = func;
219*4882a593Smuzhiyun 			} else
220*4882a593Smuzhiyun 				return SIGILL;
221*4882a593Smuzhiyun 			break;
222*4882a593Smuzhiyun 		case mm_32f_70_op:
223*4882a593Smuzhiyun 			func = -1;	/* Invalid */
224*4882a593Smuzhiyun 			if (insn.mm_fp0_format.op == mm_fmovn_op)
225*4882a593Smuzhiyun 				func = fmovn_op;
226*4882a593Smuzhiyun 			else if (insn.mm_fp0_format.op == mm_fmovz_op)
227*4882a593Smuzhiyun 				func = fmovz_op;
228*4882a593Smuzhiyun 			if (func != -1) {
229*4882a593Smuzhiyun 				mips32_insn.fp0_format.opcode = cop1_op;
230*4882a593Smuzhiyun 				mips32_insn.fp0_format.fmt =
231*4882a593Smuzhiyun 					sdps_format[insn.mm_fp0_format.fmt];
232*4882a593Smuzhiyun 				mips32_insn.fp0_format.ft =
233*4882a593Smuzhiyun 					insn.mm_fp0_format.ft;
234*4882a593Smuzhiyun 				mips32_insn.fp0_format.fs =
235*4882a593Smuzhiyun 					insn.mm_fp0_format.fs;
236*4882a593Smuzhiyun 				mips32_insn.fp0_format.fd =
237*4882a593Smuzhiyun 					insn.mm_fp0_format.fd;
238*4882a593Smuzhiyun 				mips32_insn.fp0_format.func = func;
239*4882a593Smuzhiyun 			} else
240*4882a593Smuzhiyun 				return SIGILL;
241*4882a593Smuzhiyun 			break;
242*4882a593Smuzhiyun 		case mm_32f_73_op:    /* POOL32FXF */
243*4882a593Smuzhiyun 			switch (insn.mm_fp1_format.op) {
244*4882a593Smuzhiyun 			case mm_movf0_op:
245*4882a593Smuzhiyun 			case mm_movf1_op:
246*4882a593Smuzhiyun 			case mm_movt0_op:
247*4882a593Smuzhiyun 			case mm_movt1_op:
248*4882a593Smuzhiyun 				if ((insn.mm_fp1_format.op & 0x7f) ==
249*4882a593Smuzhiyun 				    mm_movf0_op)
250*4882a593Smuzhiyun 					op = 0;
251*4882a593Smuzhiyun 				else
252*4882a593Smuzhiyun 					op = 1;
253*4882a593Smuzhiyun 				mips32_insn.r_format.opcode = spec_op;
254*4882a593Smuzhiyun 				mips32_insn.r_format.rs = insn.mm_fp4_format.fs;
255*4882a593Smuzhiyun 				mips32_insn.r_format.rt =
256*4882a593Smuzhiyun 					(insn.mm_fp4_format.cc << 2) + op;
257*4882a593Smuzhiyun 				mips32_insn.r_format.rd = insn.mm_fp4_format.rt;
258*4882a593Smuzhiyun 				mips32_insn.r_format.re = 0;
259*4882a593Smuzhiyun 				mips32_insn.r_format.func = movc_op;
260*4882a593Smuzhiyun 				break;
261*4882a593Smuzhiyun 			case mm_fcvtd0_op:
262*4882a593Smuzhiyun 			case mm_fcvtd1_op:
263*4882a593Smuzhiyun 			case mm_fcvts0_op:
264*4882a593Smuzhiyun 			case mm_fcvts1_op:
265*4882a593Smuzhiyun 				if ((insn.mm_fp1_format.op & 0x7f) ==
266*4882a593Smuzhiyun 				    mm_fcvtd0_op) {
267*4882a593Smuzhiyun 					func = fcvtd_op;
268*4882a593Smuzhiyun 					fmt = swl_format[insn.mm_fp3_format.fmt];
269*4882a593Smuzhiyun 				} else {
270*4882a593Smuzhiyun 					func = fcvts_op;
271*4882a593Smuzhiyun 					fmt = dwl_format[insn.mm_fp3_format.fmt];
272*4882a593Smuzhiyun 				}
273*4882a593Smuzhiyun 				mips32_insn.fp0_format.opcode = cop1_op;
274*4882a593Smuzhiyun 				mips32_insn.fp0_format.fmt = fmt;
275*4882a593Smuzhiyun 				mips32_insn.fp0_format.ft = 0;
276*4882a593Smuzhiyun 				mips32_insn.fp0_format.fs =
277*4882a593Smuzhiyun 					insn.mm_fp3_format.fs;
278*4882a593Smuzhiyun 				mips32_insn.fp0_format.fd =
279*4882a593Smuzhiyun 					insn.mm_fp3_format.rt;
280*4882a593Smuzhiyun 				mips32_insn.fp0_format.func = func;
281*4882a593Smuzhiyun 				break;
282*4882a593Smuzhiyun 			case mm_fmov0_op:
283*4882a593Smuzhiyun 			case mm_fmov1_op:
284*4882a593Smuzhiyun 			case mm_fabs0_op:
285*4882a593Smuzhiyun 			case mm_fabs1_op:
286*4882a593Smuzhiyun 			case mm_fneg0_op:
287*4882a593Smuzhiyun 			case mm_fneg1_op:
288*4882a593Smuzhiyun 				if ((insn.mm_fp1_format.op & 0x7f) ==
289*4882a593Smuzhiyun 				    mm_fmov0_op)
290*4882a593Smuzhiyun 					func = fmov_op;
291*4882a593Smuzhiyun 				else if ((insn.mm_fp1_format.op & 0x7f) ==
292*4882a593Smuzhiyun 					 mm_fabs0_op)
293*4882a593Smuzhiyun 					func = fabs_op;
294*4882a593Smuzhiyun 				else
295*4882a593Smuzhiyun 					func = fneg_op;
296*4882a593Smuzhiyun 				mips32_insn.fp0_format.opcode = cop1_op;
297*4882a593Smuzhiyun 				mips32_insn.fp0_format.fmt =
298*4882a593Smuzhiyun 					sdps_format[insn.mm_fp3_format.fmt];
299*4882a593Smuzhiyun 				mips32_insn.fp0_format.ft = 0;
300*4882a593Smuzhiyun 				mips32_insn.fp0_format.fs =
301*4882a593Smuzhiyun 					insn.mm_fp3_format.fs;
302*4882a593Smuzhiyun 				mips32_insn.fp0_format.fd =
303*4882a593Smuzhiyun 					insn.mm_fp3_format.rt;
304*4882a593Smuzhiyun 				mips32_insn.fp0_format.func = func;
305*4882a593Smuzhiyun 				break;
306*4882a593Smuzhiyun 			case mm_ffloorl_op:
307*4882a593Smuzhiyun 			case mm_ffloorw_op:
308*4882a593Smuzhiyun 			case mm_fceill_op:
309*4882a593Smuzhiyun 			case mm_fceilw_op:
310*4882a593Smuzhiyun 			case mm_ftruncl_op:
311*4882a593Smuzhiyun 			case mm_ftruncw_op:
312*4882a593Smuzhiyun 			case mm_froundl_op:
313*4882a593Smuzhiyun 			case mm_froundw_op:
314*4882a593Smuzhiyun 			case mm_fcvtl_op:
315*4882a593Smuzhiyun 			case mm_fcvtw_op:
316*4882a593Smuzhiyun 				if (insn.mm_fp1_format.op == mm_ffloorl_op)
317*4882a593Smuzhiyun 					func = ffloorl_op;
318*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_ffloorw_op)
319*4882a593Smuzhiyun 					func = ffloor_op;
320*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_fceill_op)
321*4882a593Smuzhiyun 					func = fceill_op;
322*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_fceilw_op)
323*4882a593Smuzhiyun 					func = fceil_op;
324*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_ftruncl_op)
325*4882a593Smuzhiyun 					func = ftruncl_op;
326*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_ftruncw_op)
327*4882a593Smuzhiyun 					func = ftrunc_op;
328*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_froundl_op)
329*4882a593Smuzhiyun 					func = froundl_op;
330*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_froundw_op)
331*4882a593Smuzhiyun 					func = fround_op;
332*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_fcvtl_op)
333*4882a593Smuzhiyun 					func = fcvtl_op;
334*4882a593Smuzhiyun 				else
335*4882a593Smuzhiyun 					func = fcvtw_op;
336*4882a593Smuzhiyun 				mips32_insn.fp0_format.opcode = cop1_op;
337*4882a593Smuzhiyun 				mips32_insn.fp0_format.fmt =
338*4882a593Smuzhiyun 					sd_format[insn.mm_fp1_format.fmt];
339*4882a593Smuzhiyun 				mips32_insn.fp0_format.ft = 0;
340*4882a593Smuzhiyun 				mips32_insn.fp0_format.fs =
341*4882a593Smuzhiyun 					insn.mm_fp1_format.fs;
342*4882a593Smuzhiyun 				mips32_insn.fp0_format.fd =
343*4882a593Smuzhiyun 					insn.mm_fp1_format.rt;
344*4882a593Smuzhiyun 				mips32_insn.fp0_format.func = func;
345*4882a593Smuzhiyun 				break;
346*4882a593Smuzhiyun 			case mm_frsqrt_op:
347*4882a593Smuzhiyun 			case mm_fsqrt_op:
348*4882a593Smuzhiyun 			case mm_frecip_op:
349*4882a593Smuzhiyun 				if (insn.mm_fp1_format.op == mm_frsqrt_op)
350*4882a593Smuzhiyun 					func = frsqrt_op;
351*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_fsqrt_op)
352*4882a593Smuzhiyun 					func = fsqrt_op;
353*4882a593Smuzhiyun 				else
354*4882a593Smuzhiyun 					func = frecip_op;
355*4882a593Smuzhiyun 				mips32_insn.fp0_format.opcode = cop1_op;
356*4882a593Smuzhiyun 				mips32_insn.fp0_format.fmt =
357*4882a593Smuzhiyun 					sdps_format[insn.mm_fp1_format.fmt];
358*4882a593Smuzhiyun 				mips32_insn.fp0_format.ft = 0;
359*4882a593Smuzhiyun 				mips32_insn.fp0_format.fs =
360*4882a593Smuzhiyun 					insn.mm_fp1_format.fs;
361*4882a593Smuzhiyun 				mips32_insn.fp0_format.fd =
362*4882a593Smuzhiyun 					insn.mm_fp1_format.rt;
363*4882a593Smuzhiyun 				mips32_insn.fp0_format.func = func;
364*4882a593Smuzhiyun 				break;
365*4882a593Smuzhiyun 			case mm_mfc1_op:
366*4882a593Smuzhiyun 			case mm_mtc1_op:
367*4882a593Smuzhiyun 			case mm_cfc1_op:
368*4882a593Smuzhiyun 			case mm_ctc1_op:
369*4882a593Smuzhiyun 			case mm_mfhc1_op:
370*4882a593Smuzhiyun 			case mm_mthc1_op:
371*4882a593Smuzhiyun 				if (insn.mm_fp1_format.op == mm_mfc1_op)
372*4882a593Smuzhiyun 					op = mfc_op;
373*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_mtc1_op)
374*4882a593Smuzhiyun 					op = mtc_op;
375*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_cfc1_op)
376*4882a593Smuzhiyun 					op = cfc_op;
377*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_ctc1_op)
378*4882a593Smuzhiyun 					op = ctc_op;
379*4882a593Smuzhiyun 				else if (insn.mm_fp1_format.op == mm_mfhc1_op)
380*4882a593Smuzhiyun 					op = mfhc_op;
381*4882a593Smuzhiyun 				else
382*4882a593Smuzhiyun 					op = mthc_op;
383*4882a593Smuzhiyun 				mips32_insn.fp1_format.opcode = cop1_op;
384*4882a593Smuzhiyun 				mips32_insn.fp1_format.op = op;
385*4882a593Smuzhiyun 				mips32_insn.fp1_format.rt =
386*4882a593Smuzhiyun 					insn.mm_fp1_format.rt;
387*4882a593Smuzhiyun 				mips32_insn.fp1_format.fs =
388*4882a593Smuzhiyun 					insn.mm_fp1_format.fs;
389*4882a593Smuzhiyun 				mips32_insn.fp1_format.fd = 0;
390*4882a593Smuzhiyun 				mips32_insn.fp1_format.func = 0;
391*4882a593Smuzhiyun 				break;
392*4882a593Smuzhiyun 			default:
393*4882a593Smuzhiyun 				return SIGILL;
394*4882a593Smuzhiyun 			}
395*4882a593Smuzhiyun 			break;
396*4882a593Smuzhiyun 		case mm_32f_74_op:	/* c.cond.fmt */
397*4882a593Smuzhiyun 			mips32_insn.fp0_format.opcode = cop1_op;
398*4882a593Smuzhiyun 			mips32_insn.fp0_format.fmt =
399*4882a593Smuzhiyun 				sdps_format[insn.mm_fp4_format.fmt];
400*4882a593Smuzhiyun 			mips32_insn.fp0_format.ft = insn.mm_fp4_format.rt;
401*4882a593Smuzhiyun 			mips32_insn.fp0_format.fs = insn.mm_fp4_format.fs;
402*4882a593Smuzhiyun 			mips32_insn.fp0_format.fd = insn.mm_fp4_format.cc << 2;
403*4882a593Smuzhiyun 			mips32_insn.fp0_format.func =
404*4882a593Smuzhiyun 				insn.mm_fp4_format.cond | MM_MIPS32_COND_FC;
405*4882a593Smuzhiyun 			break;
406*4882a593Smuzhiyun 		default:
407*4882a593Smuzhiyun 			return SIGILL;
408*4882a593Smuzhiyun 		}
409*4882a593Smuzhiyun 		break;
410*4882a593Smuzhiyun 	default:
411*4882a593Smuzhiyun 		return SIGILL;
412*4882a593Smuzhiyun 	}
413*4882a593Smuzhiyun 
414*4882a593Smuzhiyun 	*insn_ptr = mips32_insn;
415*4882a593Smuzhiyun 	return 0;
416*4882a593Smuzhiyun }
417*4882a593Smuzhiyun 
418*4882a593Smuzhiyun /*
419*4882a593Smuzhiyun  * Redundant with logic already in kernel/branch.c,
420*4882a593Smuzhiyun  * embedded in compute_return_epc.  At some point,
421*4882a593Smuzhiyun  * a single subroutine should be used across both
422*4882a593Smuzhiyun  * modules.
423*4882a593Smuzhiyun  */
isBranchInstr(struct pt_regs * regs,struct mm_decoded_insn dec_insn,unsigned long * contpc)424*4882a593Smuzhiyun int isBranchInstr(struct pt_regs *regs, struct mm_decoded_insn dec_insn,
425*4882a593Smuzhiyun 		  unsigned long *contpc)
426*4882a593Smuzhiyun {
427*4882a593Smuzhiyun 	union mips_instruction insn = (union mips_instruction)dec_insn.insn;
428*4882a593Smuzhiyun 	unsigned int fcr31;
429*4882a593Smuzhiyun 	unsigned int bit = 0;
430*4882a593Smuzhiyun 	unsigned int bit0;
431*4882a593Smuzhiyun 	union fpureg *fpr;
432*4882a593Smuzhiyun 
433*4882a593Smuzhiyun 	switch (insn.i_format.opcode) {
434*4882a593Smuzhiyun 	case spec_op:
435*4882a593Smuzhiyun 		switch (insn.r_format.func) {
436*4882a593Smuzhiyun 		case jalr_op:
437*4882a593Smuzhiyun 			if (insn.r_format.rd != 0) {
438*4882a593Smuzhiyun 				regs->regs[insn.r_format.rd] =
439*4882a593Smuzhiyun 					regs->cp0_epc + dec_insn.pc_inc +
440*4882a593Smuzhiyun 					dec_insn.next_pc_inc;
441*4882a593Smuzhiyun 			}
442*4882a593Smuzhiyun 			fallthrough;
443*4882a593Smuzhiyun 		case jr_op:
444*4882a593Smuzhiyun 			/* For R6, JR already emulated in jalr_op */
445*4882a593Smuzhiyun 			if (NO_R6EMU && insn.r_format.func == jr_op)
446*4882a593Smuzhiyun 				break;
447*4882a593Smuzhiyun 			*contpc = regs->regs[insn.r_format.rs];
448*4882a593Smuzhiyun 			return 1;
449*4882a593Smuzhiyun 		}
450*4882a593Smuzhiyun 		break;
451*4882a593Smuzhiyun 	case bcond_op:
452*4882a593Smuzhiyun 		switch (insn.i_format.rt) {
453*4882a593Smuzhiyun 		case bltzal_op:
454*4882a593Smuzhiyun 		case bltzall_op:
455*4882a593Smuzhiyun 			if (NO_R6EMU && (insn.i_format.rs ||
456*4882a593Smuzhiyun 			    insn.i_format.rt == bltzall_op))
457*4882a593Smuzhiyun 				break;
458*4882a593Smuzhiyun 
459*4882a593Smuzhiyun 			regs->regs[31] = regs->cp0_epc +
460*4882a593Smuzhiyun 				dec_insn.pc_inc +
461*4882a593Smuzhiyun 				dec_insn.next_pc_inc;
462*4882a593Smuzhiyun 			fallthrough;
463*4882a593Smuzhiyun 		case bltzl_op:
464*4882a593Smuzhiyun 			if (NO_R6EMU)
465*4882a593Smuzhiyun 				break;
466*4882a593Smuzhiyun 			fallthrough;
467*4882a593Smuzhiyun 		case bltz_op:
468*4882a593Smuzhiyun 			if ((long)regs->regs[insn.i_format.rs] < 0)
469*4882a593Smuzhiyun 				*contpc = regs->cp0_epc +
470*4882a593Smuzhiyun 					dec_insn.pc_inc +
471*4882a593Smuzhiyun 					(insn.i_format.simmediate << 2);
472*4882a593Smuzhiyun 			else
473*4882a593Smuzhiyun 				*contpc = regs->cp0_epc +
474*4882a593Smuzhiyun 					dec_insn.pc_inc +
475*4882a593Smuzhiyun 					dec_insn.next_pc_inc;
476*4882a593Smuzhiyun 			return 1;
477*4882a593Smuzhiyun 		case bgezal_op:
478*4882a593Smuzhiyun 		case bgezall_op:
479*4882a593Smuzhiyun 			if (NO_R6EMU && (insn.i_format.rs ||
480*4882a593Smuzhiyun 			    insn.i_format.rt == bgezall_op))
481*4882a593Smuzhiyun 				break;
482*4882a593Smuzhiyun 
483*4882a593Smuzhiyun 			regs->regs[31] = regs->cp0_epc +
484*4882a593Smuzhiyun 				dec_insn.pc_inc +
485*4882a593Smuzhiyun 				dec_insn.next_pc_inc;
486*4882a593Smuzhiyun 			fallthrough;
487*4882a593Smuzhiyun 		case bgezl_op:
488*4882a593Smuzhiyun 			if (NO_R6EMU)
489*4882a593Smuzhiyun 				break;
490*4882a593Smuzhiyun 			fallthrough;
491*4882a593Smuzhiyun 		case bgez_op:
492*4882a593Smuzhiyun 			if ((long)regs->regs[insn.i_format.rs] >= 0)
493*4882a593Smuzhiyun 				*contpc = regs->cp0_epc +
494*4882a593Smuzhiyun 					dec_insn.pc_inc +
495*4882a593Smuzhiyun 					(insn.i_format.simmediate << 2);
496*4882a593Smuzhiyun 			else
497*4882a593Smuzhiyun 				*contpc = regs->cp0_epc +
498*4882a593Smuzhiyun 					dec_insn.pc_inc +
499*4882a593Smuzhiyun 					dec_insn.next_pc_inc;
500*4882a593Smuzhiyun 			return 1;
501*4882a593Smuzhiyun 		}
502*4882a593Smuzhiyun 		break;
503*4882a593Smuzhiyun 	case jalx_op:
504*4882a593Smuzhiyun 		set_isa16_mode(bit);
505*4882a593Smuzhiyun 		fallthrough;
506*4882a593Smuzhiyun 	case jal_op:
507*4882a593Smuzhiyun 		regs->regs[31] = regs->cp0_epc +
508*4882a593Smuzhiyun 			dec_insn.pc_inc +
509*4882a593Smuzhiyun 			dec_insn.next_pc_inc;
510*4882a593Smuzhiyun 		fallthrough;
511*4882a593Smuzhiyun 	case j_op:
512*4882a593Smuzhiyun 		*contpc = regs->cp0_epc + dec_insn.pc_inc;
513*4882a593Smuzhiyun 		*contpc >>= 28;
514*4882a593Smuzhiyun 		*contpc <<= 28;
515*4882a593Smuzhiyun 		*contpc |= (insn.j_format.target << 2);
516*4882a593Smuzhiyun 		/* Set microMIPS mode bit: XOR for jalx. */
517*4882a593Smuzhiyun 		*contpc ^= bit;
518*4882a593Smuzhiyun 		return 1;
519*4882a593Smuzhiyun 	case beql_op:
520*4882a593Smuzhiyun 		if (NO_R6EMU)
521*4882a593Smuzhiyun 			break;
522*4882a593Smuzhiyun 		fallthrough;
523*4882a593Smuzhiyun 	case beq_op:
524*4882a593Smuzhiyun 		if (regs->regs[insn.i_format.rs] ==
525*4882a593Smuzhiyun 		    regs->regs[insn.i_format.rt])
526*4882a593Smuzhiyun 			*contpc = regs->cp0_epc +
527*4882a593Smuzhiyun 				dec_insn.pc_inc +
528*4882a593Smuzhiyun 				(insn.i_format.simmediate << 2);
529*4882a593Smuzhiyun 		else
530*4882a593Smuzhiyun 			*contpc = regs->cp0_epc +
531*4882a593Smuzhiyun 				dec_insn.pc_inc +
532*4882a593Smuzhiyun 				dec_insn.next_pc_inc;
533*4882a593Smuzhiyun 		return 1;
534*4882a593Smuzhiyun 	case bnel_op:
535*4882a593Smuzhiyun 		if (NO_R6EMU)
536*4882a593Smuzhiyun 			break;
537*4882a593Smuzhiyun 		fallthrough;
538*4882a593Smuzhiyun 	case bne_op:
539*4882a593Smuzhiyun 		if (regs->regs[insn.i_format.rs] !=
540*4882a593Smuzhiyun 		    regs->regs[insn.i_format.rt])
541*4882a593Smuzhiyun 			*contpc = regs->cp0_epc +
542*4882a593Smuzhiyun 				dec_insn.pc_inc +
543*4882a593Smuzhiyun 				(insn.i_format.simmediate << 2);
544*4882a593Smuzhiyun 		else
545*4882a593Smuzhiyun 			*contpc = regs->cp0_epc +
546*4882a593Smuzhiyun 				dec_insn.pc_inc +
547*4882a593Smuzhiyun 				dec_insn.next_pc_inc;
548*4882a593Smuzhiyun 		return 1;
549*4882a593Smuzhiyun 	case blezl_op:
550*4882a593Smuzhiyun 		if (!insn.i_format.rt && NO_R6EMU)
551*4882a593Smuzhiyun 			break;
552*4882a593Smuzhiyun 		fallthrough;
553*4882a593Smuzhiyun 	case blez_op:
554*4882a593Smuzhiyun 
555*4882a593Smuzhiyun 		/*
556*4882a593Smuzhiyun 		 * Compact branches for R6 for the
557*4882a593Smuzhiyun 		 * blez and blezl opcodes.
558*4882a593Smuzhiyun 		 * BLEZ  | rs = 0 | rt != 0  == BLEZALC
559*4882a593Smuzhiyun 		 * BLEZ  | rs = rt != 0      == BGEZALC
560*4882a593Smuzhiyun 		 * BLEZ  | rs != 0 | rt != 0 == BGEUC
561*4882a593Smuzhiyun 		 * BLEZL | rs = 0 | rt != 0  == BLEZC
562*4882a593Smuzhiyun 		 * BLEZL | rs = rt != 0      == BGEZC
563*4882a593Smuzhiyun 		 * BLEZL | rs != 0 | rt != 0 == BGEC
564*4882a593Smuzhiyun 		 *
565*4882a593Smuzhiyun 		 * For real BLEZ{,L}, rt is always 0.
566*4882a593Smuzhiyun 		 */
567*4882a593Smuzhiyun 		if (cpu_has_mips_r6 && insn.i_format.rt) {
568*4882a593Smuzhiyun 			if ((insn.i_format.opcode == blez_op) &&
569*4882a593Smuzhiyun 			    ((!insn.i_format.rs && insn.i_format.rt) ||
570*4882a593Smuzhiyun 			     (insn.i_format.rs == insn.i_format.rt)))
571*4882a593Smuzhiyun 				regs->regs[31] = regs->cp0_epc +
572*4882a593Smuzhiyun 					dec_insn.pc_inc;
573*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + dec_insn.pc_inc +
574*4882a593Smuzhiyun 				dec_insn.next_pc_inc;
575*4882a593Smuzhiyun 
576*4882a593Smuzhiyun 			return 1;
577*4882a593Smuzhiyun 		}
578*4882a593Smuzhiyun 		if ((long)regs->regs[insn.i_format.rs] <= 0)
579*4882a593Smuzhiyun 			*contpc = regs->cp0_epc +
580*4882a593Smuzhiyun 				dec_insn.pc_inc +
581*4882a593Smuzhiyun 				(insn.i_format.simmediate << 2);
582*4882a593Smuzhiyun 		else
583*4882a593Smuzhiyun 			*contpc = regs->cp0_epc +
584*4882a593Smuzhiyun 				dec_insn.pc_inc +
585*4882a593Smuzhiyun 				dec_insn.next_pc_inc;
586*4882a593Smuzhiyun 		return 1;
587*4882a593Smuzhiyun 	case bgtzl_op:
588*4882a593Smuzhiyun 		if (!insn.i_format.rt && NO_R6EMU)
589*4882a593Smuzhiyun 			break;
590*4882a593Smuzhiyun 		fallthrough;
591*4882a593Smuzhiyun 	case bgtz_op:
592*4882a593Smuzhiyun 		/*
593*4882a593Smuzhiyun 		 * Compact branches for R6 for the
594*4882a593Smuzhiyun 		 * bgtz and bgtzl opcodes.
595*4882a593Smuzhiyun 		 * BGTZ  | rs = 0 | rt != 0  == BGTZALC
596*4882a593Smuzhiyun 		 * BGTZ  | rs = rt != 0      == BLTZALC
597*4882a593Smuzhiyun 		 * BGTZ  | rs != 0 | rt != 0 == BLTUC
598*4882a593Smuzhiyun 		 * BGTZL | rs = 0 | rt != 0  == BGTZC
599*4882a593Smuzhiyun 		 * BGTZL | rs = rt != 0      == BLTZC
600*4882a593Smuzhiyun 		 * BGTZL | rs != 0 | rt != 0 == BLTC
601*4882a593Smuzhiyun 		 *
602*4882a593Smuzhiyun 		 * *ZALC varint for BGTZ &&& rt != 0
603*4882a593Smuzhiyun 		 * For real GTZ{,L}, rt is always 0.
604*4882a593Smuzhiyun 		 */
605*4882a593Smuzhiyun 		if (cpu_has_mips_r6 && insn.i_format.rt) {
606*4882a593Smuzhiyun 			if ((insn.i_format.opcode == blez_op) &&
607*4882a593Smuzhiyun 			    ((!insn.i_format.rs && insn.i_format.rt) ||
608*4882a593Smuzhiyun 			     (insn.i_format.rs == insn.i_format.rt)))
609*4882a593Smuzhiyun 				regs->regs[31] = regs->cp0_epc +
610*4882a593Smuzhiyun 					dec_insn.pc_inc;
611*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + dec_insn.pc_inc +
612*4882a593Smuzhiyun 				dec_insn.next_pc_inc;
613*4882a593Smuzhiyun 
614*4882a593Smuzhiyun 			return 1;
615*4882a593Smuzhiyun 		}
616*4882a593Smuzhiyun 
617*4882a593Smuzhiyun 		if ((long)regs->regs[insn.i_format.rs] > 0)
618*4882a593Smuzhiyun 			*contpc = regs->cp0_epc +
619*4882a593Smuzhiyun 				dec_insn.pc_inc +
620*4882a593Smuzhiyun 				(insn.i_format.simmediate << 2);
621*4882a593Smuzhiyun 		else
622*4882a593Smuzhiyun 			*contpc = regs->cp0_epc +
623*4882a593Smuzhiyun 				dec_insn.pc_inc +
624*4882a593Smuzhiyun 				dec_insn.next_pc_inc;
625*4882a593Smuzhiyun 		return 1;
626*4882a593Smuzhiyun 	case pop10_op:
627*4882a593Smuzhiyun 	case pop30_op:
628*4882a593Smuzhiyun 		if (!cpu_has_mips_r6)
629*4882a593Smuzhiyun 			break;
630*4882a593Smuzhiyun 		if (insn.i_format.rt && !insn.i_format.rs)
631*4882a593Smuzhiyun 			regs->regs[31] = regs->cp0_epc + 4;
632*4882a593Smuzhiyun 		*contpc = regs->cp0_epc + dec_insn.pc_inc +
633*4882a593Smuzhiyun 			dec_insn.next_pc_inc;
634*4882a593Smuzhiyun 
635*4882a593Smuzhiyun 		return 1;
636*4882a593Smuzhiyun #ifdef CONFIG_CPU_CAVIUM_OCTEON
637*4882a593Smuzhiyun 	case lwc2_op: /* This is bbit0 on Octeon */
638*4882a593Smuzhiyun 		if ((regs->regs[insn.i_format.rs] & (1ull<<insn.i_format.rt)) == 0)
639*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + 4 + (insn.i_format.simmediate << 2);
640*4882a593Smuzhiyun 		else
641*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + 8;
642*4882a593Smuzhiyun 		return 1;
643*4882a593Smuzhiyun 	case ldc2_op: /* This is bbit032 on Octeon */
644*4882a593Smuzhiyun 		if ((regs->regs[insn.i_format.rs] & (1ull<<(insn.i_format.rt + 32))) == 0)
645*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + 4 + (insn.i_format.simmediate << 2);
646*4882a593Smuzhiyun 		else
647*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + 8;
648*4882a593Smuzhiyun 		return 1;
649*4882a593Smuzhiyun 	case swc2_op: /* This is bbit1 on Octeon */
650*4882a593Smuzhiyun 		if (regs->regs[insn.i_format.rs] & (1ull<<insn.i_format.rt))
651*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + 4 + (insn.i_format.simmediate << 2);
652*4882a593Smuzhiyun 		else
653*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + 8;
654*4882a593Smuzhiyun 		return 1;
655*4882a593Smuzhiyun 	case sdc2_op: /* This is bbit132 on Octeon */
656*4882a593Smuzhiyun 		if (regs->regs[insn.i_format.rs] & (1ull<<(insn.i_format.rt + 32)))
657*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + 4 + (insn.i_format.simmediate << 2);
658*4882a593Smuzhiyun 		else
659*4882a593Smuzhiyun 			*contpc = regs->cp0_epc + 8;
660*4882a593Smuzhiyun 		return 1;
661*4882a593Smuzhiyun #else
662*4882a593Smuzhiyun 	case bc6_op:
663*4882a593Smuzhiyun 		/*
664*4882a593Smuzhiyun 		 * Only valid for MIPS R6 but we can still end up
665*4882a593Smuzhiyun 		 * here from a broken userland so just tell emulator
666*4882a593Smuzhiyun 		 * this is not a branch and let it break later on.
667*4882a593Smuzhiyun 		 */
668*4882a593Smuzhiyun 		if  (!cpu_has_mips_r6)
669*4882a593Smuzhiyun 			break;
670*4882a593Smuzhiyun 		*contpc = regs->cp0_epc + dec_insn.pc_inc +
671*4882a593Smuzhiyun 			dec_insn.next_pc_inc;
672*4882a593Smuzhiyun 
673*4882a593Smuzhiyun 		return 1;
674*4882a593Smuzhiyun 	case balc6_op:
675*4882a593Smuzhiyun 		if (!cpu_has_mips_r6)
676*4882a593Smuzhiyun 			break;
677*4882a593Smuzhiyun 		regs->regs[31] = regs->cp0_epc + 4;
678*4882a593Smuzhiyun 		*contpc = regs->cp0_epc + dec_insn.pc_inc +
679*4882a593Smuzhiyun 			dec_insn.next_pc_inc;
680*4882a593Smuzhiyun 
681*4882a593Smuzhiyun 		return 1;
682*4882a593Smuzhiyun 	case pop66_op:
683*4882a593Smuzhiyun 		if (!cpu_has_mips_r6)
684*4882a593Smuzhiyun 			break;
685*4882a593Smuzhiyun 		*contpc = regs->cp0_epc + dec_insn.pc_inc +
686*4882a593Smuzhiyun 			dec_insn.next_pc_inc;
687*4882a593Smuzhiyun 
688*4882a593Smuzhiyun 		return 1;
689*4882a593Smuzhiyun 	case pop76_op:
690*4882a593Smuzhiyun 		if (!cpu_has_mips_r6)
691*4882a593Smuzhiyun 			break;
692*4882a593Smuzhiyun 		if (!insn.i_format.rs)
693*4882a593Smuzhiyun 			regs->regs[31] = regs->cp0_epc + 4;
694*4882a593Smuzhiyun 		*contpc = regs->cp0_epc + dec_insn.pc_inc +
695*4882a593Smuzhiyun 			dec_insn.next_pc_inc;
696*4882a593Smuzhiyun 
697*4882a593Smuzhiyun 		return 1;
698*4882a593Smuzhiyun #endif
699*4882a593Smuzhiyun 	case cop0_op:
700*4882a593Smuzhiyun 	case cop1_op:
701*4882a593Smuzhiyun 		/* Need to check for R6 bc1nez and bc1eqz branches */
702*4882a593Smuzhiyun 		if (cpu_has_mips_r6 &&
703*4882a593Smuzhiyun 		    ((insn.i_format.rs == bc1eqz_op) ||
704*4882a593Smuzhiyun 		     (insn.i_format.rs == bc1nez_op))) {
705*4882a593Smuzhiyun 			bit = 0;
706*4882a593Smuzhiyun 			fpr = &current->thread.fpu.fpr[insn.i_format.rt];
707*4882a593Smuzhiyun 			bit0 = get_fpr32(fpr, 0) & 0x1;
708*4882a593Smuzhiyun 			switch (insn.i_format.rs) {
709*4882a593Smuzhiyun 			case bc1eqz_op:
710*4882a593Smuzhiyun 				bit = bit0 == 0;
711*4882a593Smuzhiyun 				break;
712*4882a593Smuzhiyun 			case bc1nez_op:
713*4882a593Smuzhiyun 				bit = bit0 != 0;
714*4882a593Smuzhiyun 				break;
715*4882a593Smuzhiyun 			}
716*4882a593Smuzhiyun 			if (bit)
717*4882a593Smuzhiyun 				*contpc = regs->cp0_epc +
718*4882a593Smuzhiyun 					dec_insn.pc_inc +
719*4882a593Smuzhiyun 					(insn.i_format.simmediate << 2);
720*4882a593Smuzhiyun 			else
721*4882a593Smuzhiyun 				*contpc = regs->cp0_epc +
722*4882a593Smuzhiyun 					dec_insn.pc_inc +
723*4882a593Smuzhiyun 					dec_insn.next_pc_inc;
724*4882a593Smuzhiyun 
725*4882a593Smuzhiyun 			return 1;
726*4882a593Smuzhiyun 		}
727*4882a593Smuzhiyun 		/* R2/R6 compatible cop1 instruction */
728*4882a593Smuzhiyun 		fallthrough;
729*4882a593Smuzhiyun 	case cop2_op:
730*4882a593Smuzhiyun 	case cop1x_op:
731*4882a593Smuzhiyun 		if (insn.i_format.rs == bc_op) {
732*4882a593Smuzhiyun 			preempt_disable();
733*4882a593Smuzhiyun 			if (is_fpu_owner())
734*4882a593Smuzhiyun 			        fcr31 = read_32bit_cp1_register(CP1_STATUS);
735*4882a593Smuzhiyun 			else
736*4882a593Smuzhiyun 				fcr31 = current->thread.fpu.fcr31;
737*4882a593Smuzhiyun 			preempt_enable();
738*4882a593Smuzhiyun 
739*4882a593Smuzhiyun 			bit = (insn.i_format.rt >> 2);
740*4882a593Smuzhiyun 			bit += (bit != 0);
741*4882a593Smuzhiyun 			bit += 23;
742*4882a593Smuzhiyun 			switch (insn.i_format.rt & 3) {
743*4882a593Smuzhiyun 			case 0:	/* bc1f */
744*4882a593Smuzhiyun 			case 2:	/* bc1fl */
745*4882a593Smuzhiyun 				if (~fcr31 & (1 << bit))
746*4882a593Smuzhiyun 					*contpc = regs->cp0_epc +
747*4882a593Smuzhiyun 						dec_insn.pc_inc +
748*4882a593Smuzhiyun 						(insn.i_format.simmediate << 2);
749*4882a593Smuzhiyun 				else
750*4882a593Smuzhiyun 					*contpc = regs->cp0_epc +
751*4882a593Smuzhiyun 						dec_insn.pc_inc +
752*4882a593Smuzhiyun 						dec_insn.next_pc_inc;
753*4882a593Smuzhiyun 				return 1;
754*4882a593Smuzhiyun 			case 1:	/* bc1t */
755*4882a593Smuzhiyun 			case 3:	/* bc1tl */
756*4882a593Smuzhiyun 				if (fcr31 & (1 << bit))
757*4882a593Smuzhiyun 					*contpc = regs->cp0_epc +
758*4882a593Smuzhiyun 						dec_insn.pc_inc +
759*4882a593Smuzhiyun 						(insn.i_format.simmediate << 2);
760*4882a593Smuzhiyun 				else
761*4882a593Smuzhiyun 					*contpc = regs->cp0_epc +
762*4882a593Smuzhiyun 						dec_insn.pc_inc +
763*4882a593Smuzhiyun 						dec_insn.next_pc_inc;
764*4882a593Smuzhiyun 				return 1;
765*4882a593Smuzhiyun 			}
766*4882a593Smuzhiyun 		}
767*4882a593Smuzhiyun 		break;
768*4882a593Smuzhiyun 	}
769*4882a593Smuzhiyun 	return 0;
770*4882a593Smuzhiyun }
771*4882a593Smuzhiyun 
772*4882a593Smuzhiyun /*
773*4882a593Smuzhiyun  * In the Linux kernel, we support selection of FPR format on the
774*4882a593Smuzhiyun  * basis of the Status.FR bit.	If an FPU is not present, the FR bit
775*4882a593Smuzhiyun  * is hardwired to zero, which would imply a 32-bit FPU even for
776*4882a593Smuzhiyun  * 64-bit CPUs so we rather look at TIF_32BIT_FPREGS.
777*4882a593Smuzhiyun  * FPU emu is slow and bulky and optimizing this function offers fairly
778*4882a593Smuzhiyun  * sizeable benefits so we try to be clever and make this function return
779*4882a593Smuzhiyun  * a constant whenever possible, that is on 64-bit kernels without O32
780*4882a593Smuzhiyun  * compatibility enabled and on 32-bit without 64-bit FPU support.
781*4882a593Smuzhiyun  */
cop1_64bit(struct pt_regs * xcp)782*4882a593Smuzhiyun static inline int cop1_64bit(struct pt_regs *xcp)
783*4882a593Smuzhiyun {
784*4882a593Smuzhiyun 	if (IS_ENABLED(CONFIG_64BIT) && !IS_ENABLED(CONFIG_MIPS32_O32))
785*4882a593Smuzhiyun 		return 1;
786*4882a593Smuzhiyun 	else if (IS_ENABLED(CONFIG_32BIT) &&
787*4882a593Smuzhiyun 		 !IS_ENABLED(CONFIG_MIPS_O32_FP64_SUPPORT))
788*4882a593Smuzhiyun 		return 0;
789*4882a593Smuzhiyun 
790*4882a593Smuzhiyun 	return !test_thread_flag(TIF_32BIT_FPREGS);
791*4882a593Smuzhiyun }
792*4882a593Smuzhiyun 
hybrid_fprs(void)793*4882a593Smuzhiyun static inline bool hybrid_fprs(void)
794*4882a593Smuzhiyun {
795*4882a593Smuzhiyun 	return test_thread_flag(TIF_HYBRID_FPREGS);
796*4882a593Smuzhiyun }
797*4882a593Smuzhiyun 
798*4882a593Smuzhiyun #define SIFROMREG(si, x)						\
799*4882a593Smuzhiyun do {									\
800*4882a593Smuzhiyun 	if (cop1_64bit(xcp) && !hybrid_fprs())				\
801*4882a593Smuzhiyun 		(si) = (int)get_fpr32(&ctx->fpr[x], 0);			\
802*4882a593Smuzhiyun 	else								\
803*4882a593Smuzhiyun 		(si) = (int)get_fpr32(&ctx->fpr[(x) & ~1], (x) & 1);	\
804*4882a593Smuzhiyun } while (0)
805*4882a593Smuzhiyun 
806*4882a593Smuzhiyun #define SITOREG(si, x)							\
807*4882a593Smuzhiyun do {									\
808*4882a593Smuzhiyun 	if (cop1_64bit(xcp) && !hybrid_fprs()) {			\
809*4882a593Smuzhiyun 		unsigned int i;						\
810*4882a593Smuzhiyun 		set_fpr32(&ctx->fpr[x], 0, si);				\
811*4882a593Smuzhiyun 		for (i = 1; i < ARRAY_SIZE(ctx->fpr[x].val32); i++)	\
812*4882a593Smuzhiyun 			set_fpr32(&ctx->fpr[x], i, 0);			\
813*4882a593Smuzhiyun 	} else {							\
814*4882a593Smuzhiyun 		set_fpr32(&ctx->fpr[(x) & ~1], (x) & 1, si);		\
815*4882a593Smuzhiyun 	}								\
816*4882a593Smuzhiyun } while (0)
817*4882a593Smuzhiyun 
818*4882a593Smuzhiyun #define SIFROMHREG(si, x)	((si) = (int)get_fpr32(&ctx->fpr[x], 1))
819*4882a593Smuzhiyun 
820*4882a593Smuzhiyun #define SITOHREG(si, x)							\
821*4882a593Smuzhiyun do {									\
822*4882a593Smuzhiyun 	unsigned int i;							\
823*4882a593Smuzhiyun 	set_fpr32(&ctx->fpr[x], 1, si);					\
824*4882a593Smuzhiyun 	for (i = 2; i < ARRAY_SIZE(ctx->fpr[x].val32); i++)		\
825*4882a593Smuzhiyun 		set_fpr32(&ctx->fpr[x], i, 0);				\
826*4882a593Smuzhiyun } while (0)
827*4882a593Smuzhiyun 
828*4882a593Smuzhiyun #define DIFROMREG(di, x)						\
829*4882a593Smuzhiyun 	((di) = get_fpr64(&ctx->fpr[(x) & ~(cop1_64bit(xcp) ^ 1)], 0))
830*4882a593Smuzhiyun 
831*4882a593Smuzhiyun #define DITOREG(di, x)							\
832*4882a593Smuzhiyun do {									\
833*4882a593Smuzhiyun 	unsigned int fpr, i;						\
834*4882a593Smuzhiyun 	fpr = (x) & ~(cop1_64bit(xcp) ^ 1);				\
835*4882a593Smuzhiyun 	set_fpr64(&ctx->fpr[fpr], 0, di);				\
836*4882a593Smuzhiyun 	for (i = 1; i < ARRAY_SIZE(ctx->fpr[x].val64); i++)		\
837*4882a593Smuzhiyun 		set_fpr64(&ctx->fpr[fpr], i, 0);			\
838*4882a593Smuzhiyun } while (0)
839*4882a593Smuzhiyun 
840*4882a593Smuzhiyun #define SPFROMREG(sp, x) SIFROMREG((sp).bits, x)
841*4882a593Smuzhiyun #define SPTOREG(sp, x)	SITOREG((sp).bits, x)
842*4882a593Smuzhiyun #define DPFROMREG(dp, x)	DIFROMREG((dp).bits, x)
843*4882a593Smuzhiyun #define DPTOREG(dp, x)	DITOREG((dp).bits, x)
844*4882a593Smuzhiyun 
845*4882a593Smuzhiyun /*
846*4882a593Smuzhiyun  * Emulate a CFC1 instruction.
847*4882a593Smuzhiyun  */
cop1_cfc(struct pt_regs * xcp,struct mips_fpu_struct * ctx,mips_instruction ir)848*4882a593Smuzhiyun static inline void cop1_cfc(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
849*4882a593Smuzhiyun 			    mips_instruction ir)
850*4882a593Smuzhiyun {
851*4882a593Smuzhiyun 	u32 fcr31 = ctx->fcr31;
852*4882a593Smuzhiyun 	u32 value = 0;
853*4882a593Smuzhiyun 
854*4882a593Smuzhiyun 	switch (MIPSInst_RD(ir)) {
855*4882a593Smuzhiyun 	case FPCREG_CSR:
856*4882a593Smuzhiyun 		value = fcr31;
857*4882a593Smuzhiyun 		pr_debug("%p gpr[%d]<-csr=%08x\n",
858*4882a593Smuzhiyun 			 (void *)xcp->cp0_epc, MIPSInst_RT(ir), value);
859*4882a593Smuzhiyun 		break;
860*4882a593Smuzhiyun 
861*4882a593Smuzhiyun 	case FPCREG_FENR:
862*4882a593Smuzhiyun 		if (!cpu_has_mips_r)
863*4882a593Smuzhiyun 			break;
864*4882a593Smuzhiyun 		value = (fcr31 >> (FPU_CSR_FS_S - MIPS_FENR_FS_S)) &
865*4882a593Smuzhiyun 			MIPS_FENR_FS;
866*4882a593Smuzhiyun 		value |= fcr31 & (FPU_CSR_ALL_E | FPU_CSR_RM);
867*4882a593Smuzhiyun 		pr_debug("%p gpr[%d]<-enr=%08x\n",
868*4882a593Smuzhiyun 			 (void *)xcp->cp0_epc, MIPSInst_RT(ir), value);
869*4882a593Smuzhiyun 		break;
870*4882a593Smuzhiyun 
871*4882a593Smuzhiyun 	case FPCREG_FEXR:
872*4882a593Smuzhiyun 		if (!cpu_has_mips_r)
873*4882a593Smuzhiyun 			break;
874*4882a593Smuzhiyun 		value = fcr31 & (FPU_CSR_ALL_X | FPU_CSR_ALL_S);
875*4882a593Smuzhiyun 		pr_debug("%p gpr[%d]<-exr=%08x\n",
876*4882a593Smuzhiyun 			 (void *)xcp->cp0_epc, MIPSInst_RT(ir), value);
877*4882a593Smuzhiyun 		break;
878*4882a593Smuzhiyun 
879*4882a593Smuzhiyun 	case FPCREG_FCCR:
880*4882a593Smuzhiyun 		if (!cpu_has_mips_r)
881*4882a593Smuzhiyun 			break;
882*4882a593Smuzhiyun 		value = (fcr31 >> (FPU_CSR_COND_S - MIPS_FCCR_COND0_S)) &
883*4882a593Smuzhiyun 			MIPS_FCCR_COND0;
884*4882a593Smuzhiyun 		value |= (fcr31 >> (FPU_CSR_COND1_S - MIPS_FCCR_COND1_S)) &
885*4882a593Smuzhiyun 			 (MIPS_FCCR_CONDX & ~MIPS_FCCR_COND0);
886*4882a593Smuzhiyun 		pr_debug("%p gpr[%d]<-ccr=%08x\n",
887*4882a593Smuzhiyun 			 (void *)xcp->cp0_epc, MIPSInst_RT(ir), value);
888*4882a593Smuzhiyun 		break;
889*4882a593Smuzhiyun 
890*4882a593Smuzhiyun 	case FPCREG_RID:
891*4882a593Smuzhiyun 		value = boot_cpu_data.fpu_id;
892*4882a593Smuzhiyun 		break;
893*4882a593Smuzhiyun 
894*4882a593Smuzhiyun 	default:
895*4882a593Smuzhiyun 		break;
896*4882a593Smuzhiyun 	}
897*4882a593Smuzhiyun 
898*4882a593Smuzhiyun 	if (MIPSInst_RT(ir))
899*4882a593Smuzhiyun 		xcp->regs[MIPSInst_RT(ir)] = value;
900*4882a593Smuzhiyun }
901*4882a593Smuzhiyun 
902*4882a593Smuzhiyun /*
903*4882a593Smuzhiyun  * Emulate a CTC1 instruction.
904*4882a593Smuzhiyun  */
cop1_ctc(struct pt_regs * xcp,struct mips_fpu_struct * ctx,mips_instruction ir)905*4882a593Smuzhiyun static inline void cop1_ctc(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
906*4882a593Smuzhiyun 			    mips_instruction ir)
907*4882a593Smuzhiyun {
908*4882a593Smuzhiyun 	u32 fcr31 = ctx->fcr31;
909*4882a593Smuzhiyun 	u32 value;
910*4882a593Smuzhiyun 	u32 mask;
911*4882a593Smuzhiyun 
912*4882a593Smuzhiyun 	if (MIPSInst_RT(ir) == 0)
913*4882a593Smuzhiyun 		value = 0;
914*4882a593Smuzhiyun 	else
915*4882a593Smuzhiyun 		value = xcp->regs[MIPSInst_RT(ir)];
916*4882a593Smuzhiyun 
917*4882a593Smuzhiyun 	switch (MIPSInst_RD(ir)) {
918*4882a593Smuzhiyun 	case FPCREG_CSR:
919*4882a593Smuzhiyun 		pr_debug("%p gpr[%d]->csr=%08x\n",
920*4882a593Smuzhiyun 			 (void *)xcp->cp0_epc, MIPSInst_RT(ir), value);
921*4882a593Smuzhiyun 
922*4882a593Smuzhiyun 		/* Preserve read-only bits.  */
923*4882a593Smuzhiyun 		mask = boot_cpu_data.fpu_msk31;
924*4882a593Smuzhiyun 		fcr31 = (value & ~mask) | (fcr31 & mask);
925*4882a593Smuzhiyun 		break;
926*4882a593Smuzhiyun 
927*4882a593Smuzhiyun 	case FPCREG_FENR:
928*4882a593Smuzhiyun 		if (!cpu_has_mips_r)
929*4882a593Smuzhiyun 			break;
930*4882a593Smuzhiyun 		pr_debug("%p gpr[%d]->enr=%08x\n",
931*4882a593Smuzhiyun 			 (void *)xcp->cp0_epc, MIPSInst_RT(ir), value);
932*4882a593Smuzhiyun 		fcr31 &= ~(FPU_CSR_FS | FPU_CSR_ALL_E | FPU_CSR_RM);
933*4882a593Smuzhiyun 		fcr31 |= (value << (FPU_CSR_FS_S - MIPS_FENR_FS_S)) &
934*4882a593Smuzhiyun 			 FPU_CSR_FS;
935*4882a593Smuzhiyun 		fcr31 |= value & (FPU_CSR_ALL_E | FPU_CSR_RM);
936*4882a593Smuzhiyun 		break;
937*4882a593Smuzhiyun 
938*4882a593Smuzhiyun 	case FPCREG_FEXR:
939*4882a593Smuzhiyun 		if (!cpu_has_mips_r)
940*4882a593Smuzhiyun 			break;
941*4882a593Smuzhiyun 		pr_debug("%p gpr[%d]->exr=%08x\n",
942*4882a593Smuzhiyun 			 (void *)xcp->cp0_epc, MIPSInst_RT(ir), value);
943*4882a593Smuzhiyun 		fcr31 &= ~(FPU_CSR_ALL_X | FPU_CSR_ALL_S);
944*4882a593Smuzhiyun 		fcr31 |= value & (FPU_CSR_ALL_X | FPU_CSR_ALL_S);
945*4882a593Smuzhiyun 		break;
946*4882a593Smuzhiyun 
947*4882a593Smuzhiyun 	case FPCREG_FCCR:
948*4882a593Smuzhiyun 		if (!cpu_has_mips_r)
949*4882a593Smuzhiyun 			break;
950*4882a593Smuzhiyun 		pr_debug("%p gpr[%d]->ccr=%08x\n",
951*4882a593Smuzhiyun 			 (void *)xcp->cp0_epc, MIPSInst_RT(ir), value);
952*4882a593Smuzhiyun 		fcr31 &= ~(FPU_CSR_CONDX | FPU_CSR_COND);
953*4882a593Smuzhiyun 		fcr31 |= (value << (FPU_CSR_COND_S - MIPS_FCCR_COND0_S)) &
954*4882a593Smuzhiyun 			 FPU_CSR_COND;
955*4882a593Smuzhiyun 		fcr31 |= (value << (FPU_CSR_COND1_S - MIPS_FCCR_COND1_S)) &
956*4882a593Smuzhiyun 			 FPU_CSR_CONDX;
957*4882a593Smuzhiyun 		break;
958*4882a593Smuzhiyun 
959*4882a593Smuzhiyun 	default:
960*4882a593Smuzhiyun 		break;
961*4882a593Smuzhiyun 	}
962*4882a593Smuzhiyun 
963*4882a593Smuzhiyun 	ctx->fcr31 = fcr31;
964*4882a593Smuzhiyun }
965*4882a593Smuzhiyun 
966*4882a593Smuzhiyun /*
967*4882a593Smuzhiyun  * Emulate the single floating point instruction pointed at by EPC.
968*4882a593Smuzhiyun  * Two instructions if the instruction is in a branch delay slot.
969*4882a593Smuzhiyun  */
970*4882a593Smuzhiyun 
cop1Emulate(struct pt_regs * xcp,struct mips_fpu_struct * ctx,struct mm_decoded_insn dec_insn,void __user ** fault_addr)971*4882a593Smuzhiyun static int cop1Emulate(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
972*4882a593Smuzhiyun 		struct mm_decoded_insn dec_insn, void __user **fault_addr)
973*4882a593Smuzhiyun {
974*4882a593Smuzhiyun 	unsigned long contpc = xcp->cp0_epc + dec_insn.pc_inc;
975*4882a593Smuzhiyun 	unsigned int cond, cbit, bit0;
976*4882a593Smuzhiyun 	mips_instruction ir;
977*4882a593Smuzhiyun 	int likely, pc_inc;
978*4882a593Smuzhiyun 	union fpureg *fpr;
979*4882a593Smuzhiyun 	u32 __user *wva;
980*4882a593Smuzhiyun 	u64 __user *dva;
981*4882a593Smuzhiyun 	u32 wval;
982*4882a593Smuzhiyun 	u64 dval;
983*4882a593Smuzhiyun 	int sig;
984*4882a593Smuzhiyun 
985*4882a593Smuzhiyun 	/*
986*4882a593Smuzhiyun 	 * These are giving gcc a gentle hint about what to expect in
987*4882a593Smuzhiyun 	 * dec_inst in order to do better optimization.
988*4882a593Smuzhiyun 	 */
989*4882a593Smuzhiyun 	if (!cpu_has_mmips && dec_insn.micro_mips_mode)
990*4882a593Smuzhiyun 		unreachable();
991*4882a593Smuzhiyun 
992*4882a593Smuzhiyun 	/* XXX NEC Vr54xx bug workaround */
993*4882a593Smuzhiyun 	if (delay_slot(xcp)) {
994*4882a593Smuzhiyun 		if (dec_insn.micro_mips_mode) {
995*4882a593Smuzhiyun 			if (!mm_isBranchInstr(xcp, dec_insn, &contpc))
996*4882a593Smuzhiyun 				clear_delay_slot(xcp);
997*4882a593Smuzhiyun 		} else {
998*4882a593Smuzhiyun 			if (!isBranchInstr(xcp, dec_insn, &contpc))
999*4882a593Smuzhiyun 				clear_delay_slot(xcp);
1000*4882a593Smuzhiyun 		}
1001*4882a593Smuzhiyun 	}
1002*4882a593Smuzhiyun 
1003*4882a593Smuzhiyun 	if (delay_slot(xcp)) {
1004*4882a593Smuzhiyun 		/*
1005*4882a593Smuzhiyun 		 * The instruction to be emulated is in a branch delay slot
1006*4882a593Smuzhiyun 		 * which means that we have to	emulate the branch instruction
1007*4882a593Smuzhiyun 		 * BEFORE we do the cop1 instruction.
1008*4882a593Smuzhiyun 		 *
1009*4882a593Smuzhiyun 		 * This branch could be a COP1 branch, but in that case we
1010*4882a593Smuzhiyun 		 * would have had a trap for that instruction, and would not
1011*4882a593Smuzhiyun 		 * come through this route.
1012*4882a593Smuzhiyun 		 *
1013*4882a593Smuzhiyun 		 * Linux MIPS branch emulator operates on context, updating the
1014*4882a593Smuzhiyun 		 * cp0_epc.
1015*4882a593Smuzhiyun 		 */
1016*4882a593Smuzhiyun 		ir = dec_insn.next_insn;  /* process delay slot instr */
1017*4882a593Smuzhiyun 		pc_inc = dec_insn.next_pc_inc;
1018*4882a593Smuzhiyun 	} else {
1019*4882a593Smuzhiyun 		ir = dec_insn.insn;       /* process current instr */
1020*4882a593Smuzhiyun 		pc_inc = dec_insn.pc_inc;
1021*4882a593Smuzhiyun 	}
1022*4882a593Smuzhiyun 
1023*4882a593Smuzhiyun 	/*
1024*4882a593Smuzhiyun 	 * Since microMIPS FPU instructios are a subset of MIPS32 FPU
1025*4882a593Smuzhiyun 	 * instructions, we want to convert microMIPS FPU instructions
1026*4882a593Smuzhiyun 	 * into MIPS32 instructions so that we could reuse all of the
1027*4882a593Smuzhiyun 	 * FPU emulation code.
1028*4882a593Smuzhiyun 	 *
1029*4882a593Smuzhiyun 	 * NOTE: We cannot do this for branch instructions since they
1030*4882a593Smuzhiyun 	 *       are not a subset. Example: Cannot emulate a 16-bit
1031*4882a593Smuzhiyun 	 *       aligned target address with a MIPS32 instruction.
1032*4882a593Smuzhiyun 	 */
1033*4882a593Smuzhiyun 	if (dec_insn.micro_mips_mode) {
1034*4882a593Smuzhiyun 		/*
1035*4882a593Smuzhiyun 		 * If next instruction is a 16-bit instruction, then it
1036*4882a593Smuzhiyun 		 * it cannot be a FPU instruction. This could happen
1037*4882a593Smuzhiyun 		 * since we can be called for non-FPU instructions.
1038*4882a593Smuzhiyun 		 */
1039*4882a593Smuzhiyun 		if ((pc_inc == 2) ||
1040*4882a593Smuzhiyun 			(microMIPS32_to_MIPS32((union mips_instruction *)&ir)
1041*4882a593Smuzhiyun 			 == SIGILL))
1042*4882a593Smuzhiyun 			return SIGILL;
1043*4882a593Smuzhiyun 	}
1044*4882a593Smuzhiyun 
1045*4882a593Smuzhiyun emul:
1046*4882a593Smuzhiyun 	perf_sw_event(PERF_COUNT_SW_EMULATION_FAULTS, 1, xcp, 0);
1047*4882a593Smuzhiyun 	MIPS_FPU_EMU_INC_STATS(emulated);
1048*4882a593Smuzhiyun 	switch (MIPSInst_OPCODE(ir)) {
1049*4882a593Smuzhiyun 	case ldc1_op:
1050*4882a593Smuzhiyun 		dva = (u64 __user *) (xcp->regs[MIPSInst_RS(ir)] +
1051*4882a593Smuzhiyun 				     MIPSInst_SIMM(ir));
1052*4882a593Smuzhiyun 		MIPS_FPU_EMU_INC_STATS(loads);
1053*4882a593Smuzhiyun 
1054*4882a593Smuzhiyun 		if (!access_ok(dva, sizeof(u64))) {
1055*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(errors);
1056*4882a593Smuzhiyun 			*fault_addr = dva;
1057*4882a593Smuzhiyun 			return SIGBUS;
1058*4882a593Smuzhiyun 		}
1059*4882a593Smuzhiyun 		if (__get_user(dval, dva)) {
1060*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(errors);
1061*4882a593Smuzhiyun 			*fault_addr = dva;
1062*4882a593Smuzhiyun 			return SIGSEGV;
1063*4882a593Smuzhiyun 		}
1064*4882a593Smuzhiyun 		DITOREG(dval, MIPSInst_RT(ir));
1065*4882a593Smuzhiyun 		break;
1066*4882a593Smuzhiyun 
1067*4882a593Smuzhiyun 	case sdc1_op:
1068*4882a593Smuzhiyun 		dva = (u64 __user *) (xcp->regs[MIPSInst_RS(ir)] +
1069*4882a593Smuzhiyun 				      MIPSInst_SIMM(ir));
1070*4882a593Smuzhiyun 		MIPS_FPU_EMU_INC_STATS(stores);
1071*4882a593Smuzhiyun 		DIFROMREG(dval, MIPSInst_RT(ir));
1072*4882a593Smuzhiyun 		if (!access_ok(dva, sizeof(u64))) {
1073*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(errors);
1074*4882a593Smuzhiyun 			*fault_addr = dva;
1075*4882a593Smuzhiyun 			return SIGBUS;
1076*4882a593Smuzhiyun 		}
1077*4882a593Smuzhiyun 		if (__put_user(dval, dva)) {
1078*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(errors);
1079*4882a593Smuzhiyun 			*fault_addr = dva;
1080*4882a593Smuzhiyun 			return SIGSEGV;
1081*4882a593Smuzhiyun 		}
1082*4882a593Smuzhiyun 		break;
1083*4882a593Smuzhiyun 
1084*4882a593Smuzhiyun 	case lwc1_op:
1085*4882a593Smuzhiyun 		wva = (u32 __user *) (xcp->regs[MIPSInst_RS(ir)] +
1086*4882a593Smuzhiyun 				      MIPSInst_SIMM(ir));
1087*4882a593Smuzhiyun 		MIPS_FPU_EMU_INC_STATS(loads);
1088*4882a593Smuzhiyun 		if (!access_ok(wva, sizeof(u32))) {
1089*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(errors);
1090*4882a593Smuzhiyun 			*fault_addr = wva;
1091*4882a593Smuzhiyun 			return SIGBUS;
1092*4882a593Smuzhiyun 		}
1093*4882a593Smuzhiyun 		if (__get_user(wval, wva)) {
1094*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(errors);
1095*4882a593Smuzhiyun 			*fault_addr = wva;
1096*4882a593Smuzhiyun 			return SIGSEGV;
1097*4882a593Smuzhiyun 		}
1098*4882a593Smuzhiyun 		SITOREG(wval, MIPSInst_RT(ir));
1099*4882a593Smuzhiyun 		break;
1100*4882a593Smuzhiyun 
1101*4882a593Smuzhiyun 	case swc1_op:
1102*4882a593Smuzhiyun 		wva = (u32 __user *) (xcp->regs[MIPSInst_RS(ir)] +
1103*4882a593Smuzhiyun 				      MIPSInst_SIMM(ir));
1104*4882a593Smuzhiyun 		MIPS_FPU_EMU_INC_STATS(stores);
1105*4882a593Smuzhiyun 		SIFROMREG(wval, MIPSInst_RT(ir));
1106*4882a593Smuzhiyun 		if (!access_ok(wva, sizeof(u32))) {
1107*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(errors);
1108*4882a593Smuzhiyun 			*fault_addr = wva;
1109*4882a593Smuzhiyun 			return SIGBUS;
1110*4882a593Smuzhiyun 		}
1111*4882a593Smuzhiyun 		if (__put_user(wval, wva)) {
1112*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(errors);
1113*4882a593Smuzhiyun 			*fault_addr = wva;
1114*4882a593Smuzhiyun 			return SIGSEGV;
1115*4882a593Smuzhiyun 		}
1116*4882a593Smuzhiyun 		break;
1117*4882a593Smuzhiyun 
1118*4882a593Smuzhiyun 	case cop1_op:
1119*4882a593Smuzhiyun 		switch (MIPSInst_RS(ir)) {
1120*4882a593Smuzhiyun 		case dmfc_op:
1121*4882a593Smuzhiyun 			if (!cpu_has_mips_3_4_5 && !cpu_has_mips64)
1122*4882a593Smuzhiyun 				return SIGILL;
1123*4882a593Smuzhiyun 
1124*4882a593Smuzhiyun 			/* copregister fs -> gpr[rt] */
1125*4882a593Smuzhiyun 			if (MIPSInst_RT(ir) != 0) {
1126*4882a593Smuzhiyun 				DIFROMREG(xcp->regs[MIPSInst_RT(ir)],
1127*4882a593Smuzhiyun 					MIPSInst_RD(ir));
1128*4882a593Smuzhiyun 			}
1129*4882a593Smuzhiyun 			break;
1130*4882a593Smuzhiyun 
1131*4882a593Smuzhiyun 		case dmtc_op:
1132*4882a593Smuzhiyun 			if (!cpu_has_mips_3_4_5 && !cpu_has_mips64)
1133*4882a593Smuzhiyun 				return SIGILL;
1134*4882a593Smuzhiyun 
1135*4882a593Smuzhiyun 			/* copregister fs <- rt */
1136*4882a593Smuzhiyun 			DITOREG(xcp->regs[MIPSInst_RT(ir)], MIPSInst_RD(ir));
1137*4882a593Smuzhiyun 			break;
1138*4882a593Smuzhiyun 
1139*4882a593Smuzhiyun 		case mfhc_op:
1140*4882a593Smuzhiyun 			if (!cpu_has_mips_r2_r6)
1141*4882a593Smuzhiyun 				return SIGILL;
1142*4882a593Smuzhiyun 
1143*4882a593Smuzhiyun 			/* copregister rd -> gpr[rt] */
1144*4882a593Smuzhiyun 			if (MIPSInst_RT(ir) != 0) {
1145*4882a593Smuzhiyun 				SIFROMHREG(xcp->regs[MIPSInst_RT(ir)],
1146*4882a593Smuzhiyun 					MIPSInst_RD(ir));
1147*4882a593Smuzhiyun 			}
1148*4882a593Smuzhiyun 			break;
1149*4882a593Smuzhiyun 
1150*4882a593Smuzhiyun 		case mthc_op:
1151*4882a593Smuzhiyun 			if (!cpu_has_mips_r2_r6)
1152*4882a593Smuzhiyun 				return SIGILL;
1153*4882a593Smuzhiyun 
1154*4882a593Smuzhiyun 			/* copregister rd <- gpr[rt] */
1155*4882a593Smuzhiyun 			SITOHREG(xcp->regs[MIPSInst_RT(ir)], MIPSInst_RD(ir));
1156*4882a593Smuzhiyun 			break;
1157*4882a593Smuzhiyun 
1158*4882a593Smuzhiyun 		case mfc_op:
1159*4882a593Smuzhiyun 			/* copregister rd -> gpr[rt] */
1160*4882a593Smuzhiyun 			if (MIPSInst_RT(ir) != 0) {
1161*4882a593Smuzhiyun 				SIFROMREG(xcp->regs[MIPSInst_RT(ir)],
1162*4882a593Smuzhiyun 					MIPSInst_RD(ir));
1163*4882a593Smuzhiyun 			}
1164*4882a593Smuzhiyun 			break;
1165*4882a593Smuzhiyun 
1166*4882a593Smuzhiyun 		case mtc_op:
1167*4882a593Smuzhiyun 			/* copregister rd <- rt */
1168*4882a593Smuzhiyun 			SITOREG(xcp->regs[MIPSInst_RT(ir)], MIPSInst_RD(ir));
1169*4882a593Smuzhiyun 			break;
1170*4882a593Smuzhiyun 
1171*4882a593Smuzhiyun 		case cfc_op:
1172*4882a593Smuzhiyun 			/* cop control register rd -> gpr[rt] */
1173*4882a593Smuzhiyun 			cop1_cfc(xcp, ctx, ir);
1174*4882a593Smuzhiyun 			break;
1175*4882a593Smuzhiyun 
1176*4882a593Smuzhiyun 		case ctc_op:
1177*4882a593Smuzhiyun 			/* copregister rd <- rt */
1178*4882a593Smuzhiyun 			cop1_ctc(xcp, ctx, ir);
1179*4882a593Smuzhiyun 			if ((ctx->fcr31 >> 5) & ctx->fcr31 & FPU_CSR_ALL_E) {
1180*4882a593Smuzhiyun 				return SIGFPE;
1181*4882a593Smuzhiyun 			}
1182*4882a593Smuzhiyun 			break;
1183*4882a593Smuzhiyun 
1184*4882a593Smuzhiyun 		case bc1eqz_op:
1185*4882a593Smuzhiyun 		case bc1nez_op:
1186*4882a593Smuzhiyun 			if (!cpu_has_mips_r6 || delay_slot(xcp))
1187*4882a593Smuzhiyun 				return SIGILL;
1188*4882a593Smuzhiyun 
1189*4882a593Smuzhiyun 			likely = 0;
1190*4882a593Smuzhiyun 			cond = 0;
1191*4882a593Smuzhiyun 			fpr = &current->thread.fpu.fpr[MIPSInst_RT(ir)];
1192*4882a593Smuzhiyun 			bit0 = get_fpr32(fpr, 0) & 0x1;
1193*4882a593Smuzhiyun 			switch (MIPSInst_RS(ir)) {
1194*4882a593Smuzhiyun 			case bc1eqz_op:
1195*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(bc1eqz);
1196*4882a593Smuzhiyun 				cond = bit0 == 0;
1197*4882a593Smuzhiyun 				break;
1198*4882a593Smuzhiyun 			case bc1nez_op:
1199*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(bc1nez);
1200*4882a593Smuzhiyun 				cond = bit0 != 0;
1201*4882a593Smuzhiyun 				break;
1202*4882a593Smuzhiyun 			}
1203*4882a593Smuzhiyun 			goto branch_common;
1204*4882a593Smuzhiyun 
1205*4882a593Smuzhiyun 		case bc_op:
1206*4882a593Smuzhiyun 			if (delay_slot(xcp))
1207*4882a593Smuzhiyun 				return SIGILL;
1208*4882a593Smuzhiyun 
1209*4882a593Smuzhiyun 			if (cpu_has_mips_4_5_r)
1210*4882a593Smuzhiyun 				cbit = fpucondbit[MIPSInst_RT(ir) >> 2];
1211*4882a593Smuzhiyun 			else
1212*4882a593Smuzhiyun 				cbit = FPU_CSR_COND;
1213*4882a593Smuzhiyun 			cond = ctx->fcr31 & cbit;
1214*4882a593Smuzhiyun 
1215*4882a593Smuzhiyun 			likely = 0;
1216*4882a593Smuzhiyun 			switch (MIPSInst_RT(ir) & 3) {
1217*4882a593Smuzhiyun 			case bcfl_op:
1218*4882a593Smuzhiyun 				if (cpu_has_mips_2_3_4_5_r)
1219*4882a593Smuzhiyun 					likely = 1;
1220*4882a593Smuzhiyun 				fallthrough;
1221*4882a593Smuzhiyun 			case bcf_op:
1222*4882a593Smuzhiyun 				cond = !cond;
1223*4882a593Smuzhiyun 				break;
1224*4882a593Smuzhiyun 			case bctl_op:
1225*4882a593Smuzhiyun 				if (cpu_has_mips_2_3_4_5_r)
1226*4882a593Smuzhiyun 					likely = 1;
1227*4882a593Smuzhiyun 				fallthrough;
1228*4882a593Smuzhiyun 			case bct_op:
1229*4882a593Smuzhiyun 				break;
1230*4882a593Smuzhiyun 			}
1231*4882a593Smuzhiyun branch_common:
1232*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(branches);
1233*4882a593Smuzhiyun 			set_delay_slot(xcp);
1234*4882a593Smuzhiyun 			if (cond) {
1235*4882a593Smuzhiyun 				/*
1236*4882a593Smuzhiyun 				 * Branch taken: emulate dslot instruction
1237*4882a593Smuzhiyun 				 */
1238*4882a593Smuzhiyun 				unsigned long bcpc;
1239*4882a593Smuzhiyun 
1240*4882a593Smuzhiyun 				/*
1241*4882a593Smuzhiyun 				 * Remember EPC at the branch to point back
1242*4882a593Smuzhiyun 				 * at so that any delay-slot instruction
1243*4882a593Smuzhiyun 				 * signal is not silently ignored.
1244*4882a593Smuzhiyun 				 */
1245*4882a593Smuzhiyun 				bcpc = xcp->cp0_epc;
1246*4882a593Smuzhiyun 				xcp->cp0_epc += dec_insn.pc_inc;
1247*4882a593Smuzhiyun 
1248*4882a593Smuzhiyun 				contpc = MIPSInst_SIMM(ir);
1249*4882a593Smuzhiyun 				ir = dec_insn.next_insn;
1250*4882a593Smuzhiyun 				if (dec_insn.micro_mips_mode) {
1251*4882a593Smuzhiyun 					contpc = (xcp->cp0_epc + (contpc << 1));
1252*4882a593Smuzhiyun 
1253*4882a593Smuzhiyun 					/* If 16-bit instruction, not FPU. */
1254*4882a593Smuzhiyun 					if ((dec_insn.next_pc_inc == 2) ||
1255*4882a593Smuzhiyun 						(microMIPS32_to_MIPS32((union mips_instruction *)&ir) == SIGILL)) {
1256*4882a593Smuzhiyun 
1257*4882a593Smuzhiyun 						/*
1258*4882a593Smuzhiyun 						 * Since this instruction will
1259*4882a593Smuzhiyun 						 * be put on the stack with
1260*4882a593Smuzhiyun 						 * 32-bit words, get around
1261*4882a593Smuzhiyun 						 * this problem by putting a
1262*4882a593Smuzhiyun 						 * NOP16 as the second one.
1263*4882a593Smuzhiyun 						 */
1264*4882a593Smuzhiyun 						if (dec_insn.next_pc_inc == 2)
1265*4882a593Smuzhiyun 							ir = (ir & (~0xffff)) | MM_NOP16;
1266*4882a593Smuzhiyun 
1267*4882a593Smuzhiyun 						/*
1268*4882a593Smuzhiyun 						 * Single step the non-CP1
1269*4882a593Smuzhiyun 						 * instruction in the dslot.
1270*4882a593Smuzhiyun 						 */
1271*4882a593Smuzhiyun 						sig = mips_dsemul(xcp, ir,
1272*4882a593Smuzhiyun 								  bcpc, contpc);
1273*4882a593Smuzhiyun 						if (sig < 0)
1274*4882a593Smuzhiyun 							break;
1275*4882a593Smuzhiyun 						if (sig)
1276*4882a593Smuzhiyun 							xcp->cp0_epc = bcpc;
1277*4882a593Smuzhiyun 						/*
1278*4882a593Smuzhiyun 						 * SIGILL forces out of
1279*4882a593Smuzhiyun 						 * the emulation loop.
1280*4882a593Smuzhiyun 						 */
1281*4882a593Smuzhiyun 						return sig ? sig : SIGILL;
1282*4882a593Smuzhiyun 					}
1283*4882a593Smuzhiyun 				} else
1284*4882a593Smuzhiyun 					contpc = (xcp->cp0_epc + (contpc << 2));
1285*4882a593Smuzhiyun 
1286*4882a593Smuzhiyun 				switch (MIPSInst_OPCODE(ir)) {
1287*4882a593Smuzhiyun 				case lwc1_op:
1288*4882a593Smuzhiyun 				case swc1_op:
1289*4882a593Smuzhiyun 					goto emul;
1290*4882a593Smuzhiyun 
1291*4882a593Smuzhiyun 				case ldc1_op:
1292*4882a593Smuzhiyun 				case sdc1_op:
1293*4882a593Smuzhiyun 					if (cpu_has_mips_2_3_4_5_r)
1294*4882a593Smuzhiyun 						goto emul;
1295*4882a593Smuzhiyun 
1296*4882a593Smuzhiyun 					goto bc_sigill;
1297*4882a593Smuzhiyun 
1298*4882a593Smuzhiyun 				case cop1_op:
1299*4882a593Smuzhiyun 					goto emul;
1300*4882a593Smuzhiyun 
1301*4882a593Smuzhiyun 				case cop1x_op:
1302*4882a593Smuzhiyun 					if (cpu_has_mips_4_5_64_r2_r6)
1303*4882a593Smuzhiyun 						/* its one of ours */
1304*4882a593Smuzhiyun 						goto emul;
1305*4882a593Smuzhiyun 
1306*4882a593Smuzhiyun 					goto bc_sigill;
1307*4882a593Smuzhiyun 
1308*4882a593Smuzhiyun 				case spec_op:
1309*4882a593Smuzhiyun 					switch (MIPSInst_FUNC(ir)) {
1310*4882a593Smuzhiyun 					case movc_op:
1311*4882a593Smuzhiyun 						if (cpu_has_mips_4_5_r)
1312*4882a593Smuzhiyun 							goto emul;
1313*4882a593Smuzhiyun 
1314*4882a593Smuzhiyun 						goto bc_sigill;
1315*4882a593Smuzhiyun 					}
1316*4882a593Smuzhiyun 					break;
1317*4882a593Smuzhiyun 
1318*4882a593Smuzhiyun 				bc_sigill:
1319*4882a593Smuzhiyun 					xcp->cp0_epc = bcpc;
1320*4882a593Smuzhiyun 					return SIGILL;
1321*4882a593Smuzhiyun 				}
1322*4882a593Smuzhiyun 
1323*4882a593Smuzhiyun 				/*
1324*4882a593Smuzhiyun 				 * Single step the non-cp1
1325*4882a593Smuzhiyun 				 * instruction in the dslot
1326*4882a593Smuzhiyun 				 */
1327*4882a593Smuzhiyun 				sig = mips_dsemul(xcp, ir, bcpc, contpc);
1328*4882a593Smuzhiyun 				if (sig < 0)
1329*4882a593Smuzhiyun 					break;
1330*4882a593Smuzhiyun 				if (sig)
1331*4882a593Smuzhiyun 					xcp->cp0_epc = bcpc;
1332*4882a593Smuzhiyun 				/* SIGILL forces out of the emulation loop.  */
1333*4882a593Smuzhiyun 				return sig ? sig : SIGILL;
1334*4882a593Smuzhiyun 			} else if (likely) {	/* branch not taken */
1335*4882a593Smuzhiyun 				/*
1336*4882a593Smuzhiyun 				 * branch likely nullifies
1337*4882a593Smuzhiyun 				 * dslot if not taken
1338*4882a593Smuzhiyun 				 */
1339*4882a593Smuzhiyun 				xcp->cp0_epc += dec_insn.pc_inc;
1340*4882a593Smuzhiyun 				contpc += dec_insn.pc_inc;
1341*4882a593Smuzhiyun 				/*
1342*4882a593Smuzhiyun 				 * else continue & execute
1343*4882a593Smuzhiyun 				 * dslot as normal insn
1344*4882a593Smuzhiyun 				 */
1345*4882a593Smuzhiyun 			}
1346*4882a593Smuzhiyun 			break;
1347*4882a593Smuzhiyun 
1348*4882a593Smuzhiyun 		default:
1349*4882a593Smuzhiyun 			if (!(MIPSInst_RS(ir) & 0x10))
1350*4882a593Smuzhiyun 				return SIGILL;
1351*4882a593Smuzhiyun 
1352*4882a593Smuzhiyun 			/* a real fpu computation instruction */
1353*4882a593Smuzhiyun 			sig = fpu_emu(xcp, ctx, ir);
1354*4882a593Smuzhiyun 			if (sig)
1355*4882a593Smuzhiyun 				return sig;
1356*4882a593Smuzhiyun 		}
1357*4882a593Smuzhiyun 		break;
1358*4882a593Smuzhiyun 
1359*4882a593Smuzhiyun 	case cop1x_op:
1360*4882a593Smuzhiyun 		if (!cpu_has_mips_4_5_64_r2_r6)
1361*4882a593Smuzhiyun 			return SIGILL;
1362*4882a593Smuzhiyun 
1363*4882a593Smuzhiyun 		sig = fpux_emu(xcp, ctx, ir, fault_addr);
1364*4882a593Smuzhiyun 		if (sig)
1365*4882a593Smuzhiyun 			return sig;
1366*4882a593Smuzhiyun 		break;
1367*4882a593Smuzhiyun 
1368*4882a593Smuzhiyun 	case spec_op:
1369*4882a593Smuzhiyun 		if (!cpu_has_mips_4_5_r)
1370*4882a593Smuzhiyun 			return SIGILL;
1371*4882a593Smuzhiyun 
1372*4882a593Smuzhiyun 		if (MIPSInst_FUNC(ir) != movc_op)
1373*4882a593Smuzhiyun 			return SIGILL;
1374*4882a593Smuzhiyun 		cond = fpucondbit[MIPSInst_RT(ir) >> 2];
1375*4882a593Smuzhiyun 		if (((ctx->fcr31 & cond) != 0) == ((MIPSInst_RT(ir) & 1) != 0))
1376*4882a593Smuzhiyun 			xcp->regs[MIPSInst_RD(ir)] =
1377*4882a593Smuzhiyun 				xcp->regs[MIPSInst_RS(ir)];
1378*4882a593Smuzhiyun 		break;
1379*4882a593Smuzhiyun 	default:
1380*4882a593Smuzhiyun 		return SIGILL;
1381*4882a593Smuzhiyun 	}
1382*4882a593Smuzhiyun 
1383*4882a593Smuzhiyun 	/* we did it !! */
1384*4882a593Smuzhiyun 	xcp->cp0_epc = contpc;
1385*4882a593Smuzhiyun 	clear_delay_slot(xcp);
1386*4882a593Smuzhiyun 
1387*4882a593Smuzhiyun 	return 0;
1388*4882a593Smuzhiyun }
1389*4882a593Smuzhiyun 
1390*4882a593Smuzhiyun /*
1391*4882a593Smuzhiyun  * Conversion table from MIPS compare ops 48-63
1392*4882a593Smuzhiyun  * cond = ieee754dp_cmp(x,y,IEEE754_UN,sig);
1393*4882a593Smuzhiyun  */
1394*4882a593Smuzhiyun static const unsigned char cmptab[8] = {
1395*4882a593Smuzhiyun 	0,			/* cmp_0 (sig) cmp_sf */
1396*4882a593Smuzhiyun 	IEEE754_CUN,		/* cmp_un (sig) cmp_ngle */
1397*4882a593Smuzhiyun 	IEEE754_CEQ,		/* cmp_eq (sig) cmp_seq */
1398*4882a593Smuzhiyun 	IEEE754_CEQ | IEEE754_CUN,	/* cmp_ueq (sig) cmp_ngl  */
1399*4882a593Smuzhiyun 	IEEE754_CLT,		/* cmp_olt (sig) cmp_lt */
1400*4882a593Smuzhiyun 	IEEE754_CLT | IEEE754_CUN,	/* cmp_ult (sig) cmp_nge */
1401*4882a593Smuzhiyun 	IEEE754_CLT | IEEE754_CEQ,	/* cmp_ole (sig) cmp_le */
1402*4882a593Smuzhiyun 	IEEE754_CLT | IEEE754_CEQ | IEEE754_CUN,	/* cmp_ule (sig) cmp_ngt */
1403*4882a593Smuzhiyun };
1404*4882a593Smuzhiyun 
1405*4882a593Smuzhiyun static const unsigned char negative_cmptab[8] = {
1406*4882a593Smuzhiyun 	0, /* Reserved */
1407*4882a593Smuzhiyun 	IEEE754_CLT | IEEE754_CGT | IEEE754_CEQ,
1408*4882a593Smuzhiyun 	IEEE754_CLT | IEEE754_CGT | IEEE754_CUN,
1409*4882a593Smuzhiyun 	IEEE754_CLT | IEEE754_CGT,
1410*4882a593Smuzhiyun 	/* Reserved */
1411*4882a593Smuzhiyun };
1412*4882a593Smuzhiyun 
1413*4882a593Smuzhiyun 
1414*4882a593Smuzhiyun /*
1415*4882a593Smuzhiyun  * Additional MIPS4 instructions
1416*4882a593Smuzhiyun  */
1417*4882a593Smuzhiyun 
1418*4882a593Smuzhiyun #define DEF3OP(name, p, f1, f2, f3)					\
1419*4882a593Smuzhiyun static union ieee754##p fpemu_##p##_##name(union ieee754##p r,		\
1420*4882a593Smuzhiyun 	union ieee754##p s, union ieee754##p t)				\
1421*4882a593Smuzhiyun {									\
1422*4882a593Smuzhiyun 	struct _ieee754_csr ieee754_csr_save;				\
1423*4882a593Smuzhiyun 	s = f1(s, t);							\
1424*4882a593Smuzhiyun 	ieee754_csr_save = ieee754_csr;					\
1425*4882a593Smuzhiyun 	s = f2(s, r);							\
1426*4882a593Smuzhiyun 	ieee754_csr_save.cx |= ieee754_csr.cx;				\
1427*4882a593Smuzhiyun 	ieee754_csr_save.sx |= ieee754_csr.sx;				\
1428*4882a593Smuzhiyun 	s = f3(s);							\
1429*4882a593Smuzhiyun 	ieee754_csr.cx |= ieee754_csr_save.cx;				\
1430*4882a593Smuzhiyun 	ieee754_csr.sx |= ieee754_csr_save.sx;				\
1431*4882a593Smuzhiyun 	return s;							\
1432*4882a593Smuzhiyun }
1433*4882a593Smuzhiyun 
fpemu_dp_recip(union ieee754dp d)1434*4882a593Smuzhiyun static union ieee754dp fpemu_dp_recip(union ieee754dp d)
1435*4882a593Smuzhiyun {
1436*4882a593Smuzhiyun 	return ieee754dp_div(ieee754dp_one(0), d);
1437*4882a593Smuzhiyun }
1438*4882a593Smuzhiyun 
fpemu_dp_rsqrt(union ieee754dp d)1439*4882a593Smuzhiyun static union ieee754dp fpemu_dp_rsqrt(union ieee754dp d)
1440*4882a593Smuzhiyun {
1441*4882a593Smuzhiyun 	return ieee754dp_div(ieee754dp_one(0), ieee754dp_sqrt(d));
1442*4882a593Smuzhiyun }
1443*4882a593Smuzhiyun 
fpemu_sp_recip(union ieee754sp s)1444*4882a593Smuzhiyun static union ieee754sp fpemu_sp_recip(union ieee754sp s)
1445*4882a593Smuzhiyun {
1446*4882a593Smuzhiyun 	return ieee754sp_div(ieee754sp_one(0), s);
1447*4882a593Smuzhiyun }
1448*4882a593Smuzhiyun 
fpemu_sp_rsqrt(union ieee754sp s)1449*4882a593Smuzhiyun static union ieee754sp fpemu_sp_rsqrt(union ieee754sp s)
1450*4882a593Smuzhiyun {
1451*4882a593Smuzhiyun 	return ieee754sp_div(ieee754sp_one(0), ieee754sp_sqrt(s));
1452*4882a593Smuzhiyun }
1453*4882a593Smuzhiyun 
1454*4882a593Smuzhiyun DEF3OP(madd, sp, ieee754sp_mul, ieee754sp_add, );
1455*4882a593Smuzhiyun DEF3OP(msub, sp, ieee754sp_mul, ieee754sp_sub, );
1456*4882a593Smuzhiyun DEF3OP(nmadd, sp, ieee754sp_mul, ieee754sp_add, ieee754sp_neg);
1457*4882a593Smuzhiyun DEF3OP(nmsub, sp, ieee754sp_mul, ieee754sp_sub, ieee754sp_neg);
1458*4882a593Smuzhiyun DEF3OP(madd, dp, ieee754dp_mul, ieee754dp_add, );
1459*4882a593Smuzhiyun DEF3OP(msub, dp, ieee754dp_mul, ieee754dp_sub, );
1460*4882a593Smuzhiyun DEF3OP(nmadd, dp, ieee754dp_mul, ieee754dp_add, ieee754dp_neg);
1461*4882a593Smuzhiyun DEF3OP(nmsub, dp, ieee754dp_mul, ieee754dp_sub, ieee754dp_neg);
1462*4882a593Smuzhiyun 
fpux_emu(struct pt_regs * xcp,struct mips_fpu_struct * ctx,mips_instruction ir,void __user ** fault_addr)1463*4882a593Smuzhiyun static int fpux_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
1464*4882a593Smuzhiyun 	mips_instruction ir, void __user **fault_addr)
1465*4882a593Smuzhiyun {
1466*4882a593Smuzhiyun 	unsigned int rcsr = 0;	/* resulting csr */
1467*4882a593Smuzhiyun 
1468*4882a593Smuzhiyun 	MIPS_FPU_EMU_INC_STATS(cp1xops);
1469*4882a593Smuzhiyun 
1470*4882a593Smuzhiyun 	switch (MIPSInst_FMA_FFMT(ir)) {
1471*4882a593Smuzhiyun 	case s_fmt:{		/* 0 */
1472*4882a593Smuzhiyun 
1473*4882a593Smuzhiyun 		union ieee754sp(*handler) (union ieee754sp, union ieee754sp, union ieee754sp);
1474*4882a593Smuzhiyun 		union ieee754sp fd, fr, fs, ft;
1475*4882a593Smuzhiyun 		u32 __user *va;
1476*4882a593Smuzhiyun 		u32 val;
1477*4882a593Smuzhiyun 
1478*4882a593Smuzhiyun 		switch (MIPSInst_FUNC(ir)) {
1479*4882a593Smuzhiyun 		case lwxc1_op:
1480*4882a593Smuzhiyun 			va = (void __user *) (xcp->regs[MIPSInst_FR(ir)] +
1481*4882a593Smuzhiyun 				xcp->regs[MIPSInst_FT(ir)]);
1482*4882a593Smuzhiyun 
1483*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(loads);
1484*4882a593Smuzhiyun 			if (!access_ok(va, sizeof(u32))) {
1485*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
1486*4882a593Smuzhiyun 				*fault_addr = va;
1487*4882a593Smuzhiyun 				return SIGBUS;
1488*4882a593Smuzhiyun 			}
1489*4882a593Smuzhiyun 			if (__get_user(val, va)) {
1490*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
1491*4882a593Smuzhiyun 				*fault_addr = va;
1492*4882a593Smuzhiyun 				return SIGSEGV;
1493*4882a593Smuzhiyun 			}
1494*4882a593Smuzhiyun 			SITOREG(val, MIPSInst_FD(ir));
1495*4882a593Smuzhiyun 			break;
1496*4882a593Smuzhiyun 
1497*4882a593Smuzhiyun 		case swxc1_op:
1498*4882a593Smuzhiyun 			va = (void __user *) (xcp->regs[MIPSInst_FR(ir)] +
1499*4882a593Smuzhiyun 				xcp->regs[MIPSInst_FT(ir)]);
1500*4882a593Smuzhiyun 
1501*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(stores);
1502*4882a593Smuzhiyun 
1503*4882a593Smuzhiyun 			SIFROMREG(val, MIPSInst_FS(ir));
1504*4882a593Smuzhiyun 			if (!access_ok(va, sizeof(u32))) {
1505*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
1506*4882a593Smuzhiyun 				*fault_addr = va;
1507*4882a593Smuzhiyun 				return SIGBUS;
1508*4882a593Smuzhiyun 			}
1509*4882a593Smuzhiyun 			if (put_user(val, va)) {
1510*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
1511*4882a593Smuzhiyun 				*fault_addr = va;
1512*4882a593Smuzhiyun 				return SIGSEGV;
1513*4882a593Smuzhiyun 			}
1514*4882a593Smuzhiyun 			break;
1515*4882a593Smuzhiyun 
1516*4882a593Smuzhiyun 		case madd_s_op:
1517*4882a593Smuzhiyun 			if (cpu_has_mac2008_only)
1518*4882a593Smuzhiyun 				handler = ieee754sp_madd;
1519*4882a593Smuzhiyun 			else
1520*4882a593Smuzhiyun 				handler = fpemu_sp_madd;
1521*4882a593Smuzhiyun 			goto scoptop;
1522*4882a593Smuzhiyun 		case msub_s_op:
1523*4882a593Smuzhiyun 			if (cpu_has_mac2008_only)
1524*4882a593Smuzhiyun 				handler = ieee754sp_msub;
1525*4882a593Smuzhiyun 			else
1526*4882a593Smuzhiyun 				handler = fpemu_sp_msub;
1527*4882a593Smuzhiyun 			goto scoptop;
1528*4882a593Smuzhiyun 		case nmadd_s_op:
1529*4882a593Smuzhiyun 			if (cpu_has_mac2008_only)
1530*4882a593Smuzhiyun 				handler = ieee754sp_nmadd;
1531*4882a593Smuzhiyun 			else
1532*4882a593Smuzhiyun 				handler = fpemu_sp_nmadd;
1533*4882a593Smuzhiyun 			goto scoptop;
1534*4882a593Smuzhiyun 		case nmsub_s_op:
1535*4882a593Smuzhiyun 			if (cpu_has_mac2008_only)
1536*4882a593Smuzhiyun 				handler = ieee754sp_nmsub;
1537*4882a593Smuzhiyun 			else
1538*4882a593Smuzhiyun 				handler = fpemu_sp_nmsub;
1539*4882a593Smuzhiyun 			goto scoptop;
1540*4882a593Smuzhiyun 
1541*4882a593Smuzhiyun 		      scoptop:
1542*4882a593Smuzhiyun 			SPFROMREG(fr, MIPSInst_FR(ir));
1543*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1544*4882a593Smuzhiyun 			SPFROMREG(ft, MIPSInst_FT(ir));
1545*4882a593Smuzhiyun 			fd = (*handler) (fr, fs, ft);
1546*4882a593Smuzhiyun 			SPTOREG(fd, MIPSInst_FD(ir));
1547*4882a593Smuzhiyun 
1548*4882a593Smuzhiyun 		      copcsr:
1549*4882a593Smuzhiyun 			if (ieee754_cxtest(IEEE754_INEXACT)) {
1550*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ieee754_inexact);
1551*4882a593Smuzhiyun 				rcsr |= FPU_CSR_INE_X | FPU_CSR_INE_S;
1552*4882a593Smuzhiyun 			}
1553*4882a593Smuzhiyun 			if (ieee754_cxtest(IEEE754_UNDERFLOW)) {
1554*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ieee754_underflow);
1555*4882a593Smuzhiyun 				rcsr |= FPU_CSR_UDF_X | FPU_CSR_UDF_S;
1556*4882a593Smuzhiyun 			}
1557*4882a593Smuzhiyun 			if (ieee754_cxtest(IEEE754_OVERFLOW)) {
1558*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ieee754_overflow);
1559*4882a593Smuzhiyun 				rcsr |= FPU_CSR_OVF_X | FPU_CSR_OVF_S;
1560*4882a593Smuzhiyun 			}
1561*4882a593Smuzhiyun 			if (ieee754_cxtest(IEEE754_INVALID_OPERATION)) {
1562*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ieee754_invalidop);
1563*4882a593Smuzhiyun 				rcsr |= FPU_CSR_INV_X | FPU_CSR_INV_S;
1564*4882a593Smuzhiyun 			}
1565*4882a593Smuzhiyun 
1566*4882a593Smuzhiyun 			ctx->fcr31 = (ctx->fcr31 & ~FPU_CSR_ALL_X) | rcsr;
1567*4882a593Smuzhiyun 			if ((ctx->fcr31 >> 5) & ctx->fcr31 & FPU_CSR_ALL_E) {
1568*4882a593Smuzhiyun 				/*printk ("SIGFPE: FPU csr = %08x\n",
1569*4882a593Smuzhiyun 				   ctx->fcr31); */
1570*4882a593Smuzhiyun 				return SIGFPE;
1571*4882a593Smuzhiyun 			}
1572*4882a593Smuzhiyun 
1573*4882a593Smuzhiyun 			break;
1574*4882a593Smuzhiyun 
1575*4882a593Smuzhiyun 		default:
1576*4882a593Smuzhiyun 			return SIGILL;
1577*4882a593Smuzhiyun 		}
1578*4882a593Smuzhiyun 		break;
1579*4882a593Smuzhiyun 	}
1580*4882a593Smuzhiyun 
1581*4882a593Smuzhiyun 	case d_fmt:{		/* 1 */
1582*4882a593Smuzhiyun 		union ieee754dp(*handler) (union ieee754dp, union ieee754dp, union ieee754dp);
1583*4882a593Smuzhiyun 		union ieee754dp fd, fr, fs, ft;
1584*4882a593Smuzhiyun 		u64 __user *va;
1585*4882a593Smuzhiyun 		u64 val;
1586*4882a593Smuzhiyun 
1587*4882a593Smuzhiyun 		switch (MIPSInst_FUNC(ir)) {
1588*4882a593Smuzhiyun 		case ldxc1_op:
1589*4882a593Smuzhiyun 			va = (void __user *) (xcp->regs[MIPSInst_FR(ir)] +
1590*4882a593Smuzhiyun 				xcp->regs[MIPSInst_FT(ir)]);
1591*4882a593Smuzhiyun 
1592*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(loads);
1593*4882a593Smuzhiyun 			if (!access_ok(va, sizeof(u64))) {
1594*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
1595*4882a593Smuzhiyun 				*fault_addr = va;
1596*4882a593Smuzhiyun 				return SIGBUS;
1597*4882a593Smuzhiyun 			}
1598*4882a593Smuzhiyun 			if (__get_user(val, va)) {
1599*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
1600*4882a593Smuzhiyun 				*fault_addr = va;
1601*4882a593Smuzhiyun 				return SIGSEGV;
1602*4882a593Smuzhiyun 			}
1603*4882a593Smuzhiyun 			DITOREG(val, MIPSInst_FD(ir));
1604*4882a593Smuzhiyun 			break;
1605*4882a593Smuzhiyun 
1606*4882a593Smuzhiyun 		case sdxc1_op:
1607*4882a593Smuzhiyun 			va = (void __user *) (xcp->regs[MIPSInst_FR(ir)] +
1608*4882a593Smuzhiyun 				xcp->regs[MIPSInst_FT(ir)]);
1609*4882a593Smuzhiyun 
1610*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(stores);
1611*4882a593Smuzhiyun 			DIFROMREG(val, MIPSInst_FS(ir));
1612*4882a593Smuzhiyun 			if (!access_ok(va, sizeof(u64))) {
1613*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
1614*4882a593Smuzhiyun 				*fault_addr = va;
1615*4882a593Smuzhiyun 				return SIGBUS;
1616*4882a593Smuzhiyun 			}
1617*4882a593Smuzhiyun 			if (__put_user(val, va)) {
1618*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
1619*4882a593Smuzhiyun 				*fault_addr = va;
1620*4882a593Smuzhiyun 				return SIGSEGV;
1621*4882a593Smuzhiyun 			}
1622*4882a593Smuzhiyun 			break;
1623*4882a593Smuzhiyun 
1624*4882a593Smuzhiyun 		case madd_d_op:
1625*4882a593Smuzhiyun 			if (cpu_has_mac2008_only)
1626*4882a593Smuzhiyun 				handler = ieee754dp_madd;
1627*4882a593Smuzhiyun 			else
1628*4882a593Smuzhiyun 				handler = fpemu_dp_madd;
1629*4882a593Smuzhiyun 			goto dcoptop;
1630*4882a593Smuzhiyun 		case msub_d_op:
1631*4882a593Smuzhiyun 			if (cpu_has_mac2008_only)
1632*4882a593Smuzhiyun 				handler = ieee754dp_msub;
1633*4882a593Smuzhiyun 			else
1634*4882a593Smuzhiyun 				handler = fpemu_dp_msub;
1635*4882a593Smuzhiyun 			goto dcoptop;
1636*4882a593Smuzhiyun 		case nmadd_d_op:
1637*4882a593Smuzhiyun 			if (cpu_has_mac2008_only)
1638*4882a593Smuzhiyun 				handler = ieee754dp_nmadd;
1639*4882a593Smuzhiyun 			else
1640*4882a593Smuzhiyun 				handler = fpemu_dp_nmadd;
1641*4882a593Smuzhiyun 			goto dcoptop;
1642*4882a593Smuzhiyun 		case nmsub_d_op:
1643*4882a593Smuzhiyun 			if (cpu_has_mac2008_only)
1644*4882a593Smuzhiyun 				handler = ieee754dp_nmsub;
1645*4882a593Smuzhiyun 			else
1646*4882a593Smuzhiyun 			handler = fpemu_dp_nmsub;
1647*4882a593Smuzhiyun 			goto dcoptop;
1648*4882a593Smuzhiyun 
1649*4882a593Smuzhiyun 		      dcoptop:
1650*4882a593Smuzhiyun 			DPFROMREG(fr, MIPSInst_FR(ir));
1651*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
1652*4882a593Smuzhiyun 			DPFROMREG(ft, MIPSInst_FT(ir));
1653*4882a593Smuzhiyun 			fd = (*handler) (fr, fs, ft);
1654*4882a593Smuzhiyun 			DPTOREG(fd, MIPSInst_FD(ir));
1655*4882a593Smuzhiyun 			goto copcsr;
1656*4882a593Smuzhiyun 
1657*4882a593Smuzhiyun 		default:
1658*4882a593Smuzhiyun 			return SIGILL;
1659*4882a593Smuzhiyun 		}
1660*4882a593Smuzhiyun 		break;
1661*4882a593Smuzhiyun 	}
1662*4882a593Smuzhiyun 
1663*4882a593Smuzhiyun 	case 0x3:
1664*4882a593Smuzhiyun 		if (MIPSInst_FUNC(ir) != pfetch_op)
1665*4882a593Smuzhiyun 			return SIGILL;
1666*4882a593Smuzhiyun 
1667*4882a593Smuzhiyun 		/* ignore prefx operation */
1668*4882a593Smuzhiyun 		break;
1669*4882a593Smuzhiyun 
1670*4882a593Smuzhiyun 	default:
1671*4882a593Smuzhiyun 		return SIGILL;
1672*4882a593Smuzhiyun 	}
1673*4882a593Smuzhiyun 
1674*4882a593Smuzhiyun 	return 0;
1675*4882a593Smuzhiyun }
1676*4882a593Smuzhiyun 
1677*4882a593Smuzhiyun 
1678*4882a593Smuzhiyun 
1679*4882a593Smuzhiyun /*
1680*4882a593Smuzhiyun  * Emulate a single COP1 arithmetic instruction.
1681*4882a593Smuzhiyun  */
fpu_emu(struct pt_regs * xcp,struct mips_fpu_struct * ctx,mips_instruction ir)1682*4882a593Smuzhiyun static int fpu_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
1683*4882a593Smuzhiyun 	mips_instruction ir)
1684*4882a593Smuzhiyun {
1685*4882a593Smuzhiyun 	int rfmt;		/* resulting format */
1686*4882a593Smuzhiyun 	unsigned int rcsr = 0;	/* resulting csr */
1687*4882a593Smuzhiyun 	unsigned int oldrm;
1688*4882a593Smuzhiyun 	unsigned int cbit;
1689*4882a593Smuzhiyun 	unsigned int cond;
1690*4882a593Smuzhiyun 	union {
1691*4882a593Smuzhiyun 		union ieee754dp d;
1692*4882a593Smuzhiyun 		union ieee754sp s;
1693*4882a593Smuzhiyun 		int w;
1694*4882a593Smuzhiyun 		s64 l;
1695*4882a593Smuzhiyun 	} rv;			/* resulting value */
1696*4882a593Smuzhiyun 	u64 bits;
1697*4882a593Smuzhiyun 
1698*4882a593Smuzhiyun 	MIPS_FPU_EMU_INC_STATS(cp1ops);
1699*4882a593Smuzhiyun 	switch (rfmt = (MIPSInst_FFMT(ir) & 0xf)) {
1700*4882a593Smuzhiyun 	case s_fmt: {		/* 0 */
1701*4882a593Smuzhiyun 		union {
1702*4882a593Smuzhiyun 			union ieee754sp(*b) (union ieee754sp, union ieee754sp);
1703*4882a593Smuzhiyun 			union ieee754sp(*u) (union ieee754sp);
1704*4882a593Smuzhiyun 		} handler;
1705*4882a593Smuzhiyun 		union ieee754sp fd, fs, ft;
1706*4882a593Smuzhiyun 
1707*4882a593Smuzhiyun 		switch (MIPSInst_FUNC(ir)) {
1708*4882a593Smuzhiyun 			/* binary ops */
1709*4882a593Smuzhiyun 		case fadd_op:
1710*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(add_s);
1711*4882a593Smuzhiyun 			handler.b = ieee754sp_add;
1712*4882a593Smuzhiyun 			goto scopbop;
1713*4882a593Smuzhiyun 		case fsub_op:
1714*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(sub_s);
1715*4882a593Smuzhiyun 			handler.b = ieee754sp_sub;
1716*4882a593Smuzhiyun 			goto scopbop;
1717*4882a593Smuzhiyun 		case fmul_op:
1718*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(mul_s);
1719*4882a593Smuzhiyun 			handler.b = ieee754sp_mul;
1720*4882a593Smuzhiyun 			goto scopbop;
1721*4882a593Smuzhiyun 		case fdiv_op:
1722*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(div_s);
1723*4882a593Smuzhiyun 			handler.b = ieee754sp_div;
1724*4882a593Smuzhiyun 			goto scopbop;
1725*4882a593Smuzhiyun 
1726*4882a593Smuzhiyun 			/* unary  ops */
1727*4882a593Smuzhiyun 		case fsqrt_op:
1728*4882a593Smuzhiyun 			if (!cpu_has_mips_2_3_4_5_r)
1729*4882a593Smuzhiyun 				return SIGILL;
1730*4882a593Smuzhiyun 
1731*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(sqrt_s);
1732*4882a593Smuzhiyun 			handler.u = ieee754sp_sqrt;
1733*4882a593Smuzhiyun 			goto scopuop;
1734*4882a593Smuzhiyun 
1735*4882a593Smuzhiyun 		/*
1736*4882a593Smuzhiyun 		 * Note that on some MIPS IV implementations such as the
1737*4882a593Smuzhiyun 		 * R5000 and R8000 the FSQRT and FRECIP instructions do not
1738*4882a593Smuzhiyun 		 * achieve full IEEE-754 accuracy - however this emulator does.
1739*4882a593Smuzhiyun 		 */
1740*4882a593Smuzhiyun 		case frsqrt_op:
1741*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_64_r2_r6)
1742*4882a593Smuzhiyun 				return SIGILL;
1743*4882a593Smuzhiyun 
1744*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(rsqrt_s);
1745*4882a593Smuzhiyun 			handler.u = fpemu_sp_rsqrt;
1746*4882a593Smuzhiyun 			goto scopuop;
1747*4882a593Smuzhiyun 
1748*4882a593Smuzhiyun 		case frecip_op:
1749*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_64_r2_r6)
1750*4882a593Smuzhiyun 				return SIGILL;
1751*4882a593Smuzhiyun 
1752*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(recip_s);
1753*4882a593Smuzhiyun 			handler.u = fpemu_sp_recip;
1754*4882a593Smuzhiyun 			goto scopuop;
1755*4882a593Smuzhiyun 
1756*4882a593Smuzhiyun 		case fmovc_op:
1757*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_r)
1758*4882a593Smuzhiyun 				return SIGILL;
1759*4882a593Smuzhiyun 
1760*4882a593Smuzhiyun 			cond = fpucondbit[MIPSInst_FT(ir) >> 2];
1761*4882a593Smuzhiyun 			if (((ctx->fcr31 & cond) != 0) !=
1762*4882a593Smuzhiyun 				((MIPSInst_FT(ir) & 1) != 0))
1763*4882a593Smuzhiyun 				return 0;
1764*4882a593Smuzhiyun 			SPFROMREG(rv.s, MIPSInst_FS(ir));
1765*4882a593Smuzhiyun 			break;
1766*4882a593Smuzhiyun 
1767*4882a593Smuzhiyun 		case fmovz_op:
1768*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_r)
1769*4882a593Smuzhiyun 				return SIGILL;
1770*4882a593Smuzhiyun 
1771*4882a593Smuzhiyun 			if (xcp->regs[MIPSInst_FT(ir)] != 0)
1772*4882a593Smuzhiyun 				return 0;
1773*4882a593Smuzhiyun 			SPFROMREG(rv.s, MIPSInst_FS(ir));
1774*4882a593Smuzhiyun 			break;
1775*4882a593Smuzhiyun 
1776*4882a593Smuzhiyun 		case fmovn_op:
1777*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_r)
1778*4882a593Smuzhiyun 				return SIGILL;
1779*4882a593Smuzhiyun 
1780*4882a593Smuzhiyun 			if (xcp->regs[MIPSInst_FT(ir)] == 0)
1781*4882a593Smuzhiyun 				return 0;
1782*4882a593Smuzhiyun 			SPFROMREG(rv.s, MIPSInst_FS(ir));
1783*4882a593Smuzhiyun 			break;
1784*4882a593Smuzhiyun 
1785*4882a593Smuzhiyun 		case fseleqz_op:
1786*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1787*4882a593Smuzhiyun 				return SIGILL;
1788*4882a593Smuzhiyun 
1789*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(seleqz_s);
1790*4882a593Smuzhiyun 			SPFROMREG(rv.s, MIPSInst_FT(ir));
1791*4882a593Smuzhiyun 			if (rv.w & 0x1)
1792*4882a593Smuzhiyun 				rv.w = 0;
1793*4882a593Smuzhiyun 			else
1794*4882a593Smuzhiyun 				SPFROMREG(rv.s, MIPSInst_FS(ir));
1795*4882a593Smuzhiyun 			break;
1796*4882a593Smuzhiyun 
1797*4882a593Smuzhiyun 		case fselnez_op:
1798*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1799*4882a593Smuzhiyun 				return SIGILL;
1800*4882a593Smuzhiyun 
1801*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(selnez_s);
1802*4882a593Smuzhiyun 			SPFROMREG(rv.s, MIPSInst_FT(ir));
1803*4882a593Smuzhiyun 			if (rv.w & 0x1)
1804*4882a593Smuzhiyun 				SPFROMREG(rv.s, MIPSInst_FS(ir));
1805*4882a593Smuzhiyun 			else
1806*4882a593Smuzhiyun 				rv.w = 0;
1807*4882a593Smuzhiyun 			break;
1808*4882a593Smuzhiyun 
1809*4882a593Smuzhiyun 		case fmaddf_op: {
1810*4882a593Smuzhiyun 			union ieee754sp ft, fs, fd;
1811*4882a593Smuzhiyun 
1812*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1813*4882a593Smuzhiyun 				return SIGILL;
1814*4882a593Smuzhiyun 
1815*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(maddf_s);
1816*4882a593Smuzhiyun 			SPFROMREG(ft, MIPSInst_FT(ir));
1817*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1818*4882a593Smuzhiyun 			SPFROMREG(fd, MIPSInst_FD(ir));
1819*4882a593Smuzhiyun 			rv.s = ieee754sp_maddf(fd, fs, ft);
1820*4882a593Smuzhiyun 			goto copcsr;
1821*4882a593Smuzhiyun 		}
1822*4882a593Smuzhiyun 
1823*4882a593Smuzhiyun 		case fmsubf_op: {
1824*4882a593Smuzhiyun 			union ieee754sp ft, fs, fd;
1825*4882a593Smuzhiyun 
1826*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1827*4882a593Smuzhiyun 				return SIGILL;
1828*4882a593Smuzhiyun 
1829*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(msubf_s);
1830*4882a593Smuzhiyun 			SPFROMREG(ft, MIPSInst_FT(ir));
1831*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1832*4882a593Smuzhiyun 			SPFROMREG(fd, MIPSInst_FD(ir));
1833*4882a593Smuzhiyun 			rv.s = ieee754sp_msubf(fd, fs, ft);
1834*4882a593Smuzhiyun 			goto copcsr;
1835*4882a593Smuzhiyun 		}
1836*4882a593Smuzhiyun 
1837*4882a593Smuzhiyun 		case frint_op: {
1838*4882a593Smuzhiyun 			union ieee754sp fs;
1839*4882a593Smuzhiyun 
1840*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1841*4882a593Smuzhiyun 				return SIGILL;
1842*4882a593Smuzhiyun 
1843*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(rint_s);
1844*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1845*4882a593Smuzhiyun 			rv.s = ieee754sp_rint(fs);
1846*4882a593Smuzhiyun 			goto copcsr;
1847*4882a593Smuzhiyun 		}
1848*4882a593Smuzhiyun 
1849*4882a593Smuzhiyun 		case fclass_op: {
1850*4882a593Smuzhiyun 			union ieee754sp fs;
1851*4882a593Smuzhiyun 
1852*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1853*4882a593Smuzhiyun 				return SIGILL;
1854*4882a593Smuzhiyun 
1855*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(class_s);
1856*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1857*4882a593Smuzhiyun 			rv.w = ieee754sp_2008class(fs);
1858*4882a593Smuzhiyun 			rfmt = w_fmt;
1859*4882a593Smuzhiyun 			goto copcsr;
1860*4882a593Smuzhiyun 		}
1861*4882a593Smuzhiyun 
1862*4882a593Smuzhiyun 		case fmin_op: {
1863*4882a593Smuzhiyun 			union ieee754sp fs, ft;
1864*4882a593Smuzhiyun 
1865*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1866*4882a593Smuzhiyun 				return SIGILL;
1867*4882a593Smuzhiyun 
1868*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(min_s);
1869*4882a593Smuzhiyun 			SPFROMREG(ft, MIPSInst_FT(ir));
1870*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1871*4882a593Smuzhiyun 			rv.s = ieee754sp_fmin(fs, ft);
1872*4882a593Smuzhiyun 			goto copcsr;
1873*4882a593Smuzhiyun 		}
1874*4882a593Smuzhiyun 
1875*4882a593Smuzhiyun 		case fmina_op: {
1876*4882a593Smuzhiyun 			union ieee754sp fs, ft;
1877*4882a593Smuzhiyun 
1878*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1879*4882a593Smuzhiyun 				return SIGILL;
1880*4882a593Smuzhiyun 
1881*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(mina_s);
1882*4882a593Smuzhiyun 			SPFROMREG(ft, MIPSInst_FT(ir));
1883*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1884*4882a593Smuzhiyun 			rv.s = ieee754sp_fmina(fs, ft);
1885*4882a593Smuzhiyun 			goto copcsr;
1886*4882a593Smuzhiyun 		}
1887*4882a593Smuzhiyun 
1888*4882a593Smuzhiyun 		case fmax_op: {
1889*4882a593Smuzhiyun 			union ieee754sp fs, ft;
1890*4882a593Smuzhiyun 
1891*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1892*4882a593Smuzhiyun 				return SIGILL;
1893*4882a593Smuzhiyun 
1894*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(max_s);
1895*4882a593Smuzhiyun 			SPFROMREG(ft, MIPSInst_FT(ir));
1896*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1897*4882a593Smuzhiyun 			rv.s = ieee754sp_fmax(fs, ft);
1898*4882a593Smuzhiyun 			goto copcsr;
1899*4882a593Smuzhiyun 		}
1900*4882a593Smuzhiyun 
1901*4882a593Smuzhiyun 		case fmaxa_op: {
1902*4882a593Smuzhiyun 			union ieee754sp fs, ft;
1903*4882a593Smuzhiyun 
1904*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
1905*4882a593Smuzhiyun 				return SIGILL;
1906*4882a593Smuzhiyun 
1907*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(maxa_s);
1908*4882a593Smuzhiyun 			SPFROMREG(ft, MIPSInst_FT(ir));
1909*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1910*4882a593Smuzhiyun 			rv.s = ieee754sp_fmaxa(fs, ft);
1911*4882a593Smuzhiyun 			goto copcsr;
1912*4882a593Smuzhiyun 		}
1913*4882a593Smuzhiyun 
1914*4882a593Smuzhiyun 		case fabs_op:
1915*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(abs_s);
1916*4882a593Smuzhiyun 			handler.u = ieee754sp_abs;
1917*4882a593Smuzhiyun 			goto scopuop;
1918*4882a593Smuzhiyun 
1919*4882a593Smuzhiyun 		case fneg_op:
1920*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(neg_s);
1921*4882a593Smuzhiyun 			handler.u = ieee754sp_neg;
1922*4882a593Smuzhiyun 			goto scopuop;
1923*4882a593Smuzhiyun 
1924*4882a593Smuzhiyun 		case fmov_op:
1925*4882a593Smuzhiyun 			/* an easy one */
1926*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(mov_s);
1927*4882a593Smuzhiyun 			SPFROMREG(rv.s, MIPSInst_FS(ir));
1928*4882a593Smuzhiyun 			goto copcsr;
1929*4882a593Smuzhiyun 
1930*4882a593Smuzhiyun 			/* binary op on handler */
1931*4882a593Smuzhiyun scopbop:
1932*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1933*4882a593Smuzhiyun 			SPFROMREG(ft, MIPSInst_FT(ir));
1934*4882a593Smuzhiyun 
1935*4882a593Smuzhiyun 			rv.s = (*handler.b) (fs, ft);
1936*4882a593Smuzhiyun 			goto copcsr;
1937*4882a593Smuzhiyun scopuop:
1938*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1939*4882a593Smuzhiyun 			rv.s = (*handler.u) (fs);
1940*4882a593Smuzhiyun 			goto copcsr;
1941*4882a593Smuzhiyun copcsr:
1942*4882a593Smuzhiyun 			if (ieee754_cxtest(IEEE754_INEXACT)) {
1943*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ieee754_inexact);
1944*4882a593Smuzhiyun 				rcsr |= FPU_CSR_INE_X | FPU_CSR_INE_S;
1945*4882a593Smuzhiyun 			}
1946*4882a593Smuzhiyun 			if (ieee754_cxtest(IEEE754_UNDERFLOW)) {
1947*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ieee754_underflow);
1948*4882a593Smuzhiyun 				rcsr |= FPU_CSR_UDF_X | FPU_CSR_UDF_S;
1949*4882a593Smuzhiyun 			}
1950*4882a593Smuzhiyun 			if (ieee754_cxtest(IEEE754_OVERFLOW)) {
1951*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ieee754_overflow);
1952*4882a593Smuzhiyun 				rcsr |= FPU_CSR_OVF_X | FPU_CSR_OVF_S;
1953*4882a593Smuzhiyun 			}
1954*4882a593Smuzhiyun 			if (ieee754_cxtest(IEEE754_ZERO_DIVIDE)) {
1955*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ieee754_zerodiv);
1956*4882a593Smuzhiyun 				rcsr |= FPU_CSR_DIV_X | FPU_CSR_DIV_S;
1957*4882a593Smuzhiyun 			}
1958*4882a593Smuzhiyun 			if (ieee754_cxtest(IEEE754_INVALID_OPERATION)) {
1959*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ieee754_invalidop);
1960*4882a593Smuzhiyun 				rcsr |= FPU_CSR_INV_X | FPU_CSR_INV_S;
1961*4882a593Smuzhiyun 			}
1962*4882a593Smuzhiyun 			break;
1963*4882a593Smuzhiyun 
1964*4882a593Smuzhiyun 			/* unary conv ops */
1965*4882a593Smuzhiyun 		case fcvts_op:
1966*4882a593Smuzhiyun 			return SIGILL;	/* not defined */
1967*4882a593Smuzhiyun 
1968*4882a593Smuzhiyun 		case fcvtd_op:
1969*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_d_s);
1970*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1971*4882a593Smuzhiyun 			rv.d = ieee754dp_fsp(fs);
1972*4882a593Smuzhiyun 			rfmt = d_fmt;
1973*4882a593Smuzhiyun 			goto copcsr;
1974*4882a593Smuzhiyun 
1975*4882a593Smuzhiyun 		case fcvtw_op:
1976*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_w_s);
1977*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
1978*4882a593Smuzhiyun 			rv.w = ieee754sp_tint(fs);
1979*4882a593Smuzhiyun 			rfmt = w_fmt;
1980*4882a593Smuzhiyun 			goto copcsr;
1981*4882a593Smuzhiyun 
1982*4882a593Smuzhiyun 		case fround_op:
1983*4882a593Smuzhiyun 		case ftrunc_op:
1984*4882a593Smuzhiyun 		case fceil_op:
1985*4882a593Smuzhiyun 		case ffloor_op:
1986*4882a593Smuzhiyun 			if (!cpu_has_mips_2_3_4_5_r)
1987*4882a593Smuzhiyun 				return SIGILL;
1988*4882a593Smuzhiyun 
1989*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == fceil_op)
1990*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ceil_w_s);
1991*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == ffloor_op)
1992*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(floor_w_s);
1993*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == fround_op)
1994*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(round_w_s);
1995*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == ftrunc_op)
1996*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(trunc_w_s);
1997*4882a593Smuzhiyun 
1998*4882a593Smuzhiyun 			oldrm = ieee754_csr.rm;
1999*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
2000*4882a593Smuzhiyun 			ieee754_csr.rm = MIPSInst_FUNC(ir);
2001*4882a593Smuzhiyun 			rv.w = ieee754sp_tint(fs);
2002*4882a593Smuzhiyun 			ieee754_csr.rm = oldrm;
2003*4882a593Smuzhiyun 			rfmt = w_fmt;
2004*4882a593Smuzhiyun 			goto copcsr;
2005*4882a593Smuzhiyun 
2006*4882a593Smuzhiyun 		case fsel_op:
2007*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2008*4882a593Smuzhiyun 				return SIGILL;
2009*4882a593Smuzhiyun 
2010*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(sel_s);
2011*4882a593Smuzhiyun 			SPFROMREG(fd, MIPSInst_FD(ir));
2012*4882a593Smuzhiyun 			if (fd.bits & 0x1)
2013*4882a593Smuzhiyun 				SPFROMREG(rv.s, MIPSInst_FT(ir));
2014*4882a593Smuzhiyun 			else
2015*4882a593Smuzhiyun 				SPFROMREG(rv.s, MIPSInst_FS(ir));
2016*4882a593Smuzhiyun 			break;
2017*4882a593Smuzhiyun 
2018*4882a593Smuzhiyun 		case fcvtl_op:
2019*4882a593Smuzhiyun 			if (!cpu_has_mips_3_4_5_64_r2_r6)
2020*4882a593Smuzhiyun 				return SIGILL;
2021*4882a593Smuzhiyun 
2022*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_l_s);
2023*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
2024*4882a593Smuzhiyun 			rv.l = ieee754sp_tlong(fs);
2025*4882a593Smuzhiyun 			rfmt = l_fmt;
2026*4882a593Smuzhiyun 			goto copcsr;
2027*4882a593Smuzhiyun 
2028*4882a593Smuzhiyun 		case froundl_op:
2029*4882a593Smuzhiyun 		case ftruncl_op:
2030*4882a593Smuzhiyun 		case fceill_op:
2031*4882a593Smuzhiyun 		case ffloorl_op:
2032*4882a593Smuzhiyun 			if (!cpu_has_mips_3_4_5_64_r2_r6)
2033*4882a593Smuzhiyun 				return SIGILL;
2034*4882a593Smuzhiyun 
2035*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == fceill_op)
2036*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ceil_l_s);
2037*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == ffloorl_op)
2038*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(floor_l_s);
2039*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == froundl_op)
2040*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(round_l_s);
2041*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == ftruncl_op)
2042*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(trunc_l_s);
2043*4882a593Smuzhiyun 
2044*4882a593Smuzhiyun 			oldrm = ieee754_csr.rm;
2045*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
2046*4882a593Smuzhiyun 			ieee754_csr.rm = MIPSInst_FUNC(ir);
2047*4882a593Smuzhiyun 			rv.l = ieee754sp_tlong(fs);
2048*4882a593Smuzhiyun 			ieee754_csr.rm = oldrm;
2049*4882a593Smuzhiyun 			rfmt = l_fmt;
2050*4882a593Smuzhiyun 			goto copcsr;
2051*4882a593Smuzhiyun 
2052*4882a593Smuzhiyun 		default:
2053*4882a593Smuzhiyun 			if (!NO_R6EMU && MIPSInst_FUNC(ir) >= fcmp_op) {
2054*4882a593Smuzhiyun 				unsigned int cmpop;
2055*4882a593Smuzhiyun 				union ieee754sp fs, ft;
2056*4882a593Smuzhiyun 
2057*4882a593Smuzhiyun 				cmpop = MIPSInst_FUNC(ir) - fcmp_op;
2058*4882a593Smuzhiyun 				SPFROMREG(fs, MIPSInst_FS(ir));
2059*4882a593Smuzhiyun 				SPFROMREG(ft, MIPSInst_FT(ir));
2060*4882a593Smuzhiyun 				rv.w = ieee754sp_cmp(fs, ft,
2061*4882a593Smuzhiyun 					cmptab[cmpop & 0x7], cmpop & 0x8);
2062*4882a593Smuzhiyun 				rfmt = -1;
2063*4882a593Smuzhiyun 				if ((cmpop & 0x8) && ieee754_cxtest
2064*4882a593Smuzhiyun 					(IEEE754_INVALID_OPERATION))
2065*4882a593Smuzhiyun 					rcsr = FPU_CSR_INV_X | FPU_CSR_INV_S;
2066*4882a593Smuzhiyun 				else
2067*4882a593Smuzhiyun 					goto copcsr;
2068*4882a593Smuzhiyun 
2069*4882a593Smuzhiyun 			} else
2070*4882a593Smuzhiyun 				return SIGILL;
2071*4882a593Smuzhiyun 			break;
2072*4882a593Smuzhiyun 		}
2073*4882a593Smuzhiyun 		break;
2074*4882a593Smuzhiyun 	}
2075*4882a593Smuzhiyun 
2076*4882a593Smuzhiyun 	case d_fmt: {
2077*4882a593Smuzhiyun 		union ieee754dp fd, fs, ft;
2078*4882a593Smuzhiyun 		union {
2079*4882a593Smuzhiyun 			union ieee754dp(*b) (union ieee754dp, union ieee754dp);
2080*4882a593Smuzhiyun 			union ieee754dp(*u) (union ieee754dp);
2081*4882a593Smuzhiyun 		} handler;
2082*4882a593Smuzhiyun 
2083*4882a593Smuzhiyun 		switch (MIPSInst_FUNC(ir)) {
2084*4882a593Smuzhiyun 			/* binary ops */
2085*4882a593Smuzhiyun 		case fadd_op:
2086*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(add_d);
2087*4882a593Smuzhiyun 			handler.b = ieee754dp_add;
2088*4882a593Smuzhiyun 			goto dcopbop;
2089*4882a593Smuzhiyun 		case fsub_op:
2090*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(sub_d);
2091*4882a593Smuzhiyun 			handler.b = ieee754dp_sub;
2092*4882a593Smuzhiyun 			goto dcopbop;
2093*4882a593Smuzhiyun 		case fmul_op:
2094*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(mul_d);
2095*4882a593Smuzhiyun 			handler.b = ieee754dp_mul;
2096*4882a593Smuzhiyun 			goto dcopbop;
2097*4882a593Smuzhiyun 		case fdiv_op:
2098*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(div_d);
2099*4882a593Smuzhiyun 			handler.b = ieee754dp_div;
2100*4882a593Smuzhiyun 			goto dcopbop;
2101*4882a593Smuzhiyun 
2102*4882a593Smuzhiyun 			/* unary  ops */
2103*4882a593Smuzhiyun 		case fsqrt_op:
2104*4882a593Smuzhiyun 			if (!cpu_has_mips_2_3_4_5_r)
2105*4882a593Smuzhiyun 				return SIGILL;
2106*4882a593Smuzhiyun 
2107*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(sqrt_d);
2108*4882a593Smuzhiyun 			handler.u = ieee754dp_sqrt;
2109*4882a593Smuzhiyun 			goto dcopuop;
2110*4882a593Smuzhiyun 		/*
2111*4882a593Smuzhiyun 		 * Note that on some MIPS IV implementations such as the
2112*4882a593Smuzhiyun 		 * R5000 and R8000 the FSQRT and FRECIP instructions do not
2113*4882a593Smuzhiyun 		 * achieve full IEEE-754 accuracy - however this emulator does.
2114*4882a593Smuzhiyun 		 */
2115*4882a593Smuzhiyun 		case frsqrt_op:
2116*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_64_r2_r6)
2117*4882a593Smuzhiyun 				return SIGILL;
2118*4882a593Smuzhiyun 
2119*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(rsqrt_d);
2120*4882a593Smuzhiyun 			handler.u = fpemu_dp_rsqrt;
2121*4882a593Smuzhiyun 			goto dcopuop;
2122*4882a593Smuzhiyun 		case frecip_op:
2123*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_64_r2_r6)
2124*4882a593Smuzhiyun 				return SIGILL;
2125*4882a593Smuzhiyun 
2126*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(recip_d);
2127*4882a593Smuzhiyun 			handler.u = fpemu_dp_recip;
2128*4882a593Smuzhiyun 			goto dcopuop;
2129*4882a593Smuzhiyun 		case fmovc_op:
2130*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_r)
2131*4882a593Smuzhiyun 				return SIGILL;
2132*4882a593Smuzhiyun 
2133*4882a593Smuzhiyun 			cond = fpucondbit[MIPSInst_FT(ir) >> 2];
2134*4882a593Smuzhiyun 			if (((ctx->fcr31 & cond) != 0) !=
2135*4882a593Smuzhiyun 				((MIPSInst_FT(ir) & 1) != 0))
2136*4882a593Smuzhiyun 				return 0;
2137*4882a593Smuzhiyun 			DPFROMREG(rv.d, MIPSInst_FS(ir));
2138*4882a593Smuzhiyun 			break;
2139*4882a593Smuzhiyun 		case fmovz_op:
2140*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_r)
2141*4882a593Smuzhiyun 				return SIGILL;
2142*4882a593Smuzhiyun 
2143*4882a593Smuzhiyun 			if (xcp->regs[MIPSInst_FT(ir)] != 0)
2144*4882a593Smuzhiyun 				return 0;
2145*4882a593Smuzhiyun 			DPFROMREG(rv.d, MIPSInst_FS(ir));
2146*4882a593Smuzhiyun 			break;
2147*4882a593Smuzhiyun 		case fmovn_op:
2148*4882a593Smuzhiyun 			if (!cpu_has_mips_4_5_r)
2149*4882a593Smuzhiyun 				return SIGILL;
2150*4882a593Smuzhiyun 
2151*4882a593Smuzhiyun 			if (xcp->regs[MIPSInst_FT(ir)] == 0)
2152*4882a593Smuzhiyun 				return 0;
2153*4882a593Smuzhiyun 			DPFROMREG(rv.d, MIPSInst_FS(ir));
2154*4882a593Smuzhiyun 			break;
2155*4882a593Smuzhiyun 
2156*4882a593Smuzhiyun 		case fseleqz_op:
2157*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2158*4882a593Smuzhiyun 				return SIGILL;
2159*4882a593Smuzhiyun 
2160*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(seleqz_d);
2161*4882a593Smuzhiyun 			DPFROMREG(rv.d, MIPSInst_FT(ir));
2162*4882a593Smuzhiyun 			if (rv.l & 0x1)
2163*4882a593Smuzhiyun 				rv.l = 0;
2164*4882a593Smuzhiyun 			else
2165*4882a593Smuzhiyun 				DPFROMREG(rv.d, MIPSInst_FS(ir));
2166*4882a593Smuzhiyun 			break;
2167*4882a593Smuzhiyun 
2168*4882a593Smuzhiyun 		case fselnez_op:
2169*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2170*4882a593Smuzhiyun 				return SIGILL;
2171*4882a593Smuzhiyun 
2172*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(selnez_d);
2173*4882a593Smuzhiyun 			DPFROMREG(rv.d, MIPSInst_FT(ir));
2174*4882a593Smuzhiyun 			if (rv.l & 0x1)
2175*4882a593Smuzhiyun 				DPFROMREG(rv.d, MIPSInst_FS(ir));
2176*4882a593Smuzhiyun 			else
2177*4882a593Smuzhiyun 				rv.l = 0;
2178*4882a593Smuzhiyun 			break;
2179*4882a593Smuzhiyun 
2180*4882a593Smuzhiyun 		case fmaddf_op: {
2181*4882a593Smuzhiyun 			union ieee754dp ft, fs, fd;
2182*4882a593Smuzhiyun 
2183*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2184*4882a593Smuzhiyun 				return SIGILL;
2185*4882a593Smuzhiyun 
2186*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(maddf_d);
2187*4882a593Smuzhiyun 			DPFROMREG(ft, MIPSInst_FT(ir));
2188*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2189*4882a593Smuzhiyun 			DPFROMREG(fd, MIPSInst_FD(ir));
2190*4882a593Smuzhiyun 			rv.d = ieee754dp_maddf(fd, fs, ft);
2191*4882a593Smuzhiyun 			goto copcsr;
2192*4882a593Smuzhiyun 		}
2193*4882a593Smuzhiyun 
2194*4882a593Smuzhiyun 		case fmsubf_op: {
2195*4882a593Smuzhiyun 			union ieee754dp ft, fs, fd;
2196*4882a593Smuzhiyun 
2197*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2198*4882a593Smuzhiyun 				return SIGILL;
2199*4882a593Smuzhiyun 
2200*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(msubf_d);
2201*4882a593Smuzhiyun 			DPFROMREG(ft, MIPSInst_FT(ir));
2202*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2203*4882a593Smuzhiyun 			DPFROMREG(fd, MIPSInst_FD(ir));
2204*4882a593Smuzhiyun 			rv.d = ieee754dp_msubf(fd, fs, ft);
2205*4882a593Smuzhiyun 			goto copcsr;
2206*4882a593Smuzhiyun 		}
2207*4882a593Smuzhiyun 
2208*4882a593Smuzhiyun 		case frint_op: {
2209*4882a593Smuzhiyun 			union ieee754dp fs;
2210*4882a593Smuzhiyun 
2211*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2212*4882a593Smuzhiyun 				return SIGILL;
2213*4882a593Smuzhiyun 
2214*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(rint_d);
2215*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2216*4882a593Smuzhiyun 			rv.d = ieee754dp_rint(fs);
2217*4882a593Smuzhiyun 			goto copcsr;
2218*4882a593Smuzhiyun 		}
2219*4882a593Smuzhiyun 
2220*4882a593Smuzhiyun 		case fclass_op: {
2221*4882a593Smuzhiyun 			union ieee754dp fs;
2222*4882a593Smuzhiyun 
2223*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2224*4882a593Smuzhiyun 				return SIGILL;
2225*4882a593Smuzhiyun 
2226*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(class_d);
2227*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2228*4882a593Smuzhiyun 			rv.l = ieee754dp_2008class(fs);
2229*4882a593Smuzhiyun 			rfmt = l_fmt;
2230*4882a593Smuzhiyun 			goto copcsr;
2231*4882a593Smuzhiyun 		}
2232*4882a593Smuzhiyun 
2233*4882a593Smuzhiyun 		case fmin_op: {
2234*4882a593Smuzhiyun 			union ieee754dp fs, ft;
2235*4882a593Smuzhiyun 
2236*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2237*4882a593Smuzhiyun 				return SIGILL;
2238*4882a593Smuzhiyun 
2239*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(min_d);
2240*4882a593Smuzhiyun 			DPFROMREG(ft, MIPSInst_FT(ir));
2241*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2242*4882a593Smuzhiyun 			rv.d = ieee754dp_fmin(fs, ft);
2243*4882a593Smuzhiyun 			goto copcsr;
2244*4882a593Smuzhiyun 		}
2245*4882a593Smuzhiyun 
2246*4882a593Smuzhiyun 		case fmina_op: {
2247*4882a593Smuzhiyun 			union ieee754dp fs, ft;
2248*4882a593Smuzhiyun 
2249*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2250*4882a593Smuzhiyun 				return SIGILL;
2251*4882a593Smuzhiyun 
2252*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(mina_d);
2253*4882a593Smuzhiyun 			DPFROMREG(ft, MIPSInst_FT(ir));
2254*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2255*4882a593Smuzhiyun 			rv.d = ieee754dp_fmina(fs, ft);
2256*4882a593Smuzhiyun 			goto copcsr;
2257*4882a593Smuzhiyun 		}
2258*4882a593Smuzhiyun 
2259*4882a593Smuzhiyun 		case fmax_op: {
2260*4882a593Smuzhiyun 			union ieee754dp fs, ft;
2261*4882a593Smuzhiyun 
2262*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2263*4882a593Smuzhiyun 				return SIGILL;
2264*4882a593Smuzhiyun 
2265*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(max_d);
2266*4882a593Smuzhiyun 			DPFROMREG(ft, MIPSInst_FT(ir));
2267*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2268*4882a593Smuzhiyun 			rv.d = ieee754dp_fmax(fs, ft);
2269*4882a593Smuzhiyun 			goto copcsr;
2270*4882a593Smuzhiyun 		}
2271*4882a593Smuzhiyun 
2272*4882a593Smuzhiyun 		case fmaxa_op: {
2273*4882a593Smuzhiyun 			union ieee754dp fs, ft;
2274*4882a593Smuzhiyun 
2275*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2276*4882a593Smuzhiyun 				return SIGILL;
2277*4882a593Smuzhiyun 
2278*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(maxa_d);
2279*4882a593Smuzhiyun 			DPFROMREG(ft, MIPSInst_FT(ir));
2280*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2281*4882a593Smuzhiyun 			rv.d = ieee754dp_fmaxa(fs, ft);
2282*4882a593Smuzhiyun 			goto copcsr;
2283*4882a593Smuzhiyun 		}
2284*4882a593Smuzhiyun 
2285*4882a593Smuzhiyun 		case fabs_op:
2286*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(abs_d);
2287*4882a593Smuzhiyun 			handler.u = ieee754dp_abs;
2288*4882a593Smuzhiyun 			goto dcopuop;
2289*4882a593Smuzhiyun 
2290*4882a593Smuzhiyun 		case fneg_op:
2291*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(neg_d);
2292*4882a593Smuzhiyun 			handler.u = ieee754dp_neg;
2293*4882a593Smuzhiyun 			goto dcopuop;
2294*4882a593Smuzhiyun 
2295*4882a593Smuzhiyun 		case fmov_op:
2296*4882a593Smuzhiyun 			/* an easy one */
2297*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(mov_d);
2298*4882a593Smuzhiyun 			DPFROMREG(rv.d, MIPSInst_FS(ir));
2299*4882a593Smuzhiyun 			goto copcsr;
2300*4882a593Smuzhiyun 
2301*4882a593Smuzhiyun 			/* binary op on handler */
2302*4882a593Smuzhiyun dcopbop:
2303*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2304*4882a593Smuzhiyun 			DPFROMREG(ft, MIPSInst_FT(ir));
2305*4882a593Smuzhiyun 
2306*4882a593Smuzhiyun 			rv.d = (*handler.b) (fs, ft);
2307*4882a593Smuzhiyun 			goto copcsr;
2308*4882a593Smuzhiyun dcopuop:
2309*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2310*4882a593Smuzhiyun 			rv.d = (*handler.u) (fs);
2311*4882a593Smuzhiyun 			goto copcsr;
2312*4882a593Smuzhiyun 
2313*4882a593Smuzhiyun 		/*
2314*4882a593Smuzhiyun 		 * unary conv ops
2315*4882a593Smuzhiyun 		 */
2316*4882a593Smuzhiyun 		case fcvts_op:
2317*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_s_d);
2318*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2319*4882a593Smuzhiyun 			rv.s = ieee754sp_fdp(fs);
2320*4882a593Smuzhiyun 			rfmt = s_fmt;
2321*4882a593Smuzhiyun 			goto copcsr;
2322*4882a593Smuzhiyun 
2323*4882a593Smuzhiyun 		case fcvtd_op:
2324*4882a593Smuzhiyun 			return SIGILL;	/* not defined */
2325*4882a593Smuzhiyun 
2326*4882a593Smuzhiyun 		case fcvtw_op:
2327*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_w_d);
2328*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2329*4882a593Smuzhiyun 			rv.w = ieee754dp_tint(fs);	/* wrong */
2330*4882a593Smuzhiyun 			rfmt = w_fmt;
2331*4882a593Smuzhiyun 			goto copcsr;
2332*4882a593Smuzhiyun 
2333*4882a593Smuzhiyun 		case fround_op:
2334*4882a593Smuzhiyun 		case ftrunc_op:
2335*4882a593Smuzhiyun 		case fceil_op:
2336*4882a593Smuzhiyun 		case ffloor_op:
2337*4882a593Smuzhiyun 			if (!cpu_has_mips_2_3_4_5_r)
2338*4882a593Smuzhiyun 				return SIGILL;
2339*4882a593Smuzhiyun 
2340*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == fceil_op)
2341*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ceil_w_d);
2342*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == ffloor_op)
2343*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(floor_w_d);
2344*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == fround_op)
2345*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(round_w_d);
2346*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == ftrunc_op)
2347*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(trunc_w_d);
2348*4882a593Smuzhiyun 
2349*4882a593Smuzhiyun 			oldrm = ieee754_csr.rm;
2350*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2351*4882a593Smuzhiyun 			ieee754_csr.rm = MIPSInst_FUNC(ir);
2352*4882a593Smuzhiyun 			rv.w = ieee754dp_tint(fs);
2353*4882a593Smuzhiyun 			ieee754_csr.rm = oldrm;
2354*4882a593Smuzhiyun 			rfmt = w_fmt;
2355*4882a593Smuzhiyun 			goto copcsr;
2356*4882a593Smuzhiyun 
2357*4882a593Smuzhiyun 		case fsel_op:
2358*4882a593Smuzhiyun 			if (!cpu_has_mips_r6)
2359*4882a593Smuzhiyun 				return SIGILL;
2360*4882a593Smuzhiyun 
2361*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(sel_d);
2362*4882a593Smuzhiyun 			DPFROMREG(fd, MIPSInst_FD(ir));
2363*4882a593Smuzhiyun 			if (fd.bits & 0x1)
2364*4882a593Smuzhiyun 				DPFROMREG(rv.d, MIPSInst_FT(ir));
2365*4882a593Smuzhiyun 			else
2366*4882a593Smuzhiyun 				DPFROMREG(rv.d, MIPSInst_FS(ir));
2367*4882a593Smuzhiyun 			break;
2368*4882a593Smuzhiyun 
2369*4882a593Smuzhiyun 		case fcvtl_op:
2370*4882a593Smuzhiyun 			if (!cpu_has_mips_3_4_5_64_r2_r6)
2371*4882a593Smuzhiyun 				return SIGILL;
2372*4882a593Smuzhiyun 
2373*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_l_d);
2374*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2375*4882a593Smuzhiyun 			rv.l = ieee754dp_tlong(fs);
2376*4882a593Smuzhiyun 			rfmt = l_fmt;
2377*4882a593Smuzhiyun 			goto copcsr;
2378*4882a593Smuzhiyun 
2379*4882a593Smuzhiyun 		case froundl_op:
2380*4882a593Smuzhiyun 		case ftruncl_op:
2381*4882a593Smuzhiyun 		case fceill_op:
2382*4882a593Smuzhiyun 		case ffloorl_op:
2383*4882a593Smuzhiyun 			if (!cpu_has_mips_3_4_5_64_r2_r6)
2384*4882a593Smuzhiyun 				return SIGILL;
2385*4882a593Smuzhiyun 
2386*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == fceill_op)
2387*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(ceil_l_d);
2388*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == ffloorl_op)
2389*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(floor_l_d);
2390*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == froundl_op)
2391*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(round_l_d);
2392*4882a593Smuzhiyun 			if (MIPSInst_FUNC(ir) == ftruncl_op)
2393*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(trunc_l_d);
2394*4882a593Smuzhiyun 
2395*4882a593Smuzhiyun 			oldrm = ieee754_csr.rm;
2396*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2397*4882a593Smuzhiyun 			ieee754_csr.rm = MIPSInst_FUNC(ir);
2398*4882a593Smuzhiyun 			rv.l = ieee754dp_tlong(fs);
2399*4882a593Smuzhiyun 			ieee754_csr.rm = oldrm;
2400*4882a593Smuzhiyun 			rfmt = l_fmt;
2401*4882a593Smuzhiyun 			goto copcsr;
2402*4882a593Smuzhiyun 
2403*4882a593Smuzhiyun 		default:
2404*4882a593Smuzhiyun 			if (!NO_R6EMU && MIPSInst_FUNC(ir) >= fcmp_op) {
2405*4882a593Smuzhiyun 				unsigned int cmpop;
2406*4882a593Smuzhiyun 				union ieee754dp fs, ft;
2407*4882a593Smuzhiyun 
2408*4882a593Smuzhiyun 				cmpop = MIPSInst_FUNC(ir) - fcmp_op;
2409*4882a593Smuzhiyun 				DPFROMREG(fs, MIPSInst_FS(ir));
2410*4882a593Smuzhiyun 				DPFROMREG(ft, MIPSInst_FT(ir));
2411*4882a593Smuzhiyun 				rv.w = ieee754dp_cmp(fs, ft,
2412*4882a593Smuzhiyun 					cmptab[cmpop & 0x7], cmpop & 0x8);
2413*4882a593Smuzhiyun 				rfmt = -1;
2414*4882a593Smuzhiyun 				if ((cmpop & 0x8)
2415*4882a593Smuzhiyun 					&&
2416*4882a593Smuzhiyun 					ieee754_cxtest
2417*4882a593Smuzhiyun 					(IEEE754_INVALID_OPERATION))
2418*4882a593Smuzhiyun 					rcsr = FPU_CSR_INV_X | FPU_CSR_INV_S;
2419*4882a593Smuzhiyun 				else
2420*4882a593Smuzhiyun 					goto copcsr;
2421*4882a593Smuzhiyun 
2422*4882a593Smuzhiyun 			}
2423*4882a593Smuzhiyun 			else {
2424*4882a593Smuzhiyun 				return SIGILL;
2425*4882a593Smuzhiyun 			}
2426*4882a593Smuzhiyun 			break;
2427*4882a593Smuzhiyun 		}
2428*4882a593Smuzhiyun 		break;
2429*4882a593Smuzhiyun 	}
2430*4882a593Smuzhiyun 
2431*4882a593Smuzhiyun 	case w_fmt: {
2432*4882a593Smuzhiyun 		union ieee754dp fs;
2433*4882a593Smuzhiyun 
2434*4882a593Smuzhiyun 		switch (MIPSInst_FUNC(ir)) {
2435*4882a593Smuzhiyun 		case fcvts_op:
2436*4882a593Smuzhiyun 			/* convert word to single precision real */
2437*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_s_w);
2438*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
2439*4882a593Smuzhiyun 			rv.s = ieee754sp_fint(fs.bits);
2440*4882a593Smuzhiyun 			rfmt = s_fmt;
2441*4882a593Smuzhiyun 			goto copcsr;
2442*4882a593Smuzhiyun 		case fcvtd_op:
2443*4882a593Smuzhiyun 			/* convert word to double precision real */
2444*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_d_w);
2445*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
2446*4882a593Smuzhiyun 			rv.d = ieee754dp_fint(fs.bits);
2447*4882a593Smuzhiyun 			rfmt = d_fmt;
2448*4882a593Smuzhiyun 			goto copcsr;
2449*4882a593Smuzhiyun 		default: {
2450*4882a593Smuzhiyun 			/* Emulating the new CMP.condn.fmt R6 instruction */
2451*4882a593Smuzhiyun #define CMPOP_MASK	0x7
2452*4882a593Smuzhiyun #define SIGN_BIT	(0x1 << 3)
2453*4882a593Smuzhiyun #define PREDICATE_BIT	(0x1 << 4)
2454*4882a593Smuzhiyun 
2455*4882a593Smuzhiyun 			int cmpop = MIPSInst_FUNC(ir) & CMPOP_MASK;
2456*4882a593Smuzhiyun 			int sig = MIPSInst_FUNC(ir) & SIGN_BIT;
2457*4882a593Smuzhiyun 			union ieee754sp fs, ft;
2458*4882a593Smuzhiyun 
2459*4882a593Smuzhiyun 			/* This is an R6 only instruction */
2460*4882a593Smuzhiyun 			if (!cpu_has_mips_r6 ||
2461*4882a593Smuzhiyun 			    (MIPSInst_FUNC(ir) & 0x20))
2462*4882a593Smuzhiyun 				return SIGILL;
2463*4882a593Smuzhiyun 
2464*4882a593Smuzhiyun 			if (!sig) {
2465*4882a593Smuzhiyun 				if (!(MIPSInst_FUNC(ir) & PREDICATE_BIT)) {
2466*4882a593Smuzhiyun 					switch (cmpop) {
2467*4882a593Smuzhiyun 					case 0:
2468*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_af_s);
2469*4882a593Smuzhiyun 					break;
2470*4882a593Smuzhiyun 					case 1:
2471*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_un_s);
2472*4882a593Smuzhiyun 					break;
2473*4882a593Smuzhiyun 					case 2:
2474*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_eq_s);
2475*4882a593Smuzhiyun 					break;
2476*4882a593Smuzhiyun 					case 3:
2477*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_ueq_s);
2478*4882a593Smuzhiyun 					break;
2479*4882a593Smuzhiyun 					case 4:
2480*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_lt_s);
2481*4882a593Smuzhiyun 					break;
2482*4882a593Smuzhiyun 					case 5:
2483*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_ult_s);
2484*4882a593Smuzhiyun 					break;
2485*4882a593Smuzhiyun 					case 6:
2486*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_le_s);
2487*4882a593Smuzhiyun 					break;
2488*4882a593Smuzhiyun 					case 7:
2489*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_ule_s);
2490*4882a593Smuzhiyun 					break;
2491*4882a593Smuzhiyun 					}
2492*4882a593Smuzhiyun 				} else {
2493*4882a593Smuzhiyun 					switch (cmpop) {
2494*4882a593Smuzhiyun 					case 1:
2495*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_or_s);
2496*4882a593Smuzhiyun 					break;
2497*4882a593Smuzhiyun 					case 2:
2498*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_une_s);
2499*4882a593Smuzhiyun 					break;
2500*4882a593Smuzhiyun 					case 3:
2501*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_ne_s);
2502*4882a593Smuzhiyun 					break;
2503*4882a593Smuzhiyun 					}
2504*4882a593Smuzhiyun 				}
2505*4882a593Smuzhiyun 			} else {
2506*4882a593Smuzhiyun 				if (!(MIPSInst_FUNC(ir) & PREDICATE_BIT)) {
2507*4882a593Smuzhiyun 					switch (cmpop) {
2508*4882a593Smuzhiyun 					case 0:
2509*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_saf_s);
2510*4882a593Smuzhiyun 					break;
2511*4882a593Smuzhiyun 					case 1:
2512*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sun_s);
2513*4882a593Smuzhiyun 					break;
2514*4882a593Smuzhiyun 					case 2:
2515*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_seq_s);
2516*4882a593Smuzhiyun 					break;
2517*4882a593Smuzhiyun 					case 3:
2518*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sueq_s);
2519*4882a593Smuzhiyun 					break;
2520*4882a593Smuzhiyun 					case 4:
2521*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_slt_s);
2522*4882a593Smuzhiyun 					break;
2523*4882a593Smuzhiyun 					case 5:
2524*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sult_s);
2525*4882a593Smuzhiyun 					break;
2526*4882a593Smuzhiyun 					case 6:
2527*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sle_s);
2528*4882a593Smuzhiyun 					break;
2529*4882a593Smuzhiyun 					case 7:
2530*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sule_s);
2531*4882a593Smuzhiyun 					break;
2532*4882a593Smuzhiyun 					}
2533*4882a593Smuzhiyun 				} else {
2534*4882a593Smuzhiyun 					switch (cmpop) {
2535*4882a593Smuzhiyun 					case 1:
2536*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sor_s);
2537*4882a593Smuzhiyun 					break;
2538*4882a593Smuzhiyun 					case 2:
2539*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sune_s);
2540*4882a593Smuzhiyun 					break;
2541*4882a593Smuzhiyun 					case 3:
2542*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sne_s);
2543*4882a593Smuzhiyun 					break;
2544*4882a593Smuzhiyun 					}
2545*4882a593Smuzhiyun 				}
2546*4882a593Smuzhiyun 			}
2547*4882a593Smuzhiyun 
2548*4882a593Smuzhiyun 			/* fmt is w_fmt for single precision so fix it */
2549*4882a593Smuzhiyun 			rfmt = s_fmt;
2550*4882a593Smuzhiyun 			/* default to false */
2551*4882a593Smuzhiyun 			rv.w = 0;
2552*4882a593Smuzhiyun 
2553*4882a593Smuzhiyun 			/* CMP.condn.S */
2554*4882a593Smuzhiyun 			SPFROMREG(fs, MIPSInst_FS(ir));
2555*4882a593Smuzhiyun 			SPFROMREG(ft, MIPSInst_FT(ir));
2556*4882a593Smuzhiyun 
2557*4882a593Smuzhiyun 			/* positive predicates */
2558*4882a593Smuzhiyun 			if (!(MIPSInst_FUNC(ir) & PREDICATE_BIT)) {
2559*4882a593Smuzhiyun 				if (ieee754sp_cmp(fs, ft, cmptab[cmpop],
2560*4882a593Smuzhiyun 						  sig))
2561*4882a593Smuzhiyun 				    rv.w = -1; /* true, all 1s */
2562*4882a593Smuzhiyun 				if ((sig) &&
2563*4882a593Smuzhiyun 				    ieee754_cxtest(IEEE754_INVALID_OPERATION))
2564*4882a593Smuzhiyun 					rcsr = FPU_CSR_INV_X | FPU_CSR_INV_S;
2565*4882a593Smuzhiyun 				else
2566*4882a593Smuzhiyun 					goto copcsr;
2567*4882a593Smuzhiyun 			} else {
2568*4882a593Smuzhiyun 				/* negative predicates */
2569*4882a593Smuzhiyun 				switch (cmpop) {
2570*4882a593Smuzhiyun 				case 1:
2571*4882a593Smuzhiyun 				case 2:
2572*4882a593Smuzhiyun 				case 3:
2573*4882a593Smuzhiyun 					if (ieee754sp_cmp(fs, ft,
2574*4882a593Smuzhiyun 							  negative_cmptab[cmpop],
2575*4882a593Smuzhiyun 							  sig))
2576*4882a593Smuzhiyun 						rv.w = -1; /* true, all 1s */
2577*4882a593Smuzhiyun 					if (sig &&
2578*4882a593Smuzhiyun 					    ieee754_cxtest(IEEE754_INVALID_OPERATION))
2579*4882a593Smuzhiyun 						rcsr = FPU_CSR_INV_X | FPU_CSR_INV_S;
2580*4882a593Smuzhiyun 					else
2581*4882a593Smuzhiyun 						goto copcsr;
2582*4882a593Smuzhiyun 					break;
2583*4882a593Smuzhiyun 				default:
2584*4882a593Smuzhiyun 					/* Reserved R6 ops */
2585*4882a593Smuzhiyun 					return SIGILL;
2586*4882a593Smuzhiyun 				}
2587*4882a593Smuzhiyun 			}
2588*4882a593Smuzhiyun 			break;
2589*4882a593Smuzhiyun 			}
2590*4882a593Smuzhiyun 		}
2591*4882a593Smuzhiyun 		break;
2592*4882a593Smuzhiyun 	}
2593*4882a593Smuzhiyun 
2594*4882a593Smuzhiyun 	case l_fmt:
2595*4882a593Smuzhiyun 
2596*4882a593Smuzhiyun 		if (!cpu_has_mips_3_4_5_64_r2_r6)
2597*4882a593Smuzhiyun 			return SIGILL;
2598*4882a593Smuzhiyun 
2599*4882a593Smuzhiyun 		DIFROMREG(bits, MIPSInst_FS(ir));
2600*4882a593Smuzhiyun 
2601*4882a593Smuzhiyun 		switch (MIPSInst_FUNC(ir)) {
2602*4882a593Smuzhiyun 		case fcvts_op:
2603*4882a593Smuzhiyun 			/* convert long to single precision real */
2604*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_s_l);
2605*4882a593Smuzhiyun 			rv.s = ieee754sp_flong(bits);
2606*4882a593Smuzhiyun 			rfmt = s_fmt;
2607*4882a593Smuzhiyun 			goto copcsr;
2608*4882a593Smuzhiyun 		case fcvtd_op:
2609*4882a593Smuzhiyun 			/* convert long to double precision real */
2610*4882a593Smuzhiyun 			MIPS_FPU_EMU_INC_STATS(cvt_d_l);
2611*4882a593Smuzhiyun 			rv.d = ieee754dp_flong(bits);
2612*4882a593Smuzhiyun 			rfmt = d_fmt;
2613*4882a593Smuzhiyun 			goto copcsr;
2614*4882a593Smuzhiyun 		default: {
2615*4882a593Smuzhiyun 			/* Emulating the new CMP.condn.fmt R6 instruction */
2616*4882a593Smuzhiyun 			int cmpop = MIPSInst_FUNC(ir) & CMPOP_MASK;
2617*4882a593Smuzhiyun 			int sig = MIPSInst_FUNC(ir) & SIGN_BIT;
2618*4882a593Smuzhiyun 			union ieee754dp fs, ft;
2619*4882a593Smuzhiyun 
2620*4882a593Smuzhiyun 			if (!cpu_has_mips_r6 ||
2621*4882a593Smuzhiyun 			    (MIPSInst_FUNC(ir) & 0x20))
2622*4882a593Smuzhiyun 				return SIGILL;
2623*4882a593Smuzhiyun 
2624*4882a593Smuzhiyun 			if (!sig) {
2625*4882a593Smuzhiyun 				if (!(MIPSInst_FUNC(ir) & PREDICATE_BIT)) {
2626*4882a593Smuzhiyun 					switch (cmpop) {
2627*4882a593Smuzhiyun 					case 0:
2628*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_af_d);
2629*4882a593Smuzhiyun 					break;
2630*4882a593Smuzhiyun 					case 1:
2631*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_un_d);
2632*4882a593Smuzhiyun 					break;
2633*4882a593Smuzhiyun 					case 2:
2634*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_eq_d);
2635*4882a593Smuzhiyun 					break;
2636*4882a593Smuzhiyun 					case 3:
2637*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_ueq_d);
2638*4882a593Smuzhiyun 					break;
2639*4882a593Smuzhiyun 					case 4:
2640*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_lt_d);
2641*4882a593Smuzhiyun 					break;
2642*4882a593Smuzhiyun 					case 5:
2643*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_ult_d);
2644*4882a593Smuzhiyun 					break;
2645*4882a593Smuzhiyun 					case 6:
2646*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_le_d);
2647*4882a593Smuzhiyun 					break;
2648*4882a593Smuzhiyun 					case 7:
2649*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_ule_d);
2650*4882a593Smuzhiyun 					break;
2651*4882a593Smuzhiyun 					}
2652*4882a593Smuzhiyun 				} else {
2653*4882a593Smuzhiyun 					switch (cmpop) {
2654*4882a593Smuzhiyun 					case 1:
2655*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_or_d);
2656*4882a593Smuzhiyun 					break;
2657*4882a593Smuzhiyun 					case 2:
2658*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_une_d);
2659*4882a593Smuzhiyun 					break;
2660*4882a593Smuzhiyun 					case 3:
2661*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_ne_d);
2662*4882a593Smuzhiyun 					break;
2663*4882a593Smuzhiyun 					}
2664*4882a593Smuzhiyun 				}
2665*4882a593Smuzhiyun 			} else {
2666*4882a593Smuzhiyun 				if (!(MIPSInst_FUNC(ir) & PREDICATE_BIT)) {
2667*4882a593Smuzhiyun 					switch (cmpop) {
2668*4882a593Smuzhiyun 					case 0:
2669*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_saf_d);
2670*4882a593Smuzhiyun 					break;
2671*4882a593Smuzhiyun 					case 1:
2672*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sun_d);
2673*4882a593Smuzhiyun 					break;
2674*4882a593Smuzhiyun 					case 2:
2675*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_seq_d);
2676*4882a593Smuzhiyun 					break;
2677*4882a593Smuzhiyun 					case 3:
2678*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sueq_d);
2679*4882a593Smuzhiyun 					break;
2680*4882a593Smuzhiyun 					case 4:
2681*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_slt_d);
2682*4882a593Smuzhiyun 					break;
2683*4882a593Smuzhiyun 					case 5:
2684*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sult_d);
2685*4882a593Smuzhiyun 					break;
2686*4882a593Smuzhiyun 					case 6:
2687*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sle_d);
2688*4882a593Smuzhiyun 					break;
2689*4882a593Smuzhiyun 					case 7:
2690*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sule_d);
2691*4882a593Smuzhiyun 					break;
2692*4882a593Smuzhiyun 					}
2693*4882a593Smuzhiyun 				} else {
2694*4882a593Smuzhiyun 					switch (cmpop) {
2695*4882a593Smuzhiyun 					case 1:
2696*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sor_d);
2697*4882a593Smuzhiyun 					break;
2698*4882a593Smuzhiyun 					case 2:
2699*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sune_d);
2700*4882a593Smuzhiyun 					break;
2701*4882a593Smuzhiyun 					case 3:
2702*4882a593Smuzhiyun 					MIPS_FPU_EMU_INC_STATS(cmp_sne_d);
2703*4882a593Smuzhiyun 					break;
2704*4882a593Smuzhiyun 					}
2705*4882a593Smuzhiyun 				}
2706*4882a593Smuzhiyun 			}
2707*4882a593Smuzhiyun 
2708*4882a593Smuzhiyun 			/* fmt is l_fmt for double precision so fix it */
2709*4882a593Smuzhiyun 			rfmt = d_fmt;
2710*4882a593Smuzhiyun 			/* default to false */
2711*4882a593Smuzhiyun 			rv.l = 0;
2712*4882a593Smuzhiyun 
2713*4882a593Smuzhiyun 			/* CMP.condn.D */
2714*4882a593Smuzhiyun 			DPFROMREG(fs, MIPSInst_FS(ir));
2715*4882a593Smuzhiyun 			DPFROMREG(ft, MIPSInst_FT(ir));
2716*4882a593Smuzhiyun 
2717*4882a593Smuzhiyun 			/* positive predicates */
2718*4882a593Smuzhiyun 			if (!(MIPSInst_FUNC(ir) & PREDICATE_BIT)) {
2719*4882a593Smuzhiyun 				if (ieee754dp_cmp(fs, ft,
2720*4882a593Smuzhiyun 						  cmptab[cmpop], sig))
2721*4882a593Smuzhiyun 				    rv.l = -1LL; /* true, all 1s */
2722*4882a593Smuzhiyun 				if (sig &&
2723*4882a593Smuzhiyun 				    ieee754_cxtest(IEEE754_INVALID_OPERATION))
2724*4882a593Smuzhiyun 					rcsr = FPU_CSR_INV_X | FPU_CSR_INV_S;
2725*4882a593Smuzhiyun 				else
2726*4882a593Smuzhiyun 					goto copcsr;
2727*4882a593Smuzhiyun 			} else {
2728*4882a593Smuzhiyun 				/* negative predicates */
2729*4882a593Smuzhiyun 				switch (cmpop) {
2730*4882a593Smuzhiyun 				case 1:
2731*4882a593Smuzhiyun 				case 2:
2732*4882a593Smuzhiyun 				case 3:
2733*4882a593Smuzhiyun 					if (ieee754dp_cmp(fs, ft,
2734*4882a593Smuzhiyun 							  negative_cmptab[cmpop],
2735*4882a593Smuzhiyun 							  sig))
2736*4882a593Smuzhiyun 						rv.l = -1LL; /* true, all 1s */
2737*4882a593Smuzhiyun 					if (sig &&
2738*4882a593Smuzhiyun 					    ieee754_cxtest(IEEE754_INVALID_OPERATION))
2739*4882a593Smuzhiyun 						rcsr = FPU_CSR_INV_X | FPU_CSR_INV_S;
2740*4882a593Smuzhiyun 					else
2741*4882a593Smuzhiyun 						goto copcsr;
2742*4882a593Smuzhiyun 					break;
2743*4882a593Smuzhiyun 				default:
2744*4882a593Smuzhiyun 					/* Reserved R6 ops */
2745*4882a593Smuzhiyun 					return SIGILL;
2746*4882a593Smuzhiyun 				}
2747*4882a593Smuzhiyun 			}
2748*4882a593Smuzhiyun 			break;
2749*4882a593Smuzhiyun 			}
2750*4882a593Smuzhiyun 		}
2751*4882a593Smuzhiyun 		break;
2752*4882a593Smuzhiyun 
2753*4882a593Smuzhiyun 	default:
2754*4882a593Smuzhiyun 		return SIGILL;
2755*4882a593Smuzhiyun 	}
2756*4882a593Smuzhiyun 
2757*4882a593Smuzhiyun 	/*
2758*4882a593Smuzhiyun 	 * Update the fpu CSR register for this operation.
2759*4882a593Smuzhiyun 	 * If an exception is required, generate a tidy SIGFPE exception,
2760*4882a593Smuzhiyun 	 * without updating the result register.
2761*4882a593Smuzhiyun 	 * Note: cause exception bits do not accumulate, they are rewritten
2762*4882a593Smuzhiyun 	 * for each op; only the flag/sticky bits accumulate.
2763*4882a593Smuzhiyun 	 */
2764*4882a593Smuzhiyun 	ctx->fcr31 = (ctx->fcr31 & ~FPU_CSR_ALL_X) | rcsr;
2765*4882a593Smuzhiyun 	if ((ctx->fcr31 >> 5) & ctx->fcr31 & FPU_CSR_ALL_E) {
2766*4882a593Smuzhiyun 		/*printk ("SIGFPE: FPU csr = %08x\n",ctx->fcr31); */
2767*4882a593Smuzhiyun 		return SIGFPE;
2768*4882a593Smuzhiyun 	}
2769*4882a593Smuzhiyun 
2770*4882a593Smuzhiyun 	/*
2771*4882a593Smuzhiyun 	 * Now we can safely write the result back to the register file.
2772*4882a593Smuzhiyun 	 */
2773*4882a593Smuzhiyun 	switch (rfmt) {
2774*4882a593Smuzhiyun 	case -1:
2775*4882a593Smuzhiyun 
2776*4882a593Smuzhiyun 		if (cpu_has_mips_4_5_r)
2777*4882a593Smuzhiyun 			cbit = fpucondbit[MIPSInst_FD(ir) >> 2];
2778*4882a593Smuzhiyun 		else
2779*4882a593Smuzhiyun 			cbit = FPU_CSR_COND;
2780*4882a593Smuzhiyun 		if (rv.w)
2781*4882a593Smuzhiyun 			ctx->fcr31 |= cbit;
2782*4882a593Smuzhiyun 		else
2783*4882a593Smuzhiyun 			ctx->fcr31 &= ~cbit;
2784*4882a593Smuzhiyun 		break;
2785*4882a593Smuzhiyun 
2786*4882a593Smuzhiyun 	case d_fmt:
2787*4882a593Smuzhiyun 		DPTOREG(rv.d, MIPSInst_FD(ir));
2788*4882a593Smuzhiyun 		break;
2789*4882a593Smuzhiyun 	case s_fmt:
2790*4882a593Smuzhiyun 		SPTOREG(rv.s, MIPSInst_FD(ir));
2791*4882a593Smuzhiyun 		break;
2792*4882a593Smuzhiyun 	case w_fmt:
2793*4882a593Smuzhiyun 		SITOREG(rv.w, MIPSInst_FD(ir));
2794*4882a593Smuzhiyun 		break;
2795*4882a593Smuzhiyun 	case l_fmt:
2796*4882a593Smuzhiyun 		if (!cpu_has_mips_3_4_5_64_r2_r6)
2797*4882a593Smuzhiyun 			return SIGILL;
2798*4882a593Smuzhiyun 
2799*4882a593Smuzhiyun 		DITOREG(rv.l, MIPSInst_FD(ir));
2800*4882a593Smuzhiyun 		break;
2801*4882a593Smuzhiyun 	default:
2802*4882a593Smuzhiyun 		return SIGILL;
2803*4882a593Smuzhiyun 	}
2804*4882a593Smuzhiyun 
2805*4882a593Smuzhiyun 	return 0;
2806*4882a593Smuzhiyun }
2807*4882a593Smuzhiyun 
2808*4882a593Smuzhiyun /*
2809*4882a593Smuzhiyun  * Emulate FPU instructions.
2810*4882a593Smuzhiyun  *
2811*4882a593Smuzhiyun  * If we use FPU hardware, then we have been typically called to handle
2812*4882a593Smuzhiyun  * an unimplemented operation, such as where an operand is a NaN or
2813*4882a593Smuzhiyun  * denormalized.  In that case exit the emulation loop after a single
2814*4882a593Smuzhiyun  * iteration so as to let hardware execute any subsequent instructions.
2815*4882a593Smuzhiyun  *
2816*4882a593Smuzhiyun  * If we have no FPU hardware or it has been disabled, then continue
2817*4882a593Smuzhiyun  * emulating floating-point instructions until one of these conditions
2818*4882a593Smuzhiyun  * has occurred:
2819*4882a593Smuzhiyun  *
2820*4882a593Smuzhiyun  * - a non-FPU instruction has been encountered,
2821*4882a593Smuzhiyun  *
2822*4882a593Smuzhiyun  * - an attempt to emulate has ended with a signal,
2823*4882a593Smuzhiyun  *
2824*4882a593Smuzhiyun  * - the ISA mode has been switched.
2825*4882a593Smuzhiyun  *
2826*4882a593Smuzhiyun  * We need to terminate the emulation loop if we got switched to the
2827*4882a593Smuzhiyun  * MIPS16 mode, whether supported or not, so that we do not attempt
2828*4882a593Smuzhiyun  * to emulate a MIPS16 instruction as a regular MIPS FPU instruction.
2829*4882a593Smuzhiyun  * Similarly if we got switched to the microMIPS mode and only the
2830*4882a593Smuzhiyun  * regular MIPS mode is supported, so that we do not attempt to emulate
2831*4882a593Smuzhiyun  * a microMIPS instruction as a regular MIPS FPU instruction.  Or if
2832*4882a593Smuzhiyun  * we got switched to the regular MIPS mode and only the microMIPS mode
2833*4882a593Smuzhiyun  * is supported, so that we do not attempt to emulate a regular MIPS
2834*4882a593Smuzhiyun  * instruction that should cause an Address Error exception instead.
2835*4882a593Smuzhiyun  * For simplicity we always terminate upon an ISA mode switch.
2836*4882a593Smuzhiyun  */
fpu_emulator_cop1Handler(struct pt_regs * xcp,struct mips_fpu_struct * ctx,int has_fpu,void __user ** fault_addr)2837*4882a593Smuzhiyun int fpu_emulator_cop1Handler(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
2838*4882a593Smuzhiyun 	int has_fpu, void __user **fault_addr)
2839*4882a593Smuzhiyun {
2840*4882a593Smuzhiyun 	unsigned long oldepc, prevepc;
2841*4882a593Smuzhiyun 	struct mm_decoded_insn dec_insn;
2842*4882a593Smuzhiyun 	u16 instr[4];
2843*4882a593Smuzhiyun 	u16 *instr_ptr;
2844*4882a593Smuzhiyun 	int sig = 0;
2845*4882a593Smuzhiyun 
2846*4882a593Smuzhiyun 	/*
2847*4882a593Smuzhiyun 	 * Initialize context if it hasn't been used already, otherwise ensure
2848*4882a593Smuzhiyun 	 * it has been saved to struct thread_struct.
2849*4882a593Smuzhiyun 	 */
2850*4882a593Smuzhiyun 	if (!init_fp_ctx(current))
2851*4882a593Smuzhiyun 		lose_fpu(1);
2852*4882a593Smuzhiyun 
2853*4882a593Smuzhiyun 	oldepc = xcp->cp0_epc;
2854*4882a593Smuzhiyun 	do {
2855*4882a593Smuzhiyun 		prevepc = xcp->cp0_epc;
2856*4882a593Smuzhiyun 
2857*4882a593Smuzhiyun 		if (get_isa16_mode(prevepc) && cpu_has_mmips) {
2858*4882a593Smuzhiyun 			/*
2859*4882a593Smuzhiyun 			 * Get next 2 microMIPS instructions and convert them
2860*4882a593Smuzhiyun 			 * into 32-bit instructions.
2861*4882a593Smuzhiyun 			 */
2862*4882a593Smuzhiyun 			if ((get_user(instr[0], (u16 __user *)msk_isa16_mode(xcp->cp0_epc))) ||
2863*4882a593Smuzhiyun 			    (get_user(instr[1], (u16 __user *)msk_isa16_mode(xcp->cp0_epc + 2))) ||
2864*4882a593Smuzhiyun 			    (get_user(instr[2], (u16 __user *)msk_isa16_mode(xcp->cp0_epc + 4))) ||
2865*4882a593Smuzhiyun 			    (get_user(instr[3], (u16 __user *)msk_isa16_mode(xcp->cp0_epc + 6)))) {
2866*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
2867*4882a593Smuzhiyun 				return SIGBUS;
2868*4882a593Smuzhiyun 			}
2869*4882a593Smuzhiyun 			instr_ptr = instr;
2870*4882a593Smuzhiyun 
2871*4882a593Smuzhiyun 			/* Get first instruction. */
2872*4882a593Smuzhiyun 			if (mm_insn_16bit(*instr_ptr)) {
2873*4882a593Smuzhiyun 				/* Duplicate the half-word. */
2874*4882a593Smuzhiyun 				dec_insn.insn = (*instr_ptr << 16) |
2875*4882a593Smuzhiyun 					(*instr_ptr);
2876*4882a593Smuzhiyun 				/* 16-bit instruction. */
2877*4882a593Smuzhiyun 				dec_insn.pc_inc = 2;
2878*4882a593Smuzhiyun 				instr_ptr += 1;
2879*4882a593Smuzhiyun 			} else {
2880*4882a593Smuzhiyun 				dec_insn.insn = (*instr_ptr << 16) |
2881*4882a593Smuzhiyun 					*(instr_ptr+1);
2882*4882a593Smuzhiyun 				/* 32-bit instruction. */
2883*4882a593Smuzhiyun 				dec_insn.pc_inc = 4;
2884*4882a593Smuzhiyun 				instr_ptr += 2;
2885*4882a593Smuzhiyun 			}
2886*4882a593Smuzhiyun 			/* Get second instruction. */
2887*4882a593Smuzhiyun 			if (mm_insn_16bit(*instr_ptr)) {
2888*4882a593Smuzhiyun 				/* Duplicate the half-word. */
2889*4882a593Smuzhiyun 				dec_insn.next_insn = (*instr_ptr << 16) |
2890*4882a593Smuzhiyun 					(*instr_ptr);
2891*4882a593Smuzhiyun 				/* 16-bit instruction. */
2892*4882a593Smuzhiyun 				dec_insn.next_pc_inc = 2;
2893*4882a593Smuzhiyun 			} else {
2894*4882a593Smuzhiyun 				dec_insn.next_insn = (*instr_ptr << 16) |
2895*4882a593Smuzhiyun 					*(instr_ptr+1);
2896*4882a593Smuzhiyun 				/* 32-bit instruction. */
2897*4882a593Smuzhiyun 				dec_insn.next_pc_inc = 4;
2898*4882a593Smuzhiyun 			}
2899*4882a593Smuzhiyun 			dec_insn.micro_mips_mode = 1;
2900*4882a593Smuzhiyun 		} else {
2901*4882a593Smuzhiyun 			if ((get_user(dec_insn.insn,
2902*4882a593Smuzhiyun 			    (mips_instruction __user *) xcp->cp0_epc)) ||
2903*4882a593Smuzhiyun 			    (get_user(dec_insn.next_insn,
2904*4882a593Smuzhiyun 			    (mips_instruction __user *)(xcp->cp0_epc+4)))) {
2905*4882a593Smuzhiyun 				MIPS_FPU_EMU_INC_STATS(errors);
2906*4882a593Smuzhiyun 				return SIGBUS;
2907*4882a593Smuzhiyun 			}
2908*4882a593Smuzhiyun 			dec_insn.pc_inc = 4;
2909*4882a593Smuzhiyun 			dec_insn.next_pc_inc = 4;
2910*4882a593Smuzhiyun 			dec_insn.micro_mips_mode = 0;
2911*4882a593Smuzhiyun 		}
2912*4882a593Smuzhiyun 
2913*4882a593Smuzhiyun 		if ((dec_insn.insn == 0) ||
2914*4882a593Smuzhiyun 		   ((dec_insn.pc_inc == 2) &&
2915*4882a593Smuzhiyun 		   ((dec_insn.insn & 0xffff) == MM_NOP16)))
2916*4882a593Smuzhiyun 			xcp->cp0_epc += dec_insn.pc_inc;	/* Skip NOPs */
2917*4882a593Smuzhiyun 		else {
2918*4882a593Smuzhiyun 			/*
2919*4882a593Smuzhiyun 			 * The 'ieee754_csr' is an alias of ctx->fcr31.
2920*4882a593Smuzhiyun 			 * No need to copy ctx->fcr31 to ieee754_csr.
2921*4882a593Smuzhiyun 			 */
2922*4882a593Smuzhiyun 			sig = cop1Emulate(xcp, ctx, dec_insn, fault_addr);
2923*4882a593Smuzhiyun 		}
2924*4882a593Smuzhiyun 
2925*4882a593Smuzhiyun 		if (has_fpu)
2926*4882a593Smuzhiyun 			break;
2927*4882a593Smuzhiyun 		if (sig)
2928*4882a593Smuzhiyun 			break;
2929*4882a593Smuzhiyun 		/*
2930*4882a593Smuzhiyun 		 * We have to check for the ISA bit explicitly here,
2931*4882a593Smuzhiyun 		 * because `get_isa16_mode' may return 0 if support
2932*4882a593Smuzhiyun 		 * for code compression has been globally disabled,
2933*4882a593Smuzhiyun 		 * or otherwise we may produce the wrong signal or
2934*4882a593Smuzhiyun 		 * even proceed successfully where we must not.
2935*4882a593Smuzhiyun 		 */
2936*4882a593Smuzhiyun 		if ((xcp->cp0_epc ^ prevepc) & 0x1)
2937*4882a593Smuzhiyun 			break;
2938*4882a593Smuzhiyun 
2939*4882a593Smuzhiyun 		cond_resched();
2940*4882a593Smuzhiyun 	} while (xcp->cp0_epc > prevepc);
2941*4882a593Smuzhiyun 
2942*4882a593Smuzhiyun 	/* SIGILL indicates a non-fpu instruction */
2943*4882a593Smuzhiyun 	if (sig == SIGILL && xcp->cp0_epc != oldepc)
2944*4882a593Smuzhiyun 		/* but if EPC has advanced, then ignore it */
2945*4882a593Smuzhiyun 		sig = 0;
2946*4882a593Smuzhiyun 
2947*4882a593Smuzhiyun 	return sig;
2948*4882a593Smuzhiyun }
2949