xref: /OK3568_Linux_fs/kernel/arch/powerpc/kvm/book3s_paired_singles.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  *
4*4882a593Smuzhiyun  * Copyright Novell Inc 2010
5*4882a593Smuzhiyun  *
6*4882a593Smuzhiyun  * Authors: Alexander Graf <agraf@suse.de>
7*4882a593Smuzhiyun  */
8*4882a593Smuzhiyun 
9*4882a593Smuzhiyun #include <asm/kvm.h>
10*4882a593Smuzhiyun #include <asm/kvm_ppc.h>
11*4882a593Smuzhiyun #include <asm/disassemble.h>
12*4882a593Smuzhiyun #include <asm/kvm_book3s.h>
13*4882a593Smuzhiyun #include <asm/kvm_fpu.h>
14*4882a593Smuzhiyun #include <asm/reg.h>
15*4882a593Smuzhiyun #include <asm/cacheflush.h>
16*4882a593Smuzhiyun #include <asm/switch_to.h>
17*4882a593Smuzhiyun #include <linux/vmalloc.h>
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun /* #define DEBUG */
20*4882a593Smuzhiyun 
21*4882a593Smuzhiyun #ifdef DEBUG
22*4882a593Smuzhiyun #define dprintk printk
23*4882a593Smuzhiyun #else
24*4882a593Smuzhiyun #define dprintk(...) do { } while(0);
25*4882a593Smuzhiyun #endif
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun #define OP_LFS			48
28*4882a593Smuzhiyun #define OP_LFSU			49
29*4882a593Smuzhiyun #define OP_LFD			50
30*4882a593Smuzhiyun #define OP_LFDU			51
31*4882a593Smuzhiyun #define OP_STFS			52
32*4882a593Smuzhiyun #define OP_STFSU		53
33*4882a593Smuzhiyun #define OP_STFD			54
34*4882a593Smuzhiyun #define OP_STFDU		55
35*4882a593Smuzhiyun #define OP_PSQ_L		56
36*4882a593Smuzhiyun #define OP_PSQ_LU		57
37*4882a593Smuzhiyun #define OP_PSQ_ST		60
38*4882a593Smuzhiyun #define OP_PSQ_STU		61
39*4882a593Smuzhiyun 
40*4882a593Smuzhiyun #define OP_31_LFSX		535
41*4882a593Smuzhiyun #define OP_31_LFSUX		567
42*4882a593Smuzhiyun #define OP_31_LFDX		599
43*4882a593Smuzhiyun #define OP_31_LFDUX		631
44*4882a593Smuzhiyun #define OP_31_STFSX		663
45*4882a593Smuzhiyun #define OP_31_STFSUX		695
46*4882a593Smuzhiyun #define OP_31_STFX		727
47*4882a593Smuzhiyun #define OP_31_STFUX		759
48*4882a593Smuzhiyun #define OP_31_LWIZX		887
49*4882a593Smuzhiyun #define OP_31_STFIWX		983
50*4882a593Smuzhiyun 
51*4882a593Smuzhiyun #define OP_59_FADDS		21
52*4882a593Smuzhiyun #define OP_59_FSUBS		20
53*4882a593Smuzhiyun #define OP_59_FSQRTS		22
54*4882a593Smuzhiyun #define OP_59_FDIVS		18
55*4882a593Smuzhiyun #define OP_59_FRES		24
56*4882a593Smuzhiyun #define OP_59_FMULS		25
57*4882a593Smuzhiyun #define OP_59_FRSQRTES		26
58*4882a593Smuzhiyun #define OP_59_FMSUBS		28
59*4882a593Smuzhiyun #define OP_59_FMADDS		29
60*4882a593Smuzhiyun #define OP_59_FNMSUBS		30
61*4882a593Smuzhiyun #define OP_59_FNMADDS		31
62*4882a593Smuzhiyun 
63*4882a593Smuzhiyun #define OP_63_FCMPU		0
64*4882a593Smuzhiyun #define OP_63_FCPSGN		8
65*4882a593Smuzhiyun #define OP_63_FRSP		12
66*4882a593Smuzhiyun #define OP_63_FCTIW		14
67*4882a593Smuzhiyun #define OP_63_FCTIWZ		15
68*4882a593Smuzhiyun #define OP_63_FDIV		18
69*4882a593Smuzhiyun #define OP_63_FADD		21
70*4882a593Smuzhiyun #define OP_63_FSQRT		22
71*4882a593Smuzhiyun #define OP_63_FSEL		23
72*4882a593Smuzhiyun #define OP_63_FRE		24
73*4882a593Smuzhiyun #define OP_63_FMUL		25
74*4882a593Smuzhiyun #define OP_63_FRSQRTE		26
75*4882a593Smuzhiyun #define OP_63_FMSUB		28
76*4882a593Smuzhiyun #define OP_63_FMADD		29
77*4882a593Smuzhiyun #define OP_63_FNMSUB		30
78*4882a593Smuzhiyun #define OP_63_FNMADD		31
79*4882a593Smuzhiyun #define OP_63_FCMPO		32
80*4882a593Smuzhiyun #define OP_63_MTFSB1		38 // XXX
81*4882a593Smuzhiyun #define OP_63_FSUB		20
82*4882a593Smuzhiyun #define OP_63_FNEG		40
83*4882a593Smuzhiyun #define OP_63_MCRFS		64
84*4882a593Smuzhiyun #define OP_63_MTFSB0		70
85*4882a593Smuzhiyun #define OP_63_FMR		72
86*4882a593Smuzhiyun #define OP_63_MTFSFI		134
87*4882a593Smuzhiyun #define OP_63_FABS		264
88*4882a593Smuzhiyun #define OP_63_MFFS		583
89*4882a593Smuzhiyun #define OP_63_MTFSF		711
90*4882a593Smuzhiyun 
91*4882a593Smuzhiyun #define OP_4X_PS_CMPU0		0
92*4882a593Smuzhiyun #define OP_4X_PSQ_LX		6
93*4882a593Smuzhiyun #define OP_4XW_PSQ_STX		7
94*4882a593Smuzhiyun #define OP_4A_PS_SUM0		10
95*4882a593Smuzhiyun #define OP_4A_PS_SUM1		11
96*4882a593Smuzhiyun #define OP_4A_PS_MULS0		12
97*4882a593Smuzhiyun #define OP_4A_PS_MULS1		13
98*4882a593Smuzhiyun #define OP_4A_PS_MADDS0		14
99*4882a593Smuzhiyun #define OP_4A_PS_MADDS1		15
100*4882a593Smuzhiyun #define OP_4A_PS_DIV		18
101*4882a593Smuzhiyun #define OP_4A_PS_SUB		20
102*4882a593Smuzhiyun #define OP_4A_PS_ADD		21
103*4882a593Smuzhiyun #define OP_4A_PS_SEL		23
104*4882a593Smuzhiyun #define OP_4A_PS_RES		24
105*4882a593Smuzhiyun #define OP_4A_PS_MUL		25
106*4882a593Smuzhiyun #define OP_4A_PS_RSQRTE		26
107*4882a593Smuzhiyun #define OP_4A_PS_MSUB		28
108*4882a593Smuzhiyun #define OP_4A_PS_MADD		29
109*4882a593Smuzhiyun #define OP_4A_PS_NMSUB		30
110*4882a593Smuzhiyun #define OP_4A_PS_NMADD		31
111*4882a593Smuzhiyun #define OP_4X_PS_CMPO0		32
112*4882a593Smuzhiyun #define OP_4X_PSQ_LUX		38
113*4882a593Smuzhiyun #define OP_4XW_PSQ_STUX		39
114*4882a593Smuzhiyun #define OP_4X_PS_NEG		40
115*4882a593Smuzhiyun #define OP_4X_PS_CMPU1		64
116*4882a593Smuzhiyun #define OP_4X_PS_MR		72
117*4882a593Smuzhiyun #define OP_4X_PS_CMPO1		96
118*4882a593Smuzhiyun #define OP_4X_PS_NABS		136
119*4882a593Smuzhiyun #define OP_4X_PS_ABS		264
120*4882a593Smuzhiyun #define OP_4X_PS_MERGE00	528
121*4882a593Smuzhiyun #define OP_4X_PS_MERGE01	560
122*4882a593Smuzhiyun #define OP_4X_PS_MERGE10	592
123*4882a593Smuzhiyun #define OP_4X_PS_MERGE11	624
124*4882a593Smuzhiyun 
125*4882a593Smuzhiyun #define SCALAR_NONE		0
126*4882a593Smuzhiyun #define SCALAR_HIGH		(1 << 0)
127*4882a593Smuzhiyun #define SCALAR_LOW		(1 << 1)
128*4882a593Smuzhiyun #define SCALAR_NO_PS0		(1 << 2)
129*4882a593Smuzhiyun #define SCALAR_NO_PS1		(1 << 3)
130*4882a593Smuzhiyun 
131*4882a593Smuzhiyun #define GQR_ST_TYPE_MASK	0x00000007
132*4882a593Smuzhiyun #define GQR_ST_TYPE_SHIFT	0
133*4882a593Smuzhiyun #define GQR_ST_SCALE_MASK	0x00003f00
134*4882a593Smuzhiyun #define GQR_ST_SCALE_SHIFT	8
135*4882a593Smuzhiyun #define GQR_LD_TYPE_MASK	0x00070000
136*4882a593Smuzhiyun #define GQR_LD_TYPE_SHIFT	16
137*4882a593Smuzhiyun #define GQR_LD_SCALE_MASK	0x3f000000
138*4882a593Smuzhiyun #define GQR_LD_SCALE_SHIFT	24
139*4882a593Smuzhiyun 
140*4882a593Smuzhiyun #define GQR_QUANTIZE_FLOAT	0
141*4882a593Smuzhiyun #define GQR_QUANTIZE_U8		4
142*4882a593Smuzhiyun #define GQR_QUANTIZE_U16	5
143*4882a593Smuzhiyun #define GQR_QUANTIZE_S8		6
144*4882a593Smuzhiyun #define GQR_QUANTIZE_S16	7
145*4882a593Smuzhiyun 
146*4882a593Smuzhiyun #define FPU_LS_SINGLE		0
147*4882a593Smuzhiyun #define FPU_LS_DOUBLE		1
148*4882a593Smuzhiyun #define FPU_LS_SINGLE_LOW	2
149*4882a593Smuzhiyun 
kvmppc_sync_qpr(struct kvm_vcpu * vcpu,int rt)150*4882a593Smuzhiyun static inline void kvmppc_sync_qpr(struct kvm_vcpu *vcpu, int rt)
151*4882a593Smuzhiyun {
152*4882a593Smuzhiyun 	kvm_cvt_df(&VCPU_FPR(vcpu, rt), &vcpu->arch.qpr[rt]);
153*4882a593Smuzhiyun }
154*4882a593Smuzhiyun 
kvmppc_inject_pf(struct kvm_vcpu * vcpu,ulong eaddr,bool is_store)155*4882a593Smuzhiyun static void kvmppc_inject_pf(struct kvm_vcpu *vcpu, ulong eaddr, bool is_store)
156*4882a593Smuzhiyun {
157*4882a593Smuzhiyun 	u32 dsisr;
158*4882a593Smuzhiyun 	u64 msr = kvmppc_get_msr(vcpu);
159*4882a593Smuzhiyun 
160*4882a593Smuzhiyun 	msr = kvmppc_set_field(msr, 33, 36, 0);
161*4882a593Smuzhiyun 	msr = kvmppc_set_field(msr, 42, 47, 0);
162*4882a593Smuzhiyun 	kvmppc_set_msr(vcpu, msr);
163*4882a593Smuzhiyun 	kvmppc_set_dar(vcpu, eaddr);
164*4882a593Smuzhiyun 	/* Page Fault */
165*4882a593Smuzhiyun 	dsisr = kvmppc_set_field(0, 33, 33, 1);
166*4882a593Smuzhiyun 	if (is_store)
167*4882a593Smuzhiyun 		dsisr = kvmppc_set_field(dsisr, 38, 38, 1);
168*4882a593Smuzhiyun 	kvmppc_set_dsisr(vcpu, dsisr);
169*4882a593Smuzhiyun 	kvmppc_book3s_queue_irqprio(vcpu, BOOK3S_INTERRUPT_DATA_STORAGE);
170*4882a593Smuzhiyun }
171*4882a593Smuzhiyun 
kvmppc_emulate_fpr_load(struct kvm_vcpu * vcpu,int rs,ulong addr,int ls_type)172*4882a593Smuzhiyun static int kvmppc_emulate_fpr_load(struct kvm_vcpu *vcpu,
173*4882a593Smuzhiyun 				   int rs, ulong addr, int ls_type)
174*4882a593Smuzhiyun {
175*4882a593Smuzhiyun 	int emulated = EMULATE_FAIL;
176*4882a593Smuzhiyun 	int r;
177*4882a593Smuzhiyun 	char tmp[8];
178*4882a593Smuzhiyun 	int len = sizeof(u32);
179*4882a593Smuzhiyun 
180*4882a593Smuzhiyun 	if (ls_type == FPU_LS_DOUBLE)
181*4882a593Smuzhiyun 		len = sizeof(u64);
182*4882a593Smuzhiyun 
183*4882a593Smuzhiyun 	/* read from memory */
184*4882a593Smuzhiyun 	r = kvmppc_ld(vcpu, &addr, len, tmp, true);
185*4882a593Smuzhiyun 	vcpu->arch.paddr_accessed = addr;
186*4882a593Smuzhiyun 
187*4882a593Smuzhiyun 	if (r < 0) {
188*4882a593Smuzhiyun 		kvmppc_inject_pf(vcpu, addr, false);
189*4882a593Smuzhiyun 		goto done_load;
190*4882a593Smuzhiyun 	} else if (r == EMULATE_DO_MMIO) {
191*4882a593Smuzhiyun 		emulated = kvmppc_handle_load(vcpu, KVM_MMIO_REG_FPR | rs,
192*4882a593Smuzhiyun 					      len, 1);
193*4882a593Smuzhiyun 		goto done_load;
194*4882a593Smuzhiyun 	}
195*4882a593Smuzhiyun 
196*4882a593Smuzhiyun 	emulated = EMULATE_DONE;
197*4882a593Smuzhiyun 
198*4882a593Smuzhiyun 	/* put in registers */
199*4882a593Smuzhiyun 	switch (ls_type) {
200*4882a593Smuzhiyun 	case FPU_LS_SINGLE:
201*4882a593Smuzhiyun 		kvm_cvt_fd((u32*)tmp, &VCPU_FPR(vcpu, rs));
202*4882a593Smuzhiyun 		vcpu->arch.qpr[rs] = *((u32*)tmp);
203*4882a593Smuzhiyun 		break;
204*4882a593Smuzhiyun 	case FPU_LS_DOUBLE:
205*4882a593Smuzhiyun 		VCPU_FPR(vcpu, rs) = *((u64*)tmp);
206*4882a593Smuzhiyun 		break;
207*4882a593Smuzhiyun 	}
208*4882a593Smuzhiyun 
209*4882a593Smuzhiyun 	dprintk(KERN_INFO "KVM: FPR_LD [0x%llx] at 0x%lx (%d)\n", *(u64*)tmp,
210*4882a593Smuzhiyun 			  addr, len);
211*4882a593Smuzhiyun 
212*4882a593Smuzhiyun done_load:
213*4882a593Smuzhiyun 	return emulated;
214*4882a593Smuzhiyun }
215*4882a593Smuzhiyun 
kvmppc_emulate_fpr_store(struct kvm_vcpu * vcpu,int rs,ulong addr,int ls_type)216*4882a593Smuzhiyun static int kvmppc_emulate_fpr_store(struct kvm_vcpu *vcpu,
217*4882a593Smuzhiyun 				    int rs, ulong addr, int ls_type)
218*4882a593Smuzhiyun {
219*4882a593Smuzhiyun 	int emulated = EMULATE_FAIL;
220*4882a593Smuzhiyun 	int r;
221*4882a593Smuzhiyun 	char tmp[8];
222*4882a593Smuzhiyun 	u64 val;
223*4882a593Smuzhiyun 	int len;
224*4882a593Smuzhiyun 
225*4882a593Smuzhiyun 	switch (ls_type) {
226*4882a593Smuzhiyun 	case FPU_LS_SINGLE:
227*4882a593Smuzhiyun 		kvm_cvt_df(&VCPU_FPR(vcpu, rs), (u32*)tmp);
228*4882a593Smuzhiyun 		val = *((u32*)tmp);
229*4882a593Smuzhiyun 		len = sizeof(u32);
230*4882a593Smuzhiyun 		break;
231*4882a593Smuzhiyun 	case FPU_LS_SINGLE_LOW:
232*4882a593Smuzhiyun 		*((u32*)tmp) = VCPU_FPR(vcpu, rs);
233*4882a593Smuzhiyun 		val = VCPU_FPR(vcpu, rs) & 0xffffffff;
234*4882a593Smuzhiyun 		len = sizeof(u32);
235*4882a593Smuzhiyun 		break;
236*4882a593Smuzhiyun 	case FPU_LS_DOUBLE:
237*4882a593Smuzhiyun 		*((u64*)tmp) = VCPU_FPR(vcpu, rs);
238*4882a593Smuzhiyun 		val = VCPU_FPR(vcpu, rs);
239*4882a593Smuzhiyun 		len = sizeof(u64);
240*4882a593Smuzhiyun 		break;
241*4882a593Smuzhiyun 	default:
242*4882a593Smuzhiyun 		val = 0;
243*4882a593Smuzhiyun 		len = 0;
244*4882a593Smuzhiyun 	}
245*4882a593Smuzhiyun 
246*4882a593Smuzhiyun 	r = kvmppc_st(vcpu, &addr, len, tmp, true);
247*4882a593Smuzhiyun 	vcpu->arch.paddr_accessed = addr;
248*4882a593Smuzhiyun 	if (r < 0) {
249*4882a593Smuzhiyun 		kvmppc_inject_pf(vcpu, addr, true);
250*4882a593Smuzhiyun 	} else if (r == EMULATE_DO_MMIO) {
251*4882a593Smuzhiyun 		emulated = kvmppc_handle_store(vcpu, val, len, 1);
252*4882a593Smuzhiyun 	} else {
253*4882a593Smuzhiyun 		emulated = EMULATE_DONE;
254*4882a593Smuzhiyun 	}
255*4882a593Smuzhiyun 
256*4882a593Smuzhiyun 	dprintk(KERN_INFO "KVM: FPR_ST [0x%llx] at 0x%lx (%d)\n",
257*4882a593Smuzhiyun 			  val, addr, len);
258*4882a593Smuzhiyun 
259*4882a593Smuzhiyun 	return emulated;
260*4882a593Smuzhiyun }
261*4882a593Smuzhiyun 
kvmppc_emulate_psq_load(struct kvm_vcpu * vcpu,int rs,ulong addr,bool w,int i)262*4882a593Smuzhiyun static int kvmppc_emulate_psq_load(struct kvm_vcpu *vcpu,
263*4882a593Smuzhiyun 				   int rs, ulong addr, bool w, int i)
264*4882a593Smuzhiyun {
265*4882a593Smuzhiyun 	int emulated = EMULATE_FAIL;
266*4882a593Smuzhiyun 	int r;
267*4882a593Smuzhiyun 	float one = 1.0;
268*4882a593Smuzhiyun 	u32 tmp[2];
269*4882a593Smuzhiyun 
270*4882a593Smuzhiyun 	/* read from memory */
271*4882a593Smuzhiyun 	if (w) {
272*4882a593Smuzhiyun 		r = kvmppc_ld(vcpu, &addr, sizeof(u32), tmp, true);
273*4882a593Smuzhiyun 		memcpy(&tmp[1], &one, sizeof(u32));
274*4882a593Smuzhiyun 	} else {
275*4882a593Smuzhiyun 		r = kvmppc_ld(vcpu, &addr, sizeof(u32) * 2, tmp, true);
276*4882a593Smuzhiyun 	}
277*4882a593Smuzhiyun 	vcpu->arch.paddr_accessed = addr;
278*4882a593Smuzhiyun 	if (r < 0) {
279*4882a593Smuzhiyun 		kvmppc_inject_pf(vcpu, addr, false);
280*4882a593Smuzhiyun 		goto done_load;
281*4882a593Smuzhiyun 	} else if ((r == EMULATE_DO_MMIO) && w) {
282*4882a593Smuzhiyun 		emulated = kvmppc_handle_load(vcpu, KVM_MMIO_REG_FPR | rs,
283*4882a593Smuzhiyun 					      4, 1);
284*4882a593Smuzhiyun 		vcpu->arch.qpr[rs] = tmp[1];
285*4882a593Smuzhiyun 		goto done_load;
286*4882a593Smuzhiyun 	} else if (r == EMULATE_DO_MMIO) {
287*4882a593Smuzhiyun 		emulated = kvmppc_handle_load(vcpu, KVM_MMIO_REG_FQPR | rs,
288*4882a593Smuzhiyun 					      8, 1);
289*4882a593Smuzhiyun 		goto done_load;
290*4882a593Smuzhiyun 	}
291*4882a593Smuzhiyun 
292*4882a593Smuzhiyun 	emulated = EMULATE_DONE;
293*4882a593Smuzhiyun 
294*4882a593Smuzhiyun 	/* put in registers */
295*4882a593Smuzhiyun 	kvm_cvt_fd(&tmp[0], &VCPU_FPR(vcpu, rs));
296*4882a593Smuzhiyun 	vcpu->arch.qpr[rs] = tmp[1];
297*4882a593Smuzhiyun 
298*4882a593Smuzhiyun 	dprintk(KERN_INFO "KVM: PSQ_LD [0x%x, 0x%x] at 0x%lx (%d)\n", tmp[0],
299*4882a593Smuzhiyun 			  tmp[1], addr, w ? 4 : 8);
300*4882a593Smuzhiyun 
301*4882a593Smuzhiyun done_load:
302*4882a593Smuzhiyun 	return emulated;
303*4882a593Smuzhiyun }
304*4882a593Smuzhiyun 
kvmppc_emulate_psq_store(struct kvm_vcpu * vcpu,int rs,ulong addr,bool w,int i)305*4882a593Smuzhiyun static int kvmppc_emulate_psq_store(struct kvm_vcpu *vcpu,
306*4882a593Smuzhiyun 				    int rs, ulong addr, bool w, int i)
307*4882a593Smuzhiyun {
308*4882a593Smuzhiyun 	int emulated = EMULATE_FAIL;
309*4882a593Smuzhiyun 	int r;
310*4882a593Smuzhiyun 	u32 tmp[2];
311*4882a593Smuzhiyun 	int len = w ? sizeof(u32) : sizeof(u64);
312*4882a593Smuzhiyun 
313*4882a593Smuzhiyun 	kvm_cvt_df(&VCPU_FPR(vcpu, rs), &tmp[0]);
314*4882a593Smuzhiyun 	tmp[1] = vcpu->arch.qpr[rs];
315*4882a593Smuzhiyun 
316*4882a593Smuzhiyun 	r = kvmppc_st(vcpu, &addr, len, tmp, true);
317*4882a593Smuzhiyun 	vcpu->arch.paddr_accessed = addr;
318*4882a593Smuzhiyun 	if (r < 0) {
319*4882a593Smuzhiyun 		kvmppc_inject_pf(vcpu, addr, true);
320*4882a593Smuzhiyun 	} else if ((r == EMULATE_DO_MMIO) && w) {
321*4882a593Smuzhiyun 		emulated = kvmppc_handle_store(vcpu, tmp[0], 4, 1);
322*4882a593Smuzhiyun 	} else if (r == EMULATE_DO_MMIO) {
323*4882a593Smuzhiyun 		u64 val = ((u64)tmp[0] << 32) | tmp[1];
324*4882a593Smuzhiyun 		emulated = kvmppc_handle_store(vcpu, val, 8, 1);
325*4882a593Smuzhiyun 	} else {
326*4882a593Smuzhiyun 		emulated = EMULATE_DONE;
327*4882a593Smuzhiyun 	}
328*4882a593Smuzhiyun 
329*4882a593Smuzhiyun 	dprintk(KERN_INFO "KVM: PSQ_ST [0x%x, 0x%x] at 0x%lx (%d)\n",
330*4882a593Smuzhiyun 			  tmp[0], tmp[1], addr, len);
331*4882a593Smuzhiyun 
332*4882a593Smuzhiyun 	return emulated;
333*4882a593Smuzhiyun }
334*4882a593Smuzhiyun 
335*4882a593Smuzhiyun /*
336*4882a593Smuzhiyun  * Cuts out inst bits with ordering according to spec.
337*4882a593Smuzhiyun  * That means the leftmost bit is zero. All given bits are included.
338*4882a593Smuzhiyun  */
inst_get_field(u32 inst,int msb,int lsb)339*4882a593Smuzhiyun static inline u32 inst_get_field(u32 inst, int msb, int lsb)
340*4882a593Smuzhiyun {
341*4882a593Smuzhiyun 	return kvmppc_get_field(inst, msb + 32, lsb + 32);
342*4882a593Smuzhiyun }
343*4882a593Smuzhiyun 
kvmppc_inst_is_paired_single(struct kvm_vcpu * vcpu,u32 inst)344*4882a593Smuzhiyun static bool kvmppc_inst_is_paired_single(struct kvm_vcpu *vcpu, u32 inst)
345*4882a593Smuzhiyun {
346*4882a593Smuzhiyun 	if (!(vcpu->arch.hflags & BOOK3S_HFLAG_PAIRED_SINGLE))
347*4882a593Smuzhiyun 		return false;
348*4882a593Smuzhiyun 
349*4882a593Smuzhiyun 	switch (get_op(inst)) {
350*4882a593Smuzhiyun 	case OP_PSQ_L:
351*4882a593Smuzhiyun 	case OP_PSQ_LU:
352*4882a593Smuzhiyun 	case OP_PSQ_ST:
353*4882a593Smuzhiyun 	case OP_PSQ_STU:
354*4882a593Smuzhiyun 	case OP_LFS:
355*4882a593Smuzhiyun 	case OP_LFSU:
356*4882a593Smuzhiyun 	case OP_LFD:
357*4882a593Smuzhiyun 	case OP_LFDU:
358*4882a593Smuzhiyun 	case OP_STFS:
359*4882a593Smuzhiyun 	case OP_STFSU:
360*4882a593Smuzhiyun 	case OP_STFD:
361*4882a593Smuzhiyun 	case OP_STFDU:
362*4882a593Smuzhiyun 		return true;
363*4882a593Smuzhiyun 	case 4:
364*4882a593Smuzhiyun 		/* X form */
365*4882a593Smuzhiyun 		switch (inst_get_field(inst, 21, 30)) {
366*4882a593Smuzhiyun 		case OP_4X_PS_CMPU0:
367*4882a593Smuzhiyun 		case OP_4X_PSQ_LX:
368*4882a593Smuzhiyun 		case OP_4X_PS_CMPO0:
369*4882a593Smuzhiyun 		case OP_4X_PSQ_LUX:
370*4882a593Smuzhiyun 		case OP_4X_PS_NEG:
371*4882a593Smuzhiyun 		case OP_4X_PS_CMPU1:
372*4882a593Smuzhiyun 		case OP_4X_PS_MR:
373*4882a593Smuzhiyun 		case OP_4X_PS_CMPO1:
374*4882a593Smuzhiyun 		case OP_4X_PS_NABS:
375*4882a593Smuzhiyun 		case OP_4X_PS_ABS:
376*4882a593Smuzhiyun 		case OP_4X_PS_MERGE00:
377*4882a593Smuzhiyun 		case OP_4X_PS_MERGE01:
378*4882a593Smuzhiyun 		case OP_4X_PS_MERGE10:
379*4882a593Smuzhiyun 		case OP_4X_PS_MERGE11:
380*4882a593Smuzhiyun 			return true;
381*4882a593Smuzhiyun 		}
382*4882a593Smuzhiyun 		/* XW form */
383*4882a593Smuzhiyun 		switch (inst_get_field(inst, 25, 30)) {
384*4882a593Smuzhiyun 		case OP_4XW_PSQ_STX:
385*4882a593Smuzhiyun 		case OP_4XW_PSQ_STUX:
386*4882a593Smuzhiyun 			return true;
387*4882a593Smuzhiyun 		}
388*4882a593Smuzhiyun 		/* A form */
389*4882a593Smuzhiyun 		switch (inst_get_field(inst, 26, 30)) {
390*4882a593Smuzhiyun 		case OP_4A_PS_SUM1:
391*4882a593Smuzhiyun 		case OP_4A_PS_SUM0:
392*4882a593Smuzhiyun 		case OP_4A_PS_MULS0:
393*4882a593Smuzhiyun 		case OP_4A_PS_MULS1:
394*4882a593Smuzhiyun 		case OP_4A_PS_MADDS0:
395*4882a593Smuzhiyun 		case OP_4A_PS_MADDS1:
396*4882a593Smuzhiyun 		case OP_4A_PS_DIV:
397*4882a593Smuzhiyun 		case OP_4A_PS_SUB:
398*4882a593Smuzhiyun 		case OP_4A_PS_ADD:
399*4882a593Smuzhiyun 		case OP_4A_PS_SEL:
400*4882a593Smuzhiyun 		case OP_4A_PS_RES:
401*4882a593Smuzhiyun 		case OP_4A_PS_MUL:
402*4882a593Smuzhiyun 		case OP_4A_PS_RSQRTE:
403*4882a593Smuzhiyun 		case OP_4A_PS_MSUB:
404*4882a593Smuzhiyun 		case OP_4A_PS_MADD:
405*4882a593Smuzhiyun 		case OP_4A_PS_NMSUB:
406*4882a593Smuzhiyun 		case OP_4A_PS_NMADD:
407*4882a593Smuzhiyun 			return true;
408*4882a593Smuzhiyun 		}
409*4882a593Smuzhiyun 		break;
410*4882a593Smuzhiyun 	case 59:
411*4882a593Smuzhiyun 		switch (inst_get_field(inst, 21, 30)) {
412*4882a593Smuzhiyun 		case OP_59_FADDS:
413*4882a593Smuzhiyun 		case OP_59_FSUBS:
414*4882a593Smuzhiyun 		case OP_59_FDIVS:
415*4882a593Smuzhiyun 		case OP_59_FRES:
416*4882a593Smuzhiyun 		case OP_59_FRSQRTES:
417*4882a593Smuzhiyun 			return true;
418*4882a593Smuzhiyun 		}
419*4882a593Smuzhiyun 		switch (inst_get_field(inst, 26, 30)) {
420*4882a593Smuzhiyun 		case OP_59_FMULS:
421*4882a593Smuzhiyun 		case OP_59_FMSUBS:
422*4882a593Smuzhiyun 		case OP_59_FMADDS:
423*4882a593Smuzhiyun 		case OP_59_FNMSUBS:
424*4882a593Smuzhiyun 		case OP_59_FNMADDS:
425*4882a593Smuzhiyun 			return true;
426*4882a593Smuzhiyun 		}
427*4882a593Smuzhiyun 		break;
428*4882a593Smuzhiyun 	case 63:
429*4882a593Smuzhiyun 		switch (inst_get_field(inst, 21, 30)) {
430*4882a593Smuzhiyun 		case OP_63_MTFSB0:
431*4882a593Smuzhiyun 		case OP_63_MTFSB1:
432*4882a593Smuzhiyun 		case OP_63_MTFSF:
433*4882a593Smuzhiyun 		case OP_63_MTFSFI:
434*4882a593Smuzhiyun 		case OP_63_MCRFS:
435*4882a593Smuzhiyun 		case OP_63_MFFS:
436*4882a593Smuzhiyun 		case OP_63_FCMPU:
437*4882a593Smuzhiyun 		case OP_63_FCMPO:
438*4882a593Smuzhiyun 		case OP_63_FNEG:
439*4882a593Smuzhiyun 		case OP_63_FMR:
440*4882a593Smuzhiyun 		case OP_63_FABS:
441*4882a593Smuzhiyun 		case OP_63_FRSP:
442*4882a593Smuzhiyun 		case OP_63_FDIV:
443*4882a593Smuzhiyun 		case OP_63_FADD:
444*4882a593Smuzhiyun 		case OP_63_FSUB:
445*4882a593Smuzhiyun 		case OP_63_FCTIW:
446*4882a593Smuzhiyun 		case OP_63_FCTIWZ:
447*4882a593Smuzhiyun 		case OP_63_FRSQRTE:
448*4882a593Smuzhiyun 		case OP_63_FCPSGN:
449*4882a593Smuzhiyun 			return true;
450*4882a593Smuzhiyun 		}
451*4882a593Smuzhiyun 		switch (inst_get_field(inst, 26, 30)) {
452*4882a593Smuzhiyun 		case OP_63_FMUL:
453*4882a593Smuzhiyun 		case OP_63_FSEL:
454*4882a593Smuzhiyun 		case OP_63_FMSUB:
455*4882a593Smuzhiyun 		case OP_63_FMADD:
456*4882a593Smuzhiyun 		case OP_63_FNMSUB:
457*4882a593Smuzhiyun 		case OP_63_FNMADD:
458*4882a593Smuzhiyun 			return true;
459*4882a593Smuzhiyun 		}
460*4882a593Smuzhiyun 		break;
461*4882a593Smuzhiyun 	case 31:
462*4882a593Smuzhiyun 		switch (inst_get_field(inst, 21, 30)) {
463*4882a593Smuzhiyun 		case OP_31_LFSX:
464*4882a593Smuzhiyun 		case OP_31_LFSUX:
465*4882a593Smuzhiyun 		case OP_31_LFDX:
466*4882a593Smuzhiyun 		case OP_31_LFDUX:
467*4882a593Smuzhiyun 		case OP_31_STFSX:
468*4882a593Smuzhiyun 		case OP_31_STFSUX:
469*4882a593Smuzhiyun 		case OP_31_STFX:
470*4882a593Smuzhiyun 		case OP_31_STFUX:
471*4882a593Smuzhiyun 		case OP_31_STFIWX:
472*4882a593Smuzhiyun 			return true;
473*4882a593Smuzhiyun 		}
474*4882a593Smuzhiyun 		break;
475*4882a593Smuzhiyun 	}
476*4882a593Smuzhiyun 
477*4882a593Smuzhiyun 	return false;
478*4882a593Smuzhiyun }
479*4882a593Smuzhiyun 
get_d_signext(u32 inst)480*4882a593Smuzhiyun static int get_d_signext(u32 inst)
481*4882a593Smuzhiyun {
482*4882a593Smuzhiyun 	int d = inst & 0x8ff;
483*4882a593Smuzhiyun 
484*4882a593Smuzhiyun 	if (d & 0x800)
485*4882a593Smuzhiyun 		return -(d & 0x7ff);
486*4882a593Smuzhiyun 
487*4882a593Smuzhiyun 	return (d & 0x7ff);
488*4882a593Smuzhiyun }
489*4882a593Smuzhiyun 
kvmppc_ps_three_in(struct kvm_vcpu * vcpu,bool rc,int reg_out,int reg_in1,int reg_in2,int reg_in3,int scalar,void (* func)(u64 * fpscr,u32 * dst,u32 * src1,u32 * src2,u32 * src3))490*4882a593Smuzhiyun static int kvmppc_ps_three_in(struct kvm_vcpu *vcpu, bool rc,
491*4882a593Smuzhiyun 				      int reg_out, int reg_in1, int reg_in2,
492*4882a593Smuzhiyun 				      int reg_in3, int scalar,
493*4882a593Smuzhiyun 				      void (*func)(u64 *fpscr,
494*4882a593Smuzhiyun 						 u32 *dst, u32 *src1,
495*4882a593Smuzhiyun 						 u32 *src2, u32 *src3))
496*4882a593Smuzhiyun {
497*4882a593Smuzhiyun 	u32 *qpr = vcpu->arch.qpr;
498*4882a593Smuzhiyun 	u32 ps0_out;
499*4882a593Smuzhiyun 	u32 ps0_in1, ps0_in2, ps0_in3;
500*4882a593Smuzhiyun 	u32 ps1_in1, ps1_in2, ps1_in3;
501*4882a593Smuzhiyun 
502*4882a593Smuzhiyun 	/* RC */
503*4882a593Smuzhiyun 	WARN_ON(rc);
504*4882a593Smuzhiyun 
505*4882a593Smuzhiyun 	/* PS0 */
506*4882a593Smuzhiyun 	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in1), &ps0_in1);
507*4882a593Smuzhiyun 	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in2), &ps0_in2);
508*4882a593Smuzhiyun 	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in3), &ps0_in3);
509*4882a593Smuzhiyun 
510*4882a593Smuzhiyun 	if (scalar & SCALAR_LOW)
511*4882a593Smuzhiyun 		ps0_in2 = qpr[reg_in2];
512*4882a593Smuzhiyun 
513*4882a593Smuzhiyun 	func(&vcpu->arch.fp.fpscr, &ps0_out, &ps0_in1, &ps0_in2, &ps0_in3);
514*4882a593Smuzhiyun 
515*4882a593Smuzhiyun 	dprintk(KERN_INFO "PS3 ps0 -> f(0x%x, 0x%x, 0x%x) = 0x%x\n",
516*4882a593Smuzhiyun 			  ps0_in1, ps0_in2, ps0_in3, ps0_out);
517*4882a593Smuzhiyun 
518*4882a593Smuzhiyun 	if (!(scalar & SCALAR_NO_PS0))
519*4882a593Smuzhiyun 		kvm_cvt_fd(&ps0_out, &VCPU_FPR(vcpu, reg_out));
520*4882a593Smuzhiyun 
521*4882a593Smuzhiyun 	/* PS1 */
522*4882a593Smuzhiyun 	ps1_in1 = qpr[reg_in1];
523*4882a593Smuzhiyun 	ps1_in2 = qpr[reg_in2];
524*4882a593Smuzhiyun 	ps1_in3 = qpr[reg_in3];
525*4882a593Smuzhiyun 
526*4882a593Smuzhiyun 	if (scalar & SCALAR_HIGH)
527*4882a593Smuzhiyun 		ps1_in2 = ps0_in2;
528*4882a593Smuzhiyun 
529*4882a593Smuzhiyun 	if (!(scalar & SCALAR_NO_PS1))
530*4882a593Smuzhiyun 		func(&vcpu->arch.fp.fpscr, &qpr[reg_out], &ps1_in1, &ps1_in2, &ps1_in3);
531*4882a593Smuzhiyun 
532*4882a593Smuzhiyun 	dprintk(KERN_INFO "PS3 ps1 -> f(0x%x, 0x%x, 0x%x) = 0x%x\n",
533*4882a593Smuzhiyun 			  ps1_in1, ps1_in2, ps1_in3, qpr[reg_out]);
534*4882a593Smuzhiyun 
535*4882a593Smuzhiyun 	return EMULATE_DONE;
536*4882a593Smuzhiyun }
537*4882a593Smuzhiyun 
kvmppc_ps_two_in(struct kvm_vcpu * vcpu,bool rc,int reg_out,int reg_in1,int reg_in2,int scalar,void (* func)(u64 * fpscr,u32 * dst,u32 * src1,u32 * src2))538*4882a593Smuzhiyun static int kvmppc_ps_two_in(struct kvm_vcpu *vcpu, bool rc,
539*4882a593Smuzhiyun 				    int reg_out, int reg_in1, int reg_in2,
540*4882a593Smuzhiyun 				    int scalar,
541*4882a593Smuzhiyun 				    void (*func)(u64 *fpscr,
542*4882a593Smuzhiyun 						 u32 *dst, u32 *src1,
543*4882a593Smuzhiyun 						 u32 *src2))
544*4882a593Smuzhiyun {
545*4882a593Smuzhiyun 	u32 *qpr = vcpu->arch.qpr;
546*4882a593Smuzhiyun 	u32 ps0_out;
547*4882a593Smuzhiyun 	u32 ps0_in1, ps0_in2;
548*4882a593Smuzhiyun 	u32 ps1_out;
549*4882a593Smuzhiyun 	u32 ps1_in1, ps1_in2;
550*4882a593Smuzhiyun 
551*4882a593Smuzhiyun 	/* RC */
552*4882a593Smuzhiyun 	WARN_ON(rc);
553*4882a593Smuzhiyun 
554*4882a593Smuzhiyun 	/* PS0 */
555*4882a593Smuzhiyun 	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in1), &ps0_in1);
556*4882a593Smuzhiyun 
557*4882a593Smuzhiyun 	if (scalar & SCALAR_LOW)
558*4882a593Smuzhiyun 		ps0_in2 = qpr[reg_in2];
559*4882a593Smuzhiyun 	else
560*4882a593Smuzhiyun 		kvm_cvt_df(&VCPU_FPR(vcpu, reg_in2), &ps0_in2);
561*4882a593Smuzhiyun 
562*4882a593Smuzhiyun 	func(&vcpu->arch.fp.fpscr, &ps0_out, &ps0_in1, &ps0_in2);
563*4882a593Smuzhiyun 
564*4882a593Smuzhiyun 	if (!(scalar & SCALAR_NO_PS0)) {
565*4882a593Smuzhiyun 		dprintk(KERN_INFO "PS2 ps0 -> f(0x%x, 0x%x) = 0x%x\n",
566*4882a593Smuzhiyun 				  ps0_in1, ps0_in2, ps0_out);
567*4882a593Smuzhiyun 
568*4882a593Smuzhiyun 		kvm_cvt_fd(&ps0_out, &VCPU_FPR(vcpu, reg_out));
569*4882a593Smuzhiyun 	}
570*4882a593Smuzhiyun 
571*4882a593Smuzhiyun 	/* PS1 */
572*4882a593Smuzhiyun 	ps1_in1 = qpr[reg_in1];
573*4882a593Smuzhiyun 	ps1_in2 = qpr[reg_in2];
574*4882a593Smuzhiyun 
575*4882a593Smuzhiyun 	if (scalar & SCALAR_HIGH)
576*4882a593Smuzhiyun 		ps1_in2 = ps0_in2;
577*4882a593Smuzhiyun 
578*4882a593Smuzhiyun 	func(&vcpu->arch.fp.fpscr, &ps1_out, &ps1_in1, &ps1_in2);
579*4882a593Smuzhiyun 
580*4882a593Smuzhiyun 	if (!(scalar & SCALAR_NO_PS1)) {
581*4882a593Smuzhiyun 		qpr[reg_out] = ps1_out;
582*4882a593Smuzhiyun 
583*4882a593Smuzhiyun 		dprintk(KERN_INFO "PS2 ps1 -> f(0x%x, 0x%x) = 0x%x\n",
584*4882a593Smuzhiyun 				  ps1_in1, ps1_in2, qpr[reg_out]);
585*4882a593Smuzhiyun 	}
586*4882a593Smuzhiyun 
587*4882a593Smuzhiyun 	return EMULATE_DONE;
588*4882a593Smuzhiyun }
589*4882a593Smuzhiyun 
kvmppc_ps_one_in(struct kvm_vcpu * vcpu,bool rc,int reg_out,int reg_in,void (* func)(u64 * t,u32 * dst,u32 * src1))590*4882a593Smuzhiyun static int kvmppc_ps_one_in(struct kvm_vcpu *vcpu, bool rc,
591*4882a593Smuzhiyun 				    int reg_out, int reg_in,
592*4882a593Smuzhiyun 				    void (*func)(u64 *t,
593*4882a593Smuzhiyun 						 u32 *dst, u32 *src1))
594*4882a593Smuzhiyun {
595*4882a593Smuzhiyun 	u32 *qpr = vcpu->arch.qpr;
596*4882a593Smuzhiyun 	u32 ps0_out, ps0_in;
597*4882a593Smuzhiyun 	u32 ps1_in;
598*4882a593Smuzhiyun 
599*4882a593Smuzhiyun 	/* RC */
600*4882a593Smuzhiyun 	WARN_ON(rc);
601*4882a593Smuzhiyun 
602*4882a593Smuzhiyun 	/* PS0 */
603*4882a593Smuzhiyun 	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in), &ps0_in);
604*4882a593Smuzhiyun 	func(&vcpu->arch.fp.fpscr, &ps0_out, &ps0_in);
605*4882a593Smuzhiyun 
606*4882a593Smuzhiyun 	dprintk(KERN_INFO "PS1 ps0 -> f(0x%x) = 0x%x\n",
607*4882a593Smuzhiyun 			  ps0_in, ps0_out);
608*4882a593Smuzhiyun 
609*4882a593Smuzhiyun 	kvm_cvt_fd(&ps0_out, &VCPU_FPR(vcpu, reg_out));
610*4882a593Smuzhiyun 
611*4882a593Smuzhiyun 	/* PS1 */
612*4882a593Smuzhiyun 	ps1_in = qpr[reg_in];
613*4882a593Smuzhiyun 	func(&vcpu->arch.fp.fpscr, &qpr[reg_out], &ps1_in);
614*4882a593Smuzhiyun 
615*4882a593Smuzhiyun 	dprintk(KERN_INFO "PS1 ps1 -> f(0x%x) = 0x%x\n",
616*4882a593Smuzhiyun 			  ps1_in, qpr[reg_out]);
617*4882a593Smuzhiyun 
618*4882a593Smuzhiyun 	return EMULATE_DONE;
619*4882a593Smuzhiyun }
620*4882a593Smuzhiyun 
kvmppc_emulate_paired_single(struct kvm_vcpu * vcpu)621*4882a593Smuzhiyun int kvmppc_emulate_paired_single(struct kvm_vcpu *vcpu)
622*4882a593Smuzhiyun {
623*4882a593Smuzhiyun 	u32 inst;
624*4882a593Smuzhiyun 	enum emulation_result emulated = EMULATE_DONE;
625*4882a593Smuzhiyun 	int ax_rd, ax_ra, ax_rb, ax_rc;
626*4882a593Smuzhiyun 	short full_d;
627*4882a593Smuzhiyun 	u64 *fpr_d, *fpr_a, *fpr_b, *fpr_c;
628*4882a593Smuzhiyun 
629*4882a593Smuzhiyun 	bool rcomp;
630*4882a593Smuzhiyun 	u32 cr;
631*4882a593Smuzhiyun #ifdef DEBUG
632*4882a593Smuzhiyun 	int i;
633*4882a593Smuzhiyun #endif
634*4882a593Smuzhiyun 
635*4882a593Smuzhiyun 	emulated = kvmppc_get_last_inst(vcpu, INST_GENERIC, &inst);
636*4882a593Smuzhiyun 	if (emulated != EMULATE_DONE)
637*4882a593Smuzhiyun 		return emulated;
638*4882a593Smuzhiyun 
639*4882a593Smuzhiyun 	ax_rd = inst_get_field(inst, 6, 10);
640*4882a593Smuzhiyun 	ax_ra = inst_get_field(inst, 11, 15);
641*4882a593Smuzhiyun 	ax_rb = inst_get_field(inst, 16, 20);
642*4882a593Smuzhiyun 	ax_rc = inst_get_field(inst, 21, 25);
643*4882a593Smuzhiyun 	full_d = inst_get_field(inst, 16, 31);
644*4882a593Smuzhiyun 
645*4882a593Smuzhiyun 	fpr_d = &VCPU_FPR(vcpu, ax_rd);
646*4882a593Smuzhiyun 	fpr_a = &VCPU_FPR(vcpu, ax_ra);
647*4882a593Smuzhiyun 	fpr_b = &VCPU_FPR(vcpu, ax_rb);
648*4882a593Smuzhiyun 	fpr_c = &VCPU_FPR(vcpu, ax_rc);
649*4882a593Smuzhiyun 
650*4882a593Smuzhiyun 	rcomp = (inst & 1) ? true : false;
651*4882a593Smuzhiyun 	cr = kvmppc_get_cr(vcpu);
652*4882a593Smuzhiyun 
653*4882a593Smuzhiyun 	if (!kvmppc_inst_is_paired_single(vcpu, inst))
654*4882a593Smuzhiyun 		return EMULATE_FAIL;
655*4882a593Smuzhiyun 
656*4882a593Smuzhiyun 	if (!(kvmppc_get_msr(vcpu) & MSR_FP)) {
657*4882a593Smuzhiyun 		kvmppc_book3s_queue_irqprio(vcpu, BOOK3S_INTERRUPT_FP_UNAVAIL);
658*4882a593Smuzhiyun 		return EMULATE_AGAIN;
659*4882a593Smuzhiyun 	}
660*4882a593Smuzhiyun 
661*4882a593Smuzhiyun 	kvmppc_giveup_ext(vcpu, MSR_FP);
662*4882a593Smuzhiyun 	preempt_disable();
663*4882a593Smuzhiyun 	enable_kernel_fp();
664*4882a593Smuzhiyun 	/* Do we need to clear FE0 / FE1 here? Don't think so. */
665*4882a593Smuzhiyun 
666*4882a593Smuzhiyun #ifdef DEBUG
667*4882a593Smuzhiyun 	for (i = 0; i < ARRAY_SIZE(vcpu->arch.fp.fpr); i++) {
668*4882a593Smuzhiyun 		u32 f;
669*4882a593Smuzhiyun 		kvm_cvt_df(&VCPU_FPR(vcpu, i), &f);
670*4882a593Smuzhiyun 		dprintk(KERN_INFO "FPR[%d] = 0x%x / 0x%llx    QPR[%d] = 0x%x\n",
671*4882a593Smuzhiyun 			i, f, VCPU_FPR(vcpu, i), i, vcpu->arch.qpr[i]);
672*4882a593Smuzhiyun 	}
673*4882a593Smuzhiyun #endif
674*4882a593Smuzhiyun 
675*4882a593Smuzhiyun 	switch (get_op(inst)) {
676*4882a593Smuzhiyun 	case OP_PSQ_L:
677*4882a593Smuzhiyun 	{
678*4882a593Smuzhiyun 		ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;
679*4882a593Smuzhiyun 		bool w = inst_get_field(inst, 16, 16) ? true : false;
680*4882a593Smuzhiyun 		int i = inst_get_field(inst, 17, 19);
681*4882a593Smuzhiyun 
682*4882a593Smuzhiyun 		addr += get_d_signext(inst);
683*4882a593Smuzhiyun 		emulated = kvmppc_emulate_psq_load(vcpu, ax_rd, addr, w, i);
684*4882a593Smuzhiyun 		break;
685*4882a593Smuzhiyun 	}
686*4882a593Smuzhiyun 	case OP_PSQ_LU:
687*4882a593Smuzhiyun 	{
688*4882a593Smuzhiyun 		ulong addr = kvmppc_get_gpr(vcpu, ax_ra);
689*4882a593Smuzhiyun 		bool w = inst_get_field(inst, 16, 16) ? true : false;
690*4882a593Smuzhiyun 		int i = inst_get_field(inst, 17, 19);
691*4882a593Smuzhiyun 
692*4882a593Smuzhiyun 		addr += get_d_signext(inst);
693*4882a593Smuzhiyun 		emulated = kvmppc_emulate_psq_load(vcpu, ax_rd, addr, w, i);
694*4882a593Smuzhiyun 
695*4882a593Smuzhiyun 		if (emulated == EMULATE_DONE)
696*4882a593Smuzhiyun 			kvmppc_set_gpr(vcpu, ax_ra, addr);
697*4882a593Smuzhiyun 		break;
698*4882a593Smuzhiyun 	}
699*4882a593Smuzhiyun 	case OP_PSQ_ST:
700*4882a593Smuzhiyun 	{
701*4882a593Smuzhiyun 		ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;
702*4882a593Smuzhiyun 		bool w = inst_get_field(inst, 16, 16) ? true : false;
703*4882a593Smuzhiyun 		int i = inst_get_field(inst, 17, 19);
704*4882a593Smuzhiyun 
705*4882a593Smuzhiyun 		addr += get_d_signext(inst);
706*4882a593Smuzhiyun 		emulated = kvmppc_emulate_psq_store(vcpu, ax_rd, addr, w, i);
707*4882a593Smuzhiyun 		break;
708*4882a593Smuzhiyun 	}
709*4882a593Smuzhiyun 	case OP_PSQ_STU:
710*4882a593Smuzhiyun 	{
711*4882a593Smuzhiyun 		ulong addr = kvmppc_get_gpr(vcpu, ax_ra);
712*4882a593Smuzhiyun 		bool w = inst_get_field(inst, 16, 16) ? true : false;
713*4882a593Smuzhiyun 		int i = inst_get_field(inst, 17, 19);
714*4882a593Smuzhiyun 
715*4882a593Smuzhiyun 		addr += get_d_signext(inst);
716*4882a593Smuzhiyun 		emulated = kvmppc_emulate_psq_store(vcpu, ax_rd, addr, w, i);
717*4882a593Smuzhiyun 
718*4882a593Smuzhiyun 		if (emulated == EMULATE_DONE)
719*4882a593Smuzhiyun 			kvmppc_set_gpr(vcpu, ax_ra, addr);
720*4882a593Smuzhiyun 		break;
721*4882a593Smuzhiyun 	}
722*4882a593Smuzhiyun 	case 4:
723*4882a593Smuzhiyun 		/* X form */
724*4882a593Smuzhiyun 		switch (inst_get_field(inst, 21, 30)) {
725*4882a593Smuzhiyun 		case OP_4X_PS_CMPU0:
726*4882a593Smuzhiyun 			/* XXX */
727*4882a593Smuzhiyun 			emulated = EMULATE_FAIL;
728*4882a593Smuzhiyun 			break;
729*4882a593Smuzhiyun 		case OP_4X_PSQ_LX:
730*4882a593Smuzhiyun 		{
731*4882a593Smuzhiyun 			ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;
732*4882a593Smuzhiyun 			bool w = inst_get_field(inst, 21, 21) ? true : false;
733*4882a593Smuzhiyun 			int i = inst_get_field(inst, 22, 24);
734*4882a593Smuzhiyun 
735*4882a593Smuzhiyun 			addr += kvmppc_get_gpr(vcpu, ax_rb);
736*4882a593Smuzhiyun 			emulated = kvmppc_emulate_psq_load(vcpu, ax_rd, addr, w, i);
737*4882a593Smuzhiyun 			break;
738*4882a593Smuzhiyun 		}
739*4882a593Smuzhiyun 		case OP_4X_PS_CMPO0:
740*4882a593Smuzhiyun 			/* XXX */
741*4882a593Smuzhiyun 			emulated = EMULATE_FAIL;
742*4882a593Smuzhiyun 			break;
743*4882a593Smuzhiyun 		case OP_4X_PSQ_LUX:
744*4882a593Smuzhiyun 		{
745*4882a593Smuzhiyun 			ulong addr = kvmppc_get_gpr(vcpu, ax_ra);
746*4882a593Smuzhiyun 			bool w = inst_get_field(inst, 21, 21) ? true : false;
747*4882a593Smuzhiyun 			int i = inst_get_field(inst, 22, 24);
748*4882a593Smuzhiyun 
749*4882a593Smuzhiyun 			addr += kvmppc_get_gpr(vcpu, ax_rb);
750*4882a593Smuzhiyun 			emulated = kvmppc_emulate_psq_load(vcpu, ax_rd, addr, w, i);
751*4882a593Smuzhiyun 
752*4882a593Smuzhiyun 			if (emulated == EMULATE_DONE)
753*4882a593Smuzhiyun 				kvmppc_set_gpr(vcpu, ax_ra, addr);
754*4882a593Smuzhiyun 			break;
755*4882a593Smuzhiyun 		}
756*4882a593Smuzhiyun 		case OP_4X_PS_NEG:
757*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rb);
758*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) ^= 0x8000000000000000ULL;
759*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
760*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] ^= 0x80000000;
761*4882a593Smuzhiyun 			break;
762*4882a593Smuzhiyun 		case OP_4X_PS_CMPU1:
763*4882a593Smuzhiyun 			/* XXX */
764*4882a593Smuzhiyun 			emulated = EMULATE_FAIL;
765*4882a593Smuzhiyun 			break;
766*4882a593Smuzhiyun 		case OP_4X_PS_MR:
767*4882a593Smuzhiyun 			WARN_ON(rcomp);
768*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rb);
769*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
770*4882a593Smuzhiyun 			break;
771*4882a593Smuzhiyun 		case OP_4X_PS_CMPO1:
772*4882a593Smuzhiyun 			/* XXX */
773*4882a593Smuzhiyun 			emulated = EMULATE_FAIL;
774*4882a593Smuzhiyun 			break;
775*4882a593Smuzhiyun 		case OP_4X_PS_NABS:
776*4882a593Smuzhiyun 			WARN_ON(rcomp);
777*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rb);
778*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) |= 0x8000000000000000ULL;
779*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
780*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] |= 0x80000000;
781*4882a593Smuzhiyun 			break;
782*4882a593Smuzhiyun 		case OP_4X_PS_ABS:
783*4882a593Smuzhiyun 			WARN_ON(rcomp);
784*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rb);
785*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) &= ~0x8000000000000000ULL;
786*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
787*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] &= ~0x80000000;
788*4882a593Smuzhiyun 			break;
789*4882a593Smuzhiyun 		case OP_4X_PS_MERGE00:
790*4882a593Smuzhiyun 			WARN_ON(rcomp);
791*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_ra);
792*4882a593Smuzhiyun 			/* vcpu->arch.qpr[ax_rd] = VCPU_FPR(vcpu, ax_rb); */
793*4882a593Smuzhiyun 			kvm_cvt_df(&VCPU_FPR(vcpu, ax_rb),
794*4882a593Smuzhiyun 				   &vcpu->arch.qpr[ax_rd]);
795*4882a593Smuzhiyun 			break;
796*4882a593Smuzhiyun 		case OP_4X_PS_MERGE01:
797*4882a593Smuzhiyun 			WARN_ON(rcomp);
798*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_ra);
799*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
800*4882a593Smuzhiyun 			break;
801*4882a593Smuzhiyun 		case OP_4X_PS_MERGE10:
802*4882a593Smuzhiyun 			WARN_ON(rcomp);
803*4882a593Smuzhiyun 			/* VCPU_FPR(vcpu, ax_rd) = vcpu->arch.qpr[ax_ra]; */
804*4882a593Smuzhiyun 			kvm_cvt_fd(&vcpu->arch.qpr[ax_ra],
805*4882a593Smuzhiyun 				   &VCPU_FPR(vcpu, ax_rd));
806*4882a593Smuzhiyun 			/* vcpu->arch.qpr[ax_rd] = VCPU_FPR(vcpu, ax_rb); */
807*4882a593Smuzhiyun 			kvm_cvt_df(&VCPU_FPR(vcpu, ax_rb),
808*4882a593Smuzhiyun 				   &vcpu->arch.qpr[ax_rd]);
809*4882a593Smuzhiyun 			break;
810*4882a593Smuzhiyun 		case OP_4X_PS_MERGE11:
811*4882a593Smuzhiyun 			WARN_ON(rcomp);
812*4882a593Smuzhiyun 			/* VCPU_FPR(vcpu, ax_rd) = vcpu->arch.qpr[ax_ra]; */
813*4882a593Smuzhiyun 			kvm_cvt_fd(&vcpu->arch.qpr[ax_ra],
814*4882a593Smuzhiyun 				   &VCPU_FPR(vcpu, ax_rd));
815*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
816*4882a593Smuzhiyun 			break;
817*4882a593Smuzhiyun 		}
818*4882a593Smuzhiyun 		/* XW form */
819*4882a593Smuzhiyun 		switch (inst_get_field(inst, 25, 30)) {
820*4882a593Smuzhiyun 		case OP_4XW_PSQ_STX:
821*4882a593Smuzhiyun 		{
822*4882a593Smuzhiyun 			ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;
823*4882a593Smuzhiyun 			bool w = inst_get_field(inst, 21, 21) ? true : false;
824*4882a593Smuzhiyun 			int i = inst_get_field(inst, 22, 24);
825*4882a593Smuzhiyun 
826*4882a593Smuzhiyun 			addr += kvmppc_get_gpr(vcpu, ax_rb);
827*4882a593Smuzhiyun 			emulated = kvmppc_emulate_psq_store(vcpu, ax_rd, addr, w, i);
828*4882a593Smuzhiyun 			break;
829*4882a593Smuzhiyun 		}
830*4882a593Smuzhiyun 		case OP_4XW_PSQ_STUX:
831*4882a593Smuzhiyun 		{
832*4882a593Smuzhiyun 			ulong addr = kvmppc_get_gpr(vcpu, ax_ra);
833*4882a593Smuzhiyun 			bool w = inst_get_field(inst, 21, 21) ? true : false;
834*4882a593Smuzhiyun 			int i = inst_get_field(inst, 22, 24);
835*4882a593Smuzhiyun 
836*4882a593Smuzhiyun 			addr += kvmppc_get_gpr(vcpu, ax_rb);
837*4882a593Smuzhiyun 			emulated = kvmppc_emulate_psq_store(vcpu, ax_rd, addr, w, i);
838*4882a593Smuzhiyun 
839*4882a593Smuzhiyun 			if (emulated == EMULATE_DONE)
840*4882a593Smuzhiyun 				kvmppc_set_gpr(vcpu, ax_ra, addr);
841*4882a593Smuzhiyun 			break;
842*4882a593Smuzhiyun 		}
843*4882a593Smuzhiyun 		}
844*4882a593Smuzhiyun 		/* A form */
845*4882a593Smuzhiyun 		switch (inst_get_field(inst, 26, 30)) {
846*4882a593Smuzhiyun 		case OP_4A_PS_SUM1:
847*4882a593Smuzhiyun 			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
848*4882a593Smuzhiyun 					ax_rb, ax_ra, SCALAR_NO_PS0 | SCALAR_HIGH, fps_fadds);
849*4882a593Smuzhiyun 			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rc);
850*4882a593Smuzhiyun 			break;
851*4882a593Smuzhiyun 		case OP_4A_PS_SUM0:
852*4882a593Smuzhiyun 			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
853*4882a593Smuzhiyun 					ax_ra, ax_rb, SCALAR_NO_PS1 | SCALAR_LOW, fps_fadds);
854*4882a593Smuzhiyun 			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rc];
855*4882a593Smuzhiyun 			break;
856*4882a593Smuzhiyun 		case OP_4A_PS_MULS0:
857*4882a593Smuzhiyun 			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
858*4882a593Smuzhiyun 					ax_ra, ax_rc, SCALAR_HIGH, fps_fmuls);
859*4882a593Smuzhiyun 			break;
860*4882a593Smuzhiyun 		case OP_4A_PS_MULS1:
861*4882a593Smuzhiyun 			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
862*4882a593Smuzhiyun 					ax_ra, ax_rc, SCALAR_LOW, fps_fmuls);
863*4882a593Smuzhiyun 			break;
864*4882a593Smuzhiyun 		case OP_4A_PS_MADDS0:
865*4882a593Smuzhiyun 			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
866*4882a593Smuzhiyun 					ax_ra, ax_rc, ax_rb, SCALAR_HIGH, fps_fmadds);
867*4882a593Smuzhiyun 			break;
868*4882a593Smuzhiyun 		case OP_4A_PS_MADDS1:
869*4882a593Smuzhiyun 			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
870*4882a593Smuzhiyun 					ax_ra, ax_rc, ax_rb, SCALAR_LOW, fps_fmadds);
871*4882a593Smuzhiyun 			break;
872*4882a593Smuzhiyun 		case OP_4A_PS_DIV:
873*4882a593Smuzhiyun 			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
874*4882a593Smuzhiyun 					ax_ra, ax_rb, SCALAR_NONE, fps_fdivs);
875*4882a593Smuzhiyun 			break;
876*4882a593Smuzhiyun 		case OP_4A_PS_SUB:
877*4882a593Smuzhiyun 			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
878*4882a593Smuzhiyun 					ax_ra, ax_rb, SCALAR_NONE, fps_fsubs);
879*4882a593Smuzhiyun 			break;
880*4882a593Smuzhiyun 		case OP_4A_PS_ADD:
881*4882a593Smuzhiyun 			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
882*4882a593Smuzhiyun 					ax_ra, ax_rb, SCALAR_NONE, fps_fadds);
883*4882a593Smuzhiyun 			break;
884*4882a593Smuzhiyun 		case OP_4A_PS_SEL:
885*4882a593Smuzhiyun 			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
886*4882a593Smuzhiyun 					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fsel);
887*4882a593Smuzhiyun 			break;
888*4882a593Smuzhiyun 		case OP_4A_PS_RES:
889*4882a593Smuzhiyun 			emulated = kvmppc_ps_one_in(vcpu, rcomp, ax_rd,
890*4882a593Smuzhiyun 					ax_rb, fps_fres);
891*4882a593Smuzhiyun 			break;
892*4882a593Smuzhiyun 		case OP_4A_PS_MUL:
893*4882a593Smuzhiyun 			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
894*4882a593Smuzhiyun 					ax_ra, ax_rc, SCALAR_NONE, fps_fmuls);
895*4882a593Smuzhiyun 			break;
896*4882a593Smuzhiyun 		case OP_4A_PS_RSQRTE:
897*4882a593Smuzhiyun 			emulated = kvmppc_ps_one_in(vcpu, rcomp, ax_rd,
898*4882a593Smuzhiyun 					ax_rb, fps_frsqrte);
899*4882a593Smuzhiyun 			break;
900*4882a593Smuzhiyun 		case OP_4A_PS_MSUB:
901*4882a593Smuzhiyun 			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
902*4882a593Smuzhiyun 					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fmsubs);
903*4882a593Smuzhiyun 			break;
904*4882a593Smuzhiyun 		case OP_4A_PS_MADD:
905*4882a593Smuzhiyun 			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
906*4882a593Smuzhiyun 					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fmadds);
907*4882a593Smuzhiyun 			break;
908*4882a593Smuzhiyun 		case OP_4A_PS_NMSUB:
909*4882a593Smuzhiyun 			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
910*4882a593Smuzhiyun 					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fnmsubs);
911*4882a593Smuzhiyun 			break;
912*4882a593Smuzhiyun 		case OP_4A_PS_NMADD:
913*4882a593Smuzhiyun 			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
914*4882a593Smuzhiyun 					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fnmadds);
915*4882a593Smuzhiyun 			break;
916*4882a593Smuzhiyun 		}
917*4882a593Smuzhiyun 		break;
918*4882a593Smuzhiyun 
919*4882a593Smuzhiyun 	/* Real FPU operations */
920*4882a593Smuzhiyun 
921*4882a593Smuzhiyun 	case OP_LFS:
922*4882a593Smuzhiyun 	{
923*4882a593Smuzhiyun 		ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) + full_d;
924*4882a593Smuzhiyun 
925*4882a593Smuzhiyun 		emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd, addr,
926*4882a593Smuzhiyun 						   FPU_LS_SINGLE);
927*4882a593Smuzhiyun 		break;
928*4882a593Smuzhiyun 	}
929*4882a593Smuzhiyun 	case OP_LFSU:
930*4882a593Smuzhiyun 	{
931*4882a593Smuzhiyun 		ulong addr = kvmppc_get_gpr(vcpu, ax_ra) + full_d;
932*4882a593Smuzhiyun 
933*4882a593Smuzhiyun 		emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd, addr,
934*4882a593Smuzhiyun 						   FPU_LS_SINGLE);
935*4882a593Smuzhiyun 
936*4882a593Smuzhiyun 		if (emulated == EMULATE_DONE)
937*4882a593Smuzhiyun 			kvmppc_set_gpr(vcpu, ax_ra, addr);
938*4882a593Smuzhiyun 		break;
939*4882a593Smuzhiyun 	}
940*4882a593Smuzhiyun 	case OP_LFD:
941*4882a593Smuzhiyun 	{
942*4882a593Smuzhiyun 		ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) + full_d;
943*4882a593Smuzhiyun 
944*4882a593Smuzhiyun 		emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd, addr,
945*4882a593Smuzhiyun 						   FPU_LS_DOUBLE);
946*4882a593Smuzhiyun 		break;
947*4882a593Smuzhiyun 	}
948*4882a593Smuzhiyun 	case OP_LFDU:
949*4882a593Smuzhiyun 	{
950*4882a593Smuzhiyun 		ulong addr = kvmppc_get_gpr(vcpu, ax_ra) + full_d;
951*4882a593Smuzhiyun 
952*4882a593Smuzhiyun 		emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd, addr,
953*4882a593Smuzhiyun 						   FPU_LS_DOUBLE);
954*4882a593Smuzhiyun 
955*4882a593Smuzhiyun 		if (emulated == EMULATE_DONE)
956*4882a593Smuzhiyun 			kvmppc_set_gpr(vcpu, ax_ra, addr);
957*4882a593Smuzhiyun 		break;
958*4882a593Smuzhiyun 	}
959*4882a593Smuzhiyun 	case OP_STFS:
960*4882a593Smuzhiyun 	{
961*4882a593Smuzhiyun 		ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) + full_d;
962*4882a593Smuzhiyun 
963*4882a593Smuzhiyun 		emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd, addr,
964*4882a593Smuzhiyun 						    FPU_LS_SINGLE);
965*4882a593Smuzhiyun 		break;
966*4882a593Smuzhiyun 	}
967*4882a593Smuzhiyun 	case OP_STFSU:
968*4882a593Smuzhiyun 	{
969*4882a593Smuzhiyun 		ulong addr = kvmppc_get_gpr(vcpu, ax_ra) + full_d;
970*4882a593Smuzhiyun 
971*4882a593Smuzhiyun 		emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd, addr,
972*4882a593Smuzhiyun 						    FPU_LS_SINGLE);
973*4882a593Smuzhiyun 
974*4882a593Smuzhiyun 		if (emulated == EMULATE_DONE)
975*4882a593Smuzhiyun 			kvmppc_set_gpr(vcpu, ax_ra, addr);
976*4882a593Smuzhiyun 		break;
977*4882a593Smuzhiyun 	}
978*4882a593Smuzhiyun 	case OP_STFD:
979*4882a593Smuzhiyun 	{
980*4882a593Smuzhiyun 		ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) + full_d;
981*4882a593Smuzhiyun 
982*4882a593Smuzhiyun 		emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd, addr,
983*4882a593Smuzhiyun 						    FPU_LS_DOUBLE);
984*4882a593Smuzhiyun 		break;
985*4882a593Smuzhiyun 	}
986*4882a593Smuzhiyun 	case OP_STFDU:
987*4882a593Smuzhiyun 	{
988*4882a593Smuzhiyun 		ulong addr = kvmppc_get_gpr(vcpu, ax_ra) + full_d;
989*4882a593Smuzhiyun 
990*4882a593Smuzhiyun 		emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd, addr,
991*4882a593Smuzhiyun 						    FPU_LS_DOUBLE);
992*4882a593Smuzhiyun 
993*4882a593Smuzhiyun 		if (emulated == EMULATE_DONE)
994*4882a593Smuzhiyun 			kvmppc_set_gpr(vcpu, ax_ra, addr);
995*4882a593Smuzhiyun 		break;
996*4882a593Smuzhiyun 	}
997*4882a593Smuzhiyun 	case 31:
998*4882a593Smuzhiyun 		switch (inst_get_field(inst, 21, 30)) {
999*4882a593Smuzhiyun 		case OP_31_LFSX:
1000*4882a593Smuzhiyun 		{
1001*4882a593Smuzhiyun 			ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;
1002*4882a593Smuzhiyun 
1003*4882a593Smuzhiyun 			addr += kvmppc_get_gpr(vcpu, ax_rb);
1004*4882a593Smuzhiyun 			emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd,
1005*4882a593Smuzhiyun 							   addr, FPU_LS_SINGLE);
1006*4882a593Smuzhiyun 			break;
1007*4882a593Smuzhiyun 		}
1008*4882a593Smuzhiyun 		case OP_31_LFSUX:
1009*4882a593Smuzhiyun 		{
1010*4882a593Smuzhiyun 			ulong addr = kvmppc_get_gpr(vcpu, ax_ra) +
1011*4882a593Smuzhiyun 				     kvmppc_get_gpr(vcpu, ax_rb);
1012*4882a593Smuzhiyun 
1013*4882a593Smuzhiyun 			emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd,
1014*4882a593Smuzhiyun 							   addr, FPU_LS_SINGLE);
1015*4882a593Smuzhiyun 
1016*4882a593Smuzhiyun 			if (emulated == EMULATE_DONE)
1017*4882a593Smuzhiyun 				kvmppc_set_gpr(vcpu, ax_ra, addr);
1018*4882a593Smuzhiyun 			break;
1019*4882a593Smuzhiyun 		}
1020*4882a593Smuzhiyun 		case OP_31_LFDX:
1021*4882a593Smuzhiyun 		{
1022*4882a593Smuzhiyun 			ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) +
1023*4882a593Smuzhiyun 				     kvmppc_get_gpr(vcpu, ax_rb);
1024*4882a593Smuzhiyun 
1025*4882a593Smuzhiyun 			emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd,
1026*4882a593Smuzhiyun 							   addr, FPU_LS_DOUBLE);
1027*4882a593Smuzhiyun 			break;
1028*4882a593Smuzhiyun 		}
1029*4882a593Smuzhiyun 		case OP_31_LFDUX:
1030*4882a593Smuzhiyun 		{
1031*4882a593Smuzhiyun 			ulong addr = kvmppc_get_gpr(vcpu, ax_ra) +
1032*4882a593Smuzhiyun 				     kvmppc_get_gpr(vcpu, ax_rb);
1033*4882a593Smuzhiyun 
1034*4882a593Smuzhiyun 			emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd,
1035*4882a593Smuzhiyun 							   addr, FPU_LS_DOUBLE);
1036*4882a593Smuzhiyun 
1037*4882a593Smuzhiyun 			if (emulated == EMULATE_DONE)
1038*4882a593Smuzhiyun 				kvmppc_set_gpr(vcpu, ax_ra, addr);
1039*4882a593Smuzhiyun 			break;
1040*4882a593Smuzhiyun 		}
1041*4882a593Smuzhiyun 		case OP_31_STFSX:
1042*4882a593Smuzhiyun 		{
1043*4882a593Smuzhiyun 			ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) +
1044*4882a593Smuzhiyun 				     kvmppc_get_gpr(vcpu, ax_rb);
1045*4882a593Smuzhiyun 
1046*4882a593Smuzhiyun 			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
1047*4882a593Smuzhiyun 							    addr, FPU_LS_SINGLE);
1048*4882a593Smuzhiyun 			break;
1049*4882a593Smuzhiyun 		}
1050*4882a593Smuzhiyun 		case OP_31_STFSUX:
1051*4882a593Smuzhiyun 		{
1052*4882a593Smuzhiyun 			ulong addr = kvmppc_get_gpr(vcpu, ax_ra) +
1053*4882a593Smuzhiyun 				     kvmppc_get_gpr(vcpu, ax_rb);
1054*4882a593Smuzhiyun 
1055*4882a593Smuzhiyun 			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
1056*4882a593Smuzhiyun 							    addr, FPU_LS_SINGLE);
1057*4882a593Smuzhiyun 
1058*4882a593Smuzhiyun 			if (emulated == EMULATE_DONE)
1059*4882a593Smuzhiyun 				kvmppc_set_gpr(vcpu, ax_ra, addr);
1060*4882a593Smuzhiyun 			break;
1061*4882a593Smuzhiyun 		}
1062*4882a593Smuzhiyun 		case OP_31_STFX:
1063*4882a593Smuzhiyun 		{
1064*4882a593Smuzhiyun 			ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) +
1065*4882a593Smuzhiyun 				     kvmppc_get_gpr(vcpu, ax_rb);
1066*4882a593Smuzhiyun 
1067*4882a593Smuzhiyun 			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
1068*4882a593Smuzhiyun 							    addr, FPU_LS_DOUBLE);
1069*4882a593Smuzhiyun 			break;
1070*4882a593Smuzhiyun 		}
1071*4882a593Smuzhiyun 		case OP_31_STFUX:
1072*4882a593Smuzhiyun 		{
1073*4882a593Smuzhiyun 			ulong addr = kvmppc_get_gpr(vcpu, ax_ra) +
1074*4882a593Smuzhiyun 				     kvmppc_get_gpr(vcpu, ax_rb);
1075*4882a593Smuzhiyun 
1076*4882a593Smuzhiyun 			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
1077*4882a593Smuzhiyun 							    addr, FPU_LS_DOUBLE);
1078*4882a593Smuzhiyun 
1079*4882a593Smuzhiyun 			if (emulated == EMULATE_DONE)
1080*4882a593Smuzhiyun 				kvmppc_set_gpr(vcpu, ax_ra, addr);
1081*4882a593Smuzhiyun 			break;
1082*4882a593Smuzhiyun 		}
1083*4882a593Smuzhiyun 		case OP_31_STFIWX:
1084*4882a593Smuzhiyun 		{
1085*4882a593Smuzhiyun 			ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) +
1086*4882a593Smuzhiyun 				     kvmppc_get_gpr(vcpu, ax_rb);
1087*4882a593Smuzhiyun 
1088*4882a593Smuzhiyun 			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
1089*4882a593Smuzhiyun 							    addr,
1090*4882a593Smuzhiyun 							    FPU_LS_SINGLE_LOW);
1091*4882a593Smuzhiyun 			break;
1092*4882a593Smuzhiyun 		}
1093*4882a593Smuzhiyun 			break;
1094*4882a593Smuzhiyun 		}
1095*4882a593Smuzhiyun 		break;
1096*4882a593Smuzhiyun 	case 59:
1097*4882a593Smuzhiyun 		switch (inst_get_field(inst, 21, 30)) {
1098*4882a593Smuzhiyun 		case OP_59_FADDS:
1099*4882a593Smuzhiyun 			fpd_fadds(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
1100*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1101*4882a593Smuzhiyun 			break;
1102*4882a593Smuzhiyun 		case OP_59_FSUBS:
1103*4882a593Smuzhiyun 			fpd_fsubs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
1104*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1105*4882a593Smuzhiyun 			break;
1106*4882a593Smuzhiyun 		case OP_59_FDIVS:
1107*4882a593Smuzhiyun 			fpd_fdivs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
1108*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1109*4882a593Smuzhiyun 			break;
1110*4882a593Smuzhiyun 		case OP_59_FRES:
1111*4882a593Smuzhiyun 			fpd_fres(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
1112*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1113*4882a593Smuzhiyun 			break;
1114*4882a593Smuzhiyun 		case OP_59_FRSQRTES:
1115*4882a593Smuzhiyun 			fpd_frsqrtes(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
1116*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1117*4882a593Smuzhiyun 			break;
1118*4882a593Smuzhiyun 		}
1119*4882a593Smuzhiyun 		switch (inst_get_field(inst, 26, 30)) {
1120*4882a593Smuzhiyun 		case OP_59_FMULS:
1121*4882a593Smuzhiyun 			fpd_fmuls(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c);
1122*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1123*4882a593Smuzhiyun 			break;
1124*4882a593Smuzhiyun 		case OP_59_FMSUBS:
1125*4882a593Smuzhiyun 			fpd_fmsubs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
1126*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1127*4882a593Smuzhiyun 			break;
1128*4882a593Smuzhiyun 		case OP_59_FMADDS:
1129*4882a593Smuzhiyun 			fpd_fmadds(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
1130*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1131*4882a593Smuzhiyun 			break;
1132*4882a593Smuzhiyun 		case OP_59_FNMSUBS:
1133*4882a593Smuzhiyun 			fpd_fnmsubs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
1134*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1135*4882a593Smuzhiyun 			break;
1136*4882a593Smuzhiyun 		case OP_59_FNMADDS:
1137*4882a593Smuzhiyun 			fpd_fnmadds(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
1138*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1139*4882a593Smuzhiyun 			break;
1140*4882a593Smuzhiyun 		}
1141*4882a593Smuzhiyun 		break;
1142*4882a593Smuzhiyun 	case 63:
1143*4882a593Smuzhiyun 		switch (inst_get_field(inst, 21, 30)) {
1144*4882a593Smuzhiyun 		case OP_63_MTFSB0:
1145*4882a593Smuzhiyun 		case OP_63_MTFSB1:
1146*4882a593Smuzhiyun 		case OP_63_MCRFS:
1147*4882a593Smuzhiyun 		case OP_63_MTFSFI:
1148*4882a593Smuzhiyun 			/* XXX need to implement */
1149*4882a593Smuzhiyun 			break;
1150*4882a593Smuzhiyun 		case OP_63_MFFS:
1151*4882a593Smuzhiyun 			/* XXX missing CR */
1152*4882a593Smuzhiyun 			*fpr_d = vcpu->arch.fp.fpscr;
1153*4882a593Smuzhiyun 			break;
1154*4882a593Smuzhiyun 		case OP_63_MTFSF:
1155*4882a593Smuzhiyun 			/* XXX missing fm bits */
1156*4882a593Smuzhiyun 			/* XXX missing CR */
1157*4882a593Smuzhiyun 			vcpu->arch.fp.fpscr = *fpr_b;
1158*4882a593Smuzhiyun 			break;
1159*4882a593Smuzhiyun 		case OP_63_FCMPU:
1160*4882a593Smuzhiyun 		{
1161*4882a593Smuzhiyun 			u32 tmp_cr;
1162*4882a593Smuzhiyun 			u32 cr0_mask = 0xf0000000;
1163*4882a593Smuzhiyun 			u32 cr_shift = inst_get_field(inst, 6, 8) * 4;
1164*4882a593Smuzhiyun 
1165*4882a593Smuzhiyun 			fpd_fcmpu(&vcpu->arch.fp.fpscr, &tmp_cr, fpr_a, fpr_b);
1166*4882a593Smuzhiyun 			cr &= ~(cr0_mask >> cr_shift);
1167*4882a593Smuzhiyun 			cr |= (cr & cr0_mask) >> cr_shift;
1168*4882a593Smuzhiyun 			break;
1169*4882a593Smuzhiyun 		}
1170*4882a593Smuzhiyun 		case OP_63_FCMPO:
1171*4882a593Smuzhiyun 		{
1172*4882a593Smuzhiyun 			u32 tmp_cr;
1173*4882a593Smuzhiyun 			u32 cr0_mask = 0xf0000000;
1174*4882a593Smuzhiyun 			u32 cr_shift = inst_get_field(inst, 6, 8) * 4;
1175*4882a593Smuzhiyun 
1176*4882a593Smuzhiyun 			fpd_fcmpo(&vcpu->arch.fp.fpscr, &tmp_cr, fpr_a, fpr_b);
1177*4882a593Smuzhiyun 			cr &= ~(cr0_mask >> cr_shift);
1178*4882a593Smuzhiyun 			cr |= (cr & cr0_mask) >> cr_shift;
1179*4882a593Smuzhiyun 			break;
1180*4882a593Smuzhiyun 		}
1181*4882a593Smuzhiyun 		case OP_63_FNEG:
1182*4882a593Smuzhiyun 			fpd_fneg(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
1183*4882a593Smuzhiyun 			break;
1184*4882a593Smuzhiyun 		case OP_63_FMR:
1185*4882a593Smuzhiyun 			*fpr_d = *fpr_b;
1186*4882a593Smuzhiyun 			break;
1187*4882a593Smuzhiyun 		case OP_63_FABS:
1188*4882a593Smuzhiyun 			fpd_fabs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
1189*4882a593Smuzhiyun 			break;
1190*4882a593Smuzhiyun 		case OP_63_FCPSGN:
1191*4882a593Smuzhiyun 			fpd_fcpsgn(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
1192*4882a593Smuzhiyun 			break;
1193*4882a593Smuzhiyun 		case OP_63_FDIV:
1194*4882a593Smuzhiyun 			fpd_fdiv(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
1195*4882a593Smuzhiyun 			break;
1196*4882a593Smuzhiyun 		case OP_63_FADD:
1197*4882a593Smuzhiyun 			fpd_fadd(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
1198*4882a593Smuzhiyun 			break;
1199*4882a593Smuzhiyun 		case OP_63_FSUB:
1200*4882a593Smuzhiyun 			fpd_fsub(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
1201*4882a593Smuzhiyun 			break;
1202*4882a593Smuzhiyun 		case OP_63_FCTIW:
1203*4882a593Smuzhiyun 			fpd_fctiw(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
1204*4882a593Smuzhiyun 			break;
1205*4882a593Smuzhiyun 		case OP_63_FCTIWZ:
1206*4882a593Smuzhiyun 			fpd_fctiwz(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
1207*4882a593Smuzhiyun 			break;
1208*4882a593Smuzhiyun 		case OP_63_FRSP:
1209*4882a593Smuzhiyun 			fpd_frsp(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
1210*4882a593Smuzhiyun 			kvmppc_sync_qpr(vcpu, ax_rd);
1211*4882a593Smuzhiyun 			break;
1212*4882a593Smuzhiyun 		case OP_63_FRSQRTE:
1213*4882a593Smuzhiyun 		{
1214*4882a593Smuzhiyun 			double one = 1.0f;
1215*4882a593Smuzhiyun 
1216*4882a593Smuzhiyun 			/* fD = sqrt(fB) */
1217*4882a593Smuzhiyun 			fpd_fsqrt(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
1218*4882a593Smuzhiyun 			/* fD = 1.0f / fD */
1219*4882a593Smuzhiyun 			fpd_fdiv(&vcpu->arch.fp.fpscr, &cr, fpr_d, (u64*)&one, fpr_d);
1220*4882a593Smuzhiyun 			break;
1221*4882a593Smuzhiyun 		}
1222*4882a593Smuzhiyun 		}
1223*4882a593Smuzhiyun 		switch (inst_get_field(inst, 26, 30)) {
1224*4882a593Smuzhiyun 		case OP_63_FMUL:
1225*4882a593Smuzhiyun 			fpd_fmul(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c);
1226*4882a593Smuzhiyun 			break;
1227*4882a593Smuzhiyun 		case OP_63_FSEL:
1228*4882a593Smuzhiyun 			fpd_fsel(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
1229*4882a593Smuzhiyun 			break;
1230*4882a593Smuzhiyun 		case OP_63_FMSUB:
1231*4882a593Smuzhiyun 			fpd_fmsub(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
1232*4882a593Smuzhiyun 			break;
1233*4882a593Smuzhiyun 		case OP_63_FMADD:
1234*4882a593Smuzhiyun 			fpd_fmadd(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
1235*4882a593Smuzhiyun 			break;
1236*4882a593Smuzhiyun 		case OP_63_FNMSUB:
1237*4882a593Smuzhiyun 			fpd_fnmsub(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
1238*4882a593Smuzhiyun 			break;
1239*4882a593Smuzhiyun 		case OP_63_FNMADD:
1240*4882a593Smuzhiyun 			fpd_fnmadd(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
1241*4882a593Smuzhiyun 			break;
1242*4882a593Smuzhiyun 		}
1243*4882a593Smuzhiyun 		break;
1244*4882a593Smuzhiyun 	}
1245*4882a593Smuzhiyun 
1246*4882a593Smuzhiyun #ifdef DEBUG
1247*4882a593Smuzhiyun 	for (i = 0; i < ARRAY_SIZE(vcpu->arch.fp.fpr); i++) {
1248*4882a593Smuzhiyun 		u32 f;
1249*4882a593Smuzhiyun 		kvm_cvt_df(&VCPU_FPR(vcpu, i), &f);
1250*4882a593Smuzhiyun 		dprintk(KERN_INFO "FPR[%d] = 0x%x\n", i, f);
1251*4882a593Smuzhiyun 	}
1252*4882a593Smuzhiyun #endif
1253*4882a593Smuzhiyun 
1254*4882a593Smuzhiyun 	if (rcomp)
1255*4882a593Smuzhiyun 		kvmppc_set_cr(vcpu, cr);
1256*4882a593Smuzhiyun 
1257*4882a593Smuzhiyun 	disable_kernel_fp();
1258*4882a593Smuzhiyun 	preempt_enable();
1259*4882a593Smuzhiyun 
1260*4882a593Smuzhiyun 	return emulated;
1261*4882a593Smuzhiyun }
1262