/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 *
 *  Nov 7, 2000
 *  Modification to allow integration with Linux kernel
 *
 *  Kevin D. Kissell, kevink@mips.com and Carsten Langgard, carstenl@mips.com
 *  Copyright (C) 2000 MIPS Technologies, Inc. All rights reserved.
 */
12*4882a593Smuzhiyun #ifndef __ARCH_MIPS_MATH_EMU_IEEE754_H
13*4882a593Smuzhiyun #define __ARCH_MIPS_MATH_EMU_IEEE754_H
14*4882a593Smuzhiyun
15*4882a593Smuzhiyun #include <linux/compiler.h>
16*4882a593Smuzhiyun #include <asm/byteorder.h>
17*4882a593Smuzhiyun #include <linux/kernel.h>
18*4882a593Smuzhiyun #include <linux/types.h>
19*4882a593Smuzhiyun #include <linux/sched.h>
20*4882a593Smuzhiyun #include <asm/bitfield.h>
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun union ieee754dp {
23*4882a593Smuzhiyun struct {
24*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned int sign:1,
25*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned int bexp:11,
26*4882a593Smuzhiyun __BITFIELD_FIELD(u64 mant:52,
27*4882a593Smuzhiyun ;)))
28*4882a593Smuzhiyun };
29*4882a593Smuzhiyun u64 bits;
30*4882a593Smuzhiyun };
31*4882a593Smuzhiyun
32*4882a593Smuzhiyun union ieee754sp {
33*4882a593Smuzhiyun struct {
34*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned sign:1,
35*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned bexp:8,
36*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned mant:23,
37*4882a593Smuzhiyun ;)))
38*4882a593Smuzhiyun };
39*4882a593Smuzhiyun u32 bits;
40*4882a593Smuzhiyun };
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun /*
43*4882a593Smuzhiyun * single precision (often aka float)
44*4882a593Smuzhiyun */
45*4882a593Smuzhiyun int ieee754sp_class(union ieee754sp x);
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun union ieee754sp ieee754sp_abs(union ieee754sp x);
48*4882a593Smuzhiyun union ieee754sp ieee754sp_neg(union ieee754sp x);
49*4882a593Smuzhiyun
50*4882a593Smuzhiyun union ieee754sp ieee754sp_add(union ieee754sp x, union ieee754sp y);
51*4882a593Smuzhiyun union ieee754sp ieee754sp_sub(union ieee754sp x, union ieee754sp y);
52*4882a593Smuzhiyun union ieee754sp ieee754sp_mul(union ieee754sp x, union ieee754sp y);
53*4882a593Smuzhiyun union ieee754sp ieee754sp_div(union ieee754sp x, union ieee754sp y);
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun union ieee754sp ieee754sp_fint(int x);
56*4882a593Smuzhiyun union ieee754sp ieee754sp_flong(s64 x);
57*4882a593Smuzhiyun union ieee754sp ieee754sp_fdp(union ieee754dp x);
58*4882a593Smuzhiyun union ieee754sp ieee754sp_rint(union ieee754sp x);
59*4882a593Smuzhiyun
60*4882a593Smuzhiyun int ieee754sp_tint(union ieee754sp x);
61*4882a593Smuzhiyun s64 ieee754sp_tlong(union ieee754sp x);
62*4882a593Smuzhiyun
63*4882a593Smuzhiyun int ieee754sp_cmp(union ieee754sp x, union ieee754sp y, int cop, int sig);
64*4882a593Smuzhiyun
65*4882a593Smuzhiyun union ieee754sp ieee754sp_sqrt(union ieee754sp x);
66*4882a593Smuzhiyun
67*4882a593Smuzhiyun union ieee754sp ieee754sp_maddf(union ieee754sp z, union ieee754sp x,
68*4882a593Smuzhiyun union ieee754sp y);
69*4882a593Smuzhiyun union ieee754sp ieee754sp_msubf(union ieee754sp z, union ieee754sp x,
70*4882a593Smuzhiyun union ieee754sp y);
71*4882a593Smuzhiyun union ieee754sp ieee754sp_madd(union ieee754sp z, union ieee754sp x,
72*4882a593Smuzhiyun union ieee754sp y);
73*4882a593Smuzhiyun union ieee754sp ieee754sp_msub(union ieee754sp z, union ieee754sp x,
74*4882a593Smuzhiyun union ieee754sp y);
75*4882a593Smuzhiyun union ieee754sp ieee754sp_nmadd(union ieee754sp z, union ieee754sp x,
76*4882a593Smuzhiyun union ieee754sp y);
77*4882a593Smuzhiyun union ieee754sp ieee754sp_nmsub(union ieee754sp z, union ieee754sp x,
78*4882a593Smuzhiyun union ieee754sp y);
79*4882a593Smuzhiyun int ieee754sp_2008class(union ieee754sp x);
80*4882a593Smuzhiyun union ieee754sp ieee754sp_fmin(union ieee754sp x, union ieee754sp y);
81*4882a593Smuzhiyun union ieee754sp ieee754sp_fmina(union ieee754sp x, union ieee754sp y);
82*4882a593Smuzhiyun union ieee754sp ieee754sp_fmax(union ieee754sp x, union ieee754sp y);
83*4882a593Smuzhiyun union ieee754sp ieee754sp_fmaxa(union ieee754sp x, union ieee754sp y);
84*4882a593Smuzhiyun
85*4882a593Smuzhiyun /*
86*4882a593Smuzhiyun * double precision (often aka double)
87*4882a593Smuzhiyun */
88*4882a593Smuzhiyun int ieee754dp_class(union ieee754dp x);
89*4882a593Smuzhiyun
90*4882a593Smuzhiyun union ieee754dp ieee754dp_add(union ieee754dp x, union ieee754dp y);
91*4882a593Smuzhiyun union ieee754dp ieee754dp_sub(union ieee754dp x, union ieee754dp y);
92*4882a593Smuzhiyun union ieee754dp ieee754dp_mul(union ieee754dp x, union ieee754dp y);
93*4882a593Smuzhiyun union ieee754dp ieee754dp_div(union ieee754dp x, union ieee754dp y);
94*4882a593Smuzhiyun
95*4882a593Smuzhiyun union ieee754dp ieee754dp_abs(union ieee754dp x);
96*4882a593Smuzhiyun union ieee754dp ieee754dp_neg(union ieee754dp x);
97*4882a593Smuzhiyun
98*4882a593Smuzhiyun union ieee754dp ieee754dp_fint(int x);
99*4882a593Smuzhiyun union ieee754dp ieee754dp_flong(s64 x);
100*4882a593Smuzhiyun union ieee754dp ieee754dp_fsp(union ieee754sp x);
101*4882a593Smuzhiyun union ieee754dp ieee754dp_rint(union ieee754dp x);
102*4882a593Smuzhiyun
103*4882a593Smuzhiyun int ieee754dp_tint(union ieee754dp x);
104*4882a593Smuzhiyun s64 ieee754dp_tlong(union ieee754dp x);
105*4882a593Smuzhiyun
106*4882a593Smuzhiyun int ieee754dp_cmp(union ieee754dp x, union ieee754dp y, int cop, int sig);
107*4882a593Smuzhiyun
108*4882a593Smuzhiyun union ieee754dp ieee754dp_sqrt(union ieee754dp x);
109*4882a593Smuzhiyun
110*4882a593Smuzhiyun union ieee754dp ieee754dp_maddf(union ieee754dp z, union ieee754dp x,
111*4882a593Smuzhiyun union ieee754dp y);
112*4882a593Smuzhiyun union ieee754dp ieee754dp_msubf(union ieee754dp z, union ieee754dp x,
113*4882a593Smuzhiyun union ieee754dp y);
114*4882a593Smuzhiyun union ieee754dp ieee754dp_madd(union ieee754dp z, union ieee754dp x,
115*4882a593Smuzhiyun union ieee754dp y);
116*4882a593Smuzhiyun union ieee754dp ieee754dp_msub(union ieee754dp z, union ieee754dp x,
117*4882a593Smuzhiyun union ieee754dp y);
118*4882a593Smuzhiyun union ieee754dp ieee754dp_nmadd(union ieee754dp z, union ieee754dp x,
119*4882a593Smuzhiyun union ieee754dp y);
120*4882a593Smuzhiyun union ieee754dp ieee754dp_nmsub(union ieee754dp z, union ieee754dp x,
121*4882a593Smuzhiyun union ieee754dp y);
122*4882a593Smuzhiyun int ieee754dp_2008class(union ieee754dp x);
123*4882a593Smuzhiyun union ieee754dp ieee754dp_fmin(union ieee754dp x, union ieee754dp y);
124*4882a593Smuzhiyun union ieee754dp ieee754dp_fmina(union ieee754dp x, union ieee754dp y);
125*4882a593Smuzhiyun union ieee754dp ieee754dp_fmax(union ieee754dp x, union ieee754dp y);
126*4882a593Smuzhiyun union ieee754dp ieee754dp_fmaxa(union ieee754dp x, union ieee754dp y);
127*4882a593Smuzhiyun
128*4882a593Smuzhiyun
/*
 * The 6 classes of floating point number: normal, zero, denormal,
 * infinity, signalling NaN and quiet NaN.
 */
enum {
	IEEE754_CLASS_NORM	= 0x00,
	IEEE754_CLASS_ZERO	= 0x01,
	IEEE754_CLASS_DNORM	= 0x02,
	IEEE754_CLASS_INF	= 0x03,
	IEEE754_CLASS_SNAN	= 0x04,
	IEEE754_CLASS_QNAN	= 0x05,
};

/*
 * exception numbers
 *
 * One bit per exception, so several can be OR-ed into a single mask.
 */
#define IEEE754_INEXACT			0x01
#define IEEE754_UNDERFLOW		0x02
#define IEEE754_OVERFLOW		0x04
#define IEEE754_ZERO_DIVIDE		0x08
#define IEEE754_INVALID_OPERATION	0x10

/*
 * cmp operators
 *
 * One bit per relation (less than, equal, greater than, unordered), so
 * several can be OR-ed into a single mask.
 */
#define IEEE754_CLT	0x01
#define IEEE754_CEQ	0x02
#define IEEE754_CGT	0x04
#define IEEE754_CUN	0x08

154*4882a593Smuzhiyun /*
155*4882a593Smuzhiyun * The control status register
156*4882a593Smuzhiyun */
157*4882a593Smuzhiyun struct _ieee754_csr {
158*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned fcc:7, /* condition[7:1] */
159*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned nod:1, /* set 1 for no denormals */
160*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned c:1, /* condition[0] */
161*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned pad0:3,
162*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned abs2008:1, /* IEEE 754-2008 ABS/NEG.fmt */
163*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned nan2008:1, /* IEEE 754-2008 NaN mode */
164*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned cx:6, /* exceptions this operation */
165*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned mx:5, /* exception enable mask */
166*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned sx:5, /* exceptions total */
167*4882a593Smuzhiyun __BITFIELD_FIELD(unsigned rm:2, /* current rounding mode */
168*4882a593Smuzhiyun ;))))))))))
169*4882a593Smuzhiyun };
/*
 * Lvalue giving bit-field access to the current task's FCR31 image
 * (current->thread.fpu.fcr31) through struct _ieee754_csr.
 */
#define ieee754_csr (*(struct _ieee754_csr *)(&current->thread.fpu.fcr31))

ieee754_getrm(void)172*4882a593Smuzhiyun static inline unsigned int ieee754_getrm(void)
173*4882a593Smuzhiyun {
174*4882a593Smuzhiyun return (ieee754_csr.rm);
175*4882a593Smuzhiyun }
176*4882a593Smuzhiyun
ieee754_setrm(unsigned int rm)177*4882a593Smuzhiyun static inline unsigned int ieee754_setrm(unsigned int rm)
178*4882a593Smuzhiyun {
179*4882a593Smuzhiyun return (ieee754_csr.rm = rm);
180*4882a593Smuzhiyun }
181*4882a593Smuzhiyun
182*4882a593Smuzhiyun /*
183*4882a593Smuzhiyun * get current exceptions
184*4882a593Smuzhiyun */
ieee754_getcx(void)185*4882a593Smuzhiyun static inline unsigned int ieee754_getcx(void)
186*4882a593Smuzhiyun {
187*4882a593Smuzhiyun return (ieee754_csr.cx);
188*4882a593Smuzhiyun }
189*4882a593Smuzhiyun
190*4882a593Smuzhiyun /* test for current exception condition
191*4882a593Smuzhiyun */
ieee754_cxtest(unsigned int n)192*4882a593Smuzhiyun static inline int ieee754_cxtest(unsigned int n)
193*4882a593Smuzhiyun {
194*4882a593Smuzhiyun return (ieee754_csr.cx & n);
195*4882a593Smuzhiyun }
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun /*
198*4882a593Smuzhiyun * get sticky exceptions
199*4882a593Smuzhiyun */
ieee754_getsx(void)200*4882a593Smuzhiyun static inline unsigned int ieee754_getsx(void)
201*4882a593Smuzhiyun {
202*4882a593Smuzhiyun return (ieee754_csr.sx);
203*4882a593Smuzhiyun }
204*4882a593Smuzhiyun
205*4882a593Smuzhiyun /* clear sticky conditions
206*4882a593Smuzhiyun */
ieee754_clrsx(void)207*4882a593Smuzhiyun static inline unsigned int ieee754_clrsx(void)
208*4882a593Smuzhiyun {
209*4882a593Smuzhiyun return (ieee754_csr.sx = 0);
210*4882a593Smuzhiyun }
211*4882a593Smuzhiyun
212*4882a593Smuzhiyun /* test for sticky exception condition
213*4882a593Smuzhiyun */
ieee754_sxtest(unsigned int n)214*4882a593Smuzhiyun static inline int ieee754_sxtest(unsigned int n)
215*4882a593Smuzhiyun {
216*4882a593Smuzhiyun return (ieee754_csr.sx & n);
217*4882a593Smuzhiyun }
218*4882a593Smuzhiyun
/* debugging */
union ieee754sp ieee754sp_dump(char *s, union ieee754sp x);
union ieee754dp ieee754dp_dump(char *s, union ieee754dp x);

/*
 * Indices into the special-value tables.
 *
 * Signed values come in pairs with the negative entry directly after the
 * positive one, and the IEEE 754-2008 quiet NaN directly follows the
 * legacy one; the accessor macros rely on that numbering.
 */
#define IEEE754_SPCVAL_PZERO		0	/* +0.0 */
#define IEEE754_SPCVAL_NZERO		1	/* -0.0 */
#define IEEE754_SPCVAL_PONE		2	/* +1.0 */
#define IEEE754_SPCVAL_NONE		3	/* -1.0 */
#define IEEE754_SPCVAL_PTEN		4	/* +10.0 */
#define IEEE754_SPCVAL_NTEN		5	/* -10.0 */
#define IEEE754_SPCVAL_PINFINITY	6	/* +inf */
#define IEEE754_SPCVAL_NINFINITY	7	/* -inf */
#define IEEE754_SPCVAL_INDEF_LEG	8	/* legacy quiet NaN */
#define IEEE754_SPCVAL_INDEF_2008	9	/* IEEE 754-2008 quiet NaN */
#define IEEE754_SPCVAL_PMAX		10	/* +max norm */
#define IEEE754_SPCVAL_NMAX		11	/* -max norm */
#define IEEE754_SPCVAL_PMIN		12	/* +min norm */
#define IEEE754_SPCVAL_NMIN		13	/* -min norm */
#define IEEE754_SPCVAL_PMIND		14	/* +min denorm */
#define IEEE754_SPCVAL_NMIND		15	/* -min denorm */
#define IEEE754_SPCVAL_P1E31		16	/* + 1.0e31 */
#define IEEE754_SPCVAL_P1E63		17	/* + 1.0e63 */

242*4882a593Smuzhiyun extern const union ieee754dp __ieee754dp_spcvals[];
243*4882a593Smuzhiyun extern const union ieee754sp __ieee754sp_spcvals[];
244*4882a593Smuzhiyun #define ieee754dp_spcvals ((const union ieee754dp *)__ieee754dp_spcvals)
245*4882a593Smuzhiyun #define ieee754sp_spcvals ((const union ieee754sp *)__ieee754sp_spcvals)
246*4882a593Smuzhiyun
/*
 * Special double-precision constants, read from ieee754dp_spcvals[].
 *
 * For the signed variants, sn is added to the index of the positive
 * entry; the IEEE754_SPCVAL_* numbering puts each negative value directly
 * after its positive twin, so sn must be 0 (positive) or 1 (negative).
 * ieee754dp_indef() likewise adds ieee754_csr.nan2008 to choose between
 * the legacy and the IEEE 754-2008 quiet NaN.
 */
#define ieee754dp_inf(sn)     (ieee754dp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
#define ieee754dp_zero(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
#define ieee754dp_one(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
#define ieee754dp_ten(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
#define ieee754dp_indef()	(ieee754dp_spcvals[IEEE754_SPCVAL_INDEF_LEG + \
						   ieee754_csr.nan2008])
#define ieee754dp_max(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
#define ieee754dp_min(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
#define ieee754dp_mind(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
#define ieee754dp_1e31()	(ieee754dp_spcvals[IEEE754_SPCVAL_P1E31])
#define ieee754dp_1e63()	(ieee754dp_spcvals[IEEE754_SPCVAL_P1E63])

/*
 * Special single-precision constants, read from ieee754sp_spcvals[].
 *
 * For the signed variants, sn is added to the index of the positive
 * entry; the IEEE754_SPCVAL_* numbering puts each negative value directly
 * after its positive twin, so sn must be 0 (positive) or 1 (negative).
 * ieee754sp_indef() likewise adds ieee754_csr.nan2008 to choose between
 * the legacy and the IEEE 754-2008 quiet NaN.
 */
#define ieee754sp_inf(sn)     (ieee754sp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
#define ieee754sp_zero(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
#define ieee754sp_one(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
#define ieee754sp_ten(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
#define ieee754sp_indef()	(ieee754sp_spcvals[IEEE754_SPCVAL_INDEF_LEG + \
						   ieee754_csr.nan2008])
#define ieee754sp_max(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
#define ieee754sp_min(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
#define ieee754sp_mind(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
#define ieee754sp_1e31()	(ieee754sp_spcvals[IEEE754_SPCVAL_P1E31])
#define ieee754sp_1e63()	(ieee754sp_spcvals[IEEE754_SPCVAL_P1E63])

274*4882a593Smuzhiyun /*
275*4882a593Smuzhiyun * Indefinite integer value
276*4882a593Smuzhiyun */
ieee754si_indef(void)277*4882a593Smuzhiyun static inline int ieee754si_indef(void)
278*4882a593Smuzhiyun {
279*4882a593Smuzhiyun return ieee754_csr.nan2008 ? 0 : INT_MAX;
280*4882a593Smuzhiyun }
281*4882a593Smuzhiyun
ieee754di_indef(void)282*4882a593Smuzhiyun static inline s64 ieee754di_indef(void)
283*4882a593Smuzhiyun {
284*4882a593Smuzhiyun return ieee754_csr.nan2008 ? 0 : S64_MAX;
285*4882a593Smuzhiyun }
286*4882a593Smuzhiyun
287*4882a593Smuzhiyun /*
288*4882a593Smuzhiyun * Overflow integer value
289*4882a593Smuzhiyun */
ieee754si_overflow(int xs)290*4882a593Smuzhiyun static inline int ieee754si_overflow(int xs)
291*4882a593Smuzhiyun {
292*4882a593Smuzhiyun return ieee754_csr.nan2008 && xs ? INT_MIN : INT_MAX;
293*4882a593Smuzhiyun }
294*4882a593Smuzhiyun
ieee754di_overflow(int xs)295*4882a593Smuzhiyun static inline s64 ieee754di_overflow(int xs)
296*4882a593Smuzhiyun {
297*4882a593Smuzhiyun return ieee754_csr.nan2008 && xs ? S64_MIN : S64_MAX;
298*4882a593Smuzhiyun }
299*4882a593Smuzhiyun
/* result types for xctx.rt */
#define IEEE754_RT_SP	0
#define IEEE754_RT_DP	1
#define IEEE754_RT_XP	2
#define IEEE754_RT_SI	3
#define IEEE754_RT_DI	4

/* compat: the *_fix() names are aliases for the *_tint() conversions */
#define ieee754dp_fix(x)	ieee754dp_tint(x)
#define ieee754sp_fix(x)	ieee754sp_tint(x)

311*4882a593Smuzhiyun #endif /* __ARCH_MIPS_MATH_EMU_IEEE754_H */
312