xref: /OK3568_Linux_fs/kernel/arch/parisc/math-emu/sgl_float.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0-or-later */
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Linux/PA-RISC Project (http://www.parisc-linux.org/)
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Floating-point emulation code
6*4882a593Smuzhiyun  *  Copyright (C) 2001 Hewlett-Packard (Paul Bame) <bame@debian.org>
7*4882a593Smuzhiyun  */
8*4882a593Smuzhiyun 
/* Fail the build with an explicit diagnostic when this PA-only header is
 * pulled into a build that defines __NO_PA_HDRS. */
#ifdef __NO_PA_HDRS
#error "PA header file -- do not include this header file for non-PA builds."
#endif
12*4882a593Smuzhiyun 
/* 32-bit word accessors: the first word maps onto Sall(); the second,
 * third and fourth words all expand to dummy_location. */
#define Sgl_firstword(sgl)	Sall(sgl)
#define Sgl_secondword(sgl)	dummy_location
#define Sgl_thirdword(sgl)	dummy_location
#define Sgl_fourthword(sgl)	dummy_location

/* Field accessors; each one forwards to the S* primitive of the same name. */
#define Sgl_sign(sgl)			Ssign(sgl)
#define Sgl_exponent(sgl)		Sexponent(sgl)
#define Sgl_signexponent(sgl)		Ssignexponent(sgl)
#define Sgl_mantissa(sgl)		Smantissa(sgl)
#define Sgl_exponentmantissa(sgl)	Sexponentmantissa(sgl)
#define Sgl_all(sgl)			Sall(sgl)
25*4882a593Smuzhiyun 
/* Sgl_and_signs: the sign bit of src1dst becomes (sign1 AND sign2).
 * Sgl_or_signs:  the sign bit of src1dst becomes (sign1 OR sign2).
 * Every other bit of src1dst is left as it was. */
#define Sgl_and_signs(src1dst, src2) \
    Sall(src1dst) = Sall(src1dst) & (~((unsigned int)1 << 31) | Sall(src2))
#define Sgl_or_signs(src1dst, src2) \
    Sall(src1dst) = Sall(src1dst) | (((unsigned int)1 << 31) & Sall(src2))
32*4882a593Smuzhiyun 
/* The hidden bit sits in the lowest exponent position, so both "set hidden"
 * variants deposit the value 1 into the (sign+)exponent field. */
#define Sgl_clear_exponent_set_hidden(sgl)	Deposit_sexponent(sgl,1)
#define Sgl_clear_signexponent_set_hidden(sgl)	Deposit_ssignexponent(sgl,1)

/* Mask-based clears: sign bit only, or sign plus exponent (keeps the low
 * 23 bits). */
#define Sgl_clear_sign(sgl)		Sall(sgl) &= ~((unsigned int)1<<31)
#define Sgl_clear_signexponent(sgl)	Sall(sgl) &= 0x007fffff
39*4882a593Smuzhiyun 
/* varamount must be less than 32 for the next three functions.
 * varamount is parenthesized so that compound expressions (e.g. "k & 3")
 * are used as a whole shift count. */
#define Sgl_rightshift(srcdst, varamount)	\
    Sall(srcdst) >>= (varamount)
#define Sgl_leftshift(srcdst, varamount)	\
    Sall(srcdst) <<= (varamount)
/* Shift exponent+mantissa right by varamount while keeping the sign bit
 * of srcdst in place. */
#define Sgl_rightshift_exponentmantissa(srcdst, varamount) \
    Sall(srcdst) = \
	(Sexponentmantissa(srcdst) >> (varamount)) | \
	(Sall(srcdst) & ((unsigned int)1<<31))
49*4882a593Smuzhiyun 
/* Shift the (left:right) pair left by one; the upper word of the shifted
 * pair is stored in result. */
#define Sgl_leftshiftby1_withextent(left,right,result) \
    Shiftdouble(Sall(left),Extall(right),31,Sall(result))

/* Shift the (left:right) pair right by one; the new extension word is stored
 * in dst.  The destination used to be hard-wired to `right`, silently
 * ignoring dst; passing the same object for right and dst behaves exactly
 * as before. */
#define Sgl_rightshiftby1_withextent(left,right,dst)		\
    Shiftdouble(Sall(left),Extall(right),1,Extall(dst))
/* Right shift by one through a signed (int) cast of the word. */
#define Sgl_arithrightshiftby1(srcdst)	\
    Sall(srcdst) = (int)Sall(srcdst) >> 1
57*4882a593Smuzhiyun 
/* Sign bit, sign-extended, for use with an integer destination. */
#define Sgl_signextendedsign(sgl)	Ssignedsign(sgl)

/* Value of the hidden bit. */
#define Sgl_isone_hidden(sgl)		(Shidden(sgl))
/* Step the whole word up or down by one. */
#define Sgl_increment(sgl)		++Sall(sgl)
#define Sgl_decrement(sgl)		--Sall(sgl)
/* Deposit (word + 1) into the mantissa field. */
#define Sgl_increment_mantissa(sgl)	Deposit_smantissa(sgl,sgl+1)
66*4882a593Smuzhiyun 
/* Predicates that hold when the named bit is set. */
#define Sgl_isone_sign(sgl)		(Is_ssign(sgl)!=0)
#define Sgl_isone_hiddenoverflow(sgl)	(Is_shiddenoverflow(sgl)!=0)
#define Sgl_isone_lowmantissa(sgl)	(Is_slow(sgl)!=0)
#define Sgl_isone_signaling(sgl)	(Is_ssignaling(sgl)!=0)
/* Holds when the Ssignalingnan() field reads 0x1ff. */
#define Sgl_is_signalingnan(sgl)	(Ssignalingnan(sgl)==0x1ff)

/* Predicates that hold when the named field is nonzero. */
#define Sgl_isnotzero(sgl)		(Sall(sgl)!=0)
#define Sgl_isnotzero_hiddenhigh7mantissa(sgl)	(Shiddenhigh7mantissa(sgl)!=0)
#define Sgl_isnotzero_low4(sgl)		(Slow4(sgl)!=0)
#define Sgl_isnotzero_exponent(sgl)	(Sexponent(sgl)!=0)
#define Sgl_isnotzero_mantissa(sgl)	(Smantissa(sgl)!=0)
#define Sgl_isnotzero_exponentmantissa(sgl)	(Sexponentmantissa(sgl)!=0)
/* Predicates that hold when the named bit or field is zero. */
#define Sgl_iszero(sgl)				(Sall(sgl)==0)
#define Sgl_iszero_signaling(sgl)		(Is_ssignaling(sgl)==0)
#define Sgl_iszero_hidden(sgl)			(Is_shidden(sgl)==0)
#define Sgl_iszero_hiddenoverflow(sgl)		(Is_shiddenoverflow(sgl)==0)
#define Sgl_iszero_hiddenhigh3mantissa(sgl)	(Shiddenhigh3mantissa(sgl)==0)
#define Sgl_iszero_hiddenhigh7mantissa(sgl)	(Shiddenhigh7mantissa(sgl)==0)
#define Sgl_iszero_sign(sgl)			(Is_ssign(sgl)==0)
#define Sgl_iszero_exponent(sgl)		(Sexponent(sgl)==0)
#define Sgl_iszero_mantissa(sgl)		(Smantissa(sgl)==0)
#define Sgl_iszero_exponentmantissa(sgl)	(Sexponentmantissa(sgl)==0)
/* Exponent-only tests against SGL_INFINITY_EXPONENT. */
#define Sgl_isinfinity_exponent(sgl) \
    (Sgl_exponent(sgl)==SGL_INFINITY_EXPONENT)
#define Sgl_isnotinfinity_exponent(sgl) \
    (Sgl_exponent(sgl)!=SGL_INFINITY_EXPONENT)

/* Infinity: infinity exponent with a zero mantissa. */
#define Sgl_isinfinity(sgl) \
    (Sgl_exponent(sgl)==SGL_INFINITY_EXPONENT && Sgl_mantissa(sgl)==0)
/* NaN: infinity exponent with a nonzero mantissa. */
#define Sgl_isnan(sgl) \
    (Sgl_exponent(sgl)==SGL_INFINITY_EXPONENT && Sgl_mantissa(sgl)!=0)
/* Logical complement of the NaN test. */
#define Sgl_isnotnan(sgl) \
    (!(Sgl_exponent(sgl)==SGL_INFINITY_EXPONENT && Sgl_mantissa(sgl)!=0))
/* Whole-word comparisons of two operands through Sall(). */
#define Sgl_islessthan(sgl_op1,sgl_op2)    (Sall(sgl_op1) < Sall(sgl_op2))
#define Sgl_isgreaterthan(sgl_op1,sgl_op2) (Sall(sgl_op2) < Sall(sgl_op1))
#define Sgl_isnotlessthan(sgl_op1,sgl_op2) (!(Sall(sgl_op1) < Sall(sgl_op2)))
#define Sgl_isequal(sgl_op1,sgl_op2)       (Sall(sgl_op1) == Sall(sgl_op2))
116*4882a593Smuzhiyun 
/* Fixed-count left shifts of the whole word. */
#define Sgl_leftshiftby8(sgl)	Sall(sgl) <<= 8
#define Sgl_leftshiftby4(sgl)	Sall(sgl) <<= 4
#define Sgl_leftshiftby3(sgl)	Sall(sgl) <<= 3
#define Sgl_leftshiftby2(sgl)	Sall(sgl) <<= 2
#define Sgl_leftshiftby1(sgl)	Sall(sgl) <<= 1
/* Fixed-count right shifts of the whole word. */
#define Sgl_rightshiftby1(sgl)	Sall(sgl) >>= 1
#define Sgl_rightshiftby4(sgl)	Sall(sgl) >>= 4
#define Sgl_rightshiftby8(sgl)	Sall(sgl) >>= 8
133*4882a593Smuzhiyun 
/* Compare two already sign-stripped words:
 *   unsigned int signlessleft, signlessright;
 * Both arguments are parenthesized so that masked expressions such as
 * "a & 0x7fffffff" compare as a whole instead of being split by the
 * higher precedence of '<'. */
#define Sgl_ismagnitudeless(signlessleft,signlessright)			\
      ((signlessleft) < (signlessright))


/* Copy the exponent+mantissa field of source into the integer dest. */
#define Sgl_copytoint_exponentmantissa(source,dest)     \
    (dest) = Sexponentmantissa(source)
141*4882a593Smuzhiyun 
/* A quiet NaN has the high mantissa bit clear and at least one other bit
 * (in this case the adjacent bit) set. */
/* Deposit 1 into the two-bit field written by Deposit_shigh2mantissa(). */
#define Sgl_set_quiet(sgl)		Deposit_shigh2mantissa(sgl,1)
/* Field setters; each forwards to the matching Deposit_* primitive. */
#define Sgl_set_exponent(sgl,exp)	Deposit_sexponent(sgl,exp)

#define Sgl_set_mantissa(dest,value)	Deposit_smantissa(dest,value)
#define Sgl_set_exponentmantissa(dest,value) \
    Deposit_sexponentmantissa(dest,value)
150*4882a593Smuzhiyun 
/*  An infinity is represented with the max exponent and a zero mantissa */
#define Sgl_setinfinity_exponent(sgl_value) \
    Deposit_sexponent(sgl_value,SGL_INFINITY_EXPONENT)
#define Sgl_setinfinity_exponentmantissa(sgl_value)	\
    Deposit_sexponentmantissa(sgl_value, \
	(SGL_INFINITY_EXPONENT << (32-(1+SGL_EXP_LENGTH))))
/* Overwrite the whole word with +infinity. */
#define Sgl_setinfinitypositive(sgl_value)		\
    Sall(sgl_value) = (SGL_INFINITY_EXPONENT << (32-(1+SGL_EXP_LENGTH)))
/* Overwrite the whole word with -infinity. */
#define Sgl_setinfinitynegative(sgl_value)		\
    Sall(sgl_value) = ((SGL_INFINITY_EXPONENT << (32-(1+SGL_EXP_LENGTH))) \
		       | ((unsigned int)1<<31))
/* Overwrite the whole word with an infinity whose sign bit is `sign`
 * (0 or 1).  `sign` is parenthesized before the cast so that a compound
 * expression such as "a ^ b" is converted and shifted as a whole. */
#define Sgl_setinfinity(sgl_value,sign)					\
    Sall(sgl_value) = ((SGL_INFINITY_EXPONENT << (32-(1+SGL_EXP_LENGTH))) | \
		       ((unsigned int)(sign) << 31))
/* Deposit-based setters for the high four bits, the sign bit and the low
 * mantissa bit. */
#define Sgl_sethigh4bits(sgl, extsign)	Deposit_shigh4(sgl,extsign)
#define Sgl_set_sign(sgl,sign)		Deposit_ssign(sgl,sign)
#define Sgl_invert_sign(sgl)		Deposit_ssign(sgl,~Ssign(sgl))
#define Sgl_setone_sign(sgl)		Deposit_ssign(sgl,1)
#define Sgl_setone_lowmantissa(sgl)	Deposit_slow(sgl,1)

/* Mask-based field clears. */
#define Sgl_setzero_sign(sgl)			Sall(sgl) &= 0x7fffffff
#define Sgl_setzero_exponent(sgl)		Sall(sgl) &= 0x807fffff
#define Sgl_setzero_mantissa(sgl)		Sall(sgl) &= 0xff800000
#define Sgl_setzero_exponentmantissa(sgl)	Sall(sgl) &= 0x80000000

/* Whole-word +0 and -0. */
#define Sgl_setzero(sgl)		Sall(sgl) = 0
#define Sgl_setnegativezero(sgl)	Sall(sgl) = (unsigned int)1 << 31
178*4882a593Smuzhiyun 
/* Use following macro for both overflow & underflow conditions.
 * `op` is one of the tokens below: ovfl subtracts SGL_WRAP from the
 * exponent, unfl adds it.  `exponent` is parenthesized so a compound
 * expression is adjusted as a whole. */
#define ovfl -
#define unfl +
#define Sgl_setwrapped_exponent(sgl_value,exponent,op) \
    Deposit_sexponent(sgl_value,((exponent) op SGL_WRAP))
184*4882a593Smuzhiyun 
/* Largest finite magnitude: exponent field SGL_EMAX+SGL_BIAS with every
 * mantissa bit set; the sign bit is clear / set respectively. */
#define Sgl_setlargestpositive(sgl_value) 				\
    Sall(sgl_value) = (((SGL_EMAX+SGL_BIAS) << (32-(1+SGL_EXP_LENGTH)))	\
                      | ((1<<(32-(1+SGL_EXP_LENGTH))) - 1 ))
#define Sgl_setlargestnegative(sgl_value)				\
    Sall(sgl_value) = (((SGL_EMAX+SGL_BIAS) << (32-(1+SGL_EXP_LENGTH)))	\
                      | ((1<<(32-(1+SGL_EXP_LENGTH))) - 1 )		\
		      | ((unsigned int)1<<31))

/* Sign bit plus infinity exponent.  The value is converted to unsigned
 * before shifting: shifting a signed int into the sign bit is undefined. */
#define Sgl_setnegativeinfinity(sgl_value)	\
    Sall(sgl_value) = 				\
    ((unsigned int)((1<<SGL_EXP_LENGTH) | SGL_INFINITY_EXPONENT)	\
	<< (32-(1+SGL_EXP_LENGTH)))
/* Largest finite magnitude with sign bit `sign` (0 or 1); `sign` is
 * parenthesized so compound expressions are cast and shifted whole. */
#define Sgl_setlargest(sgl_value,sign) 					\
    Sall(sgl_value) = (((unsigned int)(sign) << 31) |			\
        (((SGL_EMAX+SGL_BIAS) << (32-(1+SGL_EXP_LENGTH)))		\
	  | ((1 << (32-(1+SGL_EXP_LENGTH))) - 1 )))
/* Largest finite magnitude, keeping the sign bit already in sgl_value. */
#define Sgl_setlargest_exponentmantissa(sgl_value)			\
    Sall(sgl_value) = ((Sall(sgl_value) & ((unsigned int)1<<31)) |	\
        (((SGL_EMAX+SGL_BIAS) << (32-(1+SGL_EXP_LENGTH)))		\
	  | ((1 << (32-(1+SGL_EXP_LENGTH))) - 1 )))
204*4882a593Smuzhiyun 
/* The high bit is always zero so arithmetic or logical shifts will work.
 *
 * Shift srcdst right by `shift` and store the bits shifted out,
 * left-justified, in extent.  For shift >= 32 the whole word is moved into
 * extent and srcdst becomes zero.  A shift of zero moves nothing out, so
 * extent is cleared (the plain expression would shift by 32, which is
 * undefined).  The if/else shape is kept so existing call sites, with or
 * without a trailing semicolon, still compile. */
#define Sgl_right_align(srcdst,shift,extent)				\
    /* sgl_floating_point srcdst; int shift; extension extent */	\
    if ((shift) < 32) {							\
	Extall(extent) = (shift) ? Sall(srcdst) << (32-(shift)) : 0;	\
    	Sall(srcdst) >>= (shift);					\
    }									\
    else {								\
	Extall(extent) = Sall(srcdst);					\
	Sall(srcdst) = 0;						\
    }
/* Value accessors forwarding to the S* primitives of the same name. */
#define Sgl_hiddenhigh3mantissa(sgl)	Shiddenhigh3mantissa(sgl)
#define Sgl_hidden(sgl)			Shidden(sgl)
#define Sgl_lowmantissa(sgl)		Slow(sgl)
219*4882a593Smuzhiyun 
/* The left argument is never smaller than the right argument */
#define Sgl_subtract(sgl_left,sgl_right,sgl_result) \
    Sall(sgl_result) = Sall(sgl_left) - Sall(sgl_right)

/* Subtract right augmented with extension from left augmented with zeros and
 * store into result and extension.
 *   sgl_floating_point left,right,result; extension extent
 * The extension is negated in place; a nonzero negated extension means a
 * borrow, so one more is taken from result.  The body is wrapped in
 * do { } while (0) so that the macro is a single statement (it previously
 * expanded to two, which broke under an unbraced if). */
#define Sgl_subtract_withextension(left,right,extent,result)		\
    do {								\
	Sgl_subtract(left,right,result);				\
	if((Extall(extent) = 0-Extall(extent)))				\
	    Sall(result) = Sall(result)-1;				\
    } while (0)

#define Sgl_addition(sgl_left,sgl_right,sgl_result) \
    Sall(sgl_result) = Sall(sgl_left) + Sall(sgl_right)
234*4882a593Smuzhiyun 
/* result (a plain integer lvalue) = left XOR right.  The expansion carries
 * its own terminating semicolon. */
#define Sgl_xortointp1(left,right,result) \
    result = Sall(left) XOR Sall(right);

/* result = left (a plain integer) XOR right. */
#define Sgl_xorfromintp1(left,right,result) \
    Sall(result) = left XOR Sall(right)
240*4882a593Smuzhiyun 
/* Overwrite dest with a NaN pattern: exponent field (SGL_EMAX+SGL_BIAS)+1
 * plus exactly one mantissa bit -- the bit just below the top mantissa bit
 * for the quiet NaN, the top mantissa bit for the signaling NaN. */
#define Sgl_makequietnan(dest) \
    Sall(dest) = ((SGL_EMAX+SGL_BIAS)+1)<< (32-(1+SGL_EXP_LENGTH)) \
                 | (1<<(32-(1+SGL_EXP_LENGTH+2)))
#define Sgl_makesignalingnan(dest) \
    Sall(dest) = ((SGL_EMAX+SGL_BIAS)+1)<< (32-(1+SGL_EXP_LENGTH)) \
                 | (1<<(32-(1+SGL_EXP_LENGTH+1)))
248*4882a593Smuzhiyun 
/* Shift sgl_opnd left until its hidden bit is set, decrementing exponent by
 * the number of positions shifted: whole bytes first, then one optional
 * nibble, then single bits.
 * NOTE(review): presumably sgl_opnd must be nonzero -- shifting a zero word
 * never sets the tested bits; confirm against callers.
 * The three statements are enclosed in one brace block so the macro acts as
 * a single statement (e.g. under an unbraced if); the expansion still ends
 * in '}' as before. */
#define Sgl_normalize(sgl_opnd,exponent)			\
    {								\
	while(Sgl_iszero_hiddenhigh7mantissa(sgl_opnd)) {	\
		Sgl_leftshiftby8(sgl_opnd);			\
		exponent -= 8;					\
	}							\
	if(Sgl_iszero_hiddenhigh3mantissa(sgl_opnd)) {		\
		Sgl_leftshiftby4(sgl_opnd);			\
		exponent -= 4;					\
	}							\
	while(Sgl_iszero_hidden(sgl_opnd)) {			\
		Sgl_leftshiftby1(sgl_opnd);			\
		exponent -= 1;					\
	}							\
    }
262*4882a593Smuzhiyun 
/* Replace sgl_opnd with its overflow result for the current rounding mode:
 * round-to-nearest gives infinity and round-to-zero gives the largest
 * finite value, both through the *_exponentmantissa setters; the directed
 * modes give infinity in their own direction and the largest finite value
 * in the other.  Rounding_mode() is evaluated once. */
#define Sgl_setoverflow(sgl_opnd)				\
	switch (Rounding_mode()) {				\
		case ROUNDNEAREST:				\
			Sgl_setinfinity_exponentmantissa(sgl_opnd); \
			break;					\
		case ROUNDZERO:					\
			Sgl_setlargest_exponentmantissa(sgl_opnd); \
			break;					\
		case ROUNDPLUS:					\
			if (Sgl_isone_sign(sgl_opnd)) {		\
				Sgl_setlargestnegative(sgl_opnd); \
			} else {				\
				Sgl_setinfinitypositive(sgl_opnd); \
			}					\
			break;					\
		case ROUNDMINUS:				\
			if (Sgl_iszero_sign(sgl_opnd)) {	\
				Sgl_setlargestpositive(sgl_opnd); \
			} else {				\
				Sgl_setinfinitynegative(sgl_opnd); \
			}					\
			break;					\
	}
288*4882a593Smuzhiyun 
/* Denormalize opnd for a result exponent of `exponent` (expected <= 0):
 * clear sign and exponent, set the hidden bit, then shift the word right by
 * 1-exponent.  guard receives the last bit shifted out, sticky is OR-ed with
 * the bits below it, and inexact is guard|sticky.  When exponent is below
 * 1-SGL_P the word is OR-ed into sticky and opnd becomes zero.
 * `exponent` is parenthesized at every use so a compound expression is
 * negated / subtracted as a whole, and the body is one brace block so the
 * macro acts as a single statement; the expansion still ends in '}'. */
#define Sgl_denormalize(opnd,exponent,guard,sticky,inexact)		\
    {									\
	Sgl_clear_signexponent_set_hidden(opnd);			\
	if ((exponent) >= (1 - SGL_P)) {				\
		guard = (Sall(opnd) >> -(exponent)) & 1;		\
		if ((exponent) < 0)					\
			sticky |= Sall(opnd) << (32+(exponent));	\
		inexact = guard | sticky;				\
		Sall(opnd) >>= (1-(exponent));				\
	}								\
	else {								\
		guard = 0;						\
		sticky |= Sall(opnd);					\
		inexact = sticky;					\
		Sgl_setzero(opnd);					\
	}								\
    }
303*4882a593Smuzhiyun 
/*
 * The fused multiply-add instructions require a single extended format,
 * with 48 bits of mantissa.
 */
#define SGLEXT_THRESHOLD 48

/* Zero both words of an extended value.  Wrapped in do { } while (0) so the
 * two assignments form a single statement. */
#define Sglext_setzero(valA,valB)	\
    do { Sextallp1(valA) = 0; Sextallp2(valB) = 0; } while (0)

/* Predicates on the first (p1) and second (p2) word of an extended value. */
#define Sglext_isnotzero_mantissap2(valB) (Sextallp2(valB)!=0)
#define Sglext_isone_lowp1(val) (Sextlowp1(val)!=0)
#define Sglext_isone_highp2(val) (Sexthighp2(val)!=0)
#define Sglext_isnotzero_low31p2(val) (Sextlow31p2(val)!=0)
#define Sglext_iszero(valA,valB) (Sextallp1(valA)==0 && Sextallp2(valB)==0)
318*4882a593Smuzhiyun 
/* Store src through destptr / load dest through srcptr.  Pointer arguments
 * are parenthesized so expressions such as "p + 1" are dereferenced as a
 * whole. */
#define Sgl_copytoptr(src,destptr) *(destptr) = (src)
#define Sgl_copyfromptr(srcptr,dest) (dest) = *(srcptr)
/* Copy both words of an extended value.  Single statement via
 * do { } while (0). */
#define Sglext_copy(srca,srcb,desta,destb) \
    do {					\
	Sextallp1(desta) = Sextallp1(srca);	\
	Sextallp2(destb) = Sextallp2(srcb);	\
    } while (0)
/* Widen a single value into an extended pair whose second word is zero. */
#define Sgl_copyto_sglext(src1,dest1,dest2) \
    do {					\
	Sextallp1(dest1) = Sall(src1);		\
	Sextallp2(dest2) = 0;			\
    } while (0)
326*4882a593Smuzhiyun 
/* Exchange the second words of two extended values with the three-step XOR
 * swap.  The operands must be distinct objects: swapping an object with
 * itself leaves it zero.  Wrapped in do { } while (0) so the three
 * assignments form a single statement. */
#define Sglext_swap_lower(leftp2,rightp2)  \
    do {								\
	Sextallp2(leftp2)  = Sextallp2(leftp2) XOR Sextallp2(rightp2);	\
	Sextallp2(rightp2) = Sextallp2(leftp2) XOR Sextallp2(rightp2);	\
	Sextallp2(leftp2)  = Sextallp2(leftp2) XOR Sextallp2(rightp2);	\
    } while (0)

/* Deposit 1 via Deposit_dlowp2() (low bit of the second word). */
#define Sglext_setone_lowmantissap2(value) Deposit_dlowp2(value,1)
333*4882a593Smuzhiyun 
/* The high bit is always zero so arithmetic or logical shifts will work.
 *
 * Shift the (srcdstA:srcdstB) pair right by `shift`.  If any nonzero bit is
 * shifted out, the low bit of srcdstB is set as a sticky marker.  Shifts of
 * 0..31 and 32..63 are handled; any other value leaves both words
 * untouched.
 * `shift` is evaluated once into a local, so compound expressions divide
 * and reduce as a whole, and the locals carry a private prefix so they
 * cannot capture a caller variable named shiftamt or sticky. */
#define Sglext_right_align(srcdstA,srcdstB,shift) \
  {int sglext_ra_shift = (shift);					\
   int sglext_ra_bits = sglext_ra_shift % 32;				\
   unsigned int sglext_ra_sticky = 0;					\
    switch (sglext_ra_shift / 32) {					\
     case 0: if (sglext_ra_bits > 0) {					\
	        sglext_ra_sticky =					\
		    Sextallp2(srcdstB) << (32 - sglext_ra_bits);	\
                Variable_shift_double(Sextallp1(srcdstA),		\
		 Sextallp2(srcdstB),sglext_ra_bits,Sextallp2(srcdstB));	\
	        Sextallp1(srcdstA) >>= sglext_ra_bits;			\
	     }								\
	     break;							\
     case 1: if (sglext_ra_bits > 0) {					\
	        sglext_ra_sticky =					\
		    (Sextallp1(srcdstA) << (32 - sglext_ra_bits)) |	\
		    Sextallp2(srcdstB);					\
	     }								\
	     else {							\
		sglext_ra_sticky = Sextallp2(srcdstB);			\
	     }								\
	     Sextallp2(srcdstB) = Sextallp1(srcdstA) >> sglext_ra_bits;	\
	     Sextallp1(srcdstA) = 0;					\
	     break;							\
    }									\
    if (sglext_ra_sticky) Sglext_setone_lowmantissap2(srcdstB);	\
  }
360*4882a593Smuzhiyun 
/* The left argument is never smaller than the right argument.
 * Two-word subtraction.  A borrow out of the low words is taken by
 * decrementing lefta in place, so lefta is modified even when resulta is a
 * different object.  Wrapped in do { } while (0) so the macro is a single
 * statement. */
#define Sglext_subtract(lefta,leftb,righta,rightb,resulta,resultb) \
    do {								\
	if( Sextallp2(rightb) > Sextallp2(leftb) ) Sextallp1(lefta)--;	\
	Sextallp2(resultb) = Sextallp2(leftb) - Sextallp2(rightb);	\
	Sextallp1(resulta) = Sextallp1(lefta) - Sextallp1(righta);	\
    } while (0)

/* Two-word addition.  If the sum of the low words is less than either
 * source, an overflow into the next word occurred.  The low sum and the
 * carry are computed into locals before any result word is written, so the
 * carry is still detected when resultb is the same object as rightb. */
#define Sglext_addition(lefta,leftb,righta,rightb,resulta,resultb) \
    do {								\
	unsigned int sglext_add_lo =					\
	    Sextallp2(leftb)+Sextallp2(rightb);				\
	unsigned int sglext_add_carry =					\
	    sglext_add_lo < Sextallp2(rightb);				\
	Sextallp2(resultb) = sglext_add_lo;				\
	Sextallp1(resulta) =						\
	    Sextallp1(lefta)+Sextallp1(righta)+sglext_add_carry;	\
    } while (0)
374*4882a593Smuzhiyun 
375*4882a593Smuzhiyun 
/* Shift the two-word value right by one: the low word takes the bit shifted
 * out of the high word, and the high word is shifted through a signed (int)
 * cast.  Wrapped in do { } while (0) so both steps form one statement. */
#define Sglext_arithrightshiftby1(srcdstA,srcdstB)	\
    do {								\
	Shiftdouble(Sextallp1(srcdstA),Sextallp2(srcdstB),1,		\
		    Sextallp2(srcdstB));				\
	Sextallp1(srcdstA) = (int)Sextallp1(srcdstA) >> 1;		\
    } while (0)
379*4882a593Smuzhiyun 
/* Fixed-count left shifts of a two-word value: the high word receives the
 * bits leaving the top of the low word, then the low word is shifted.  Each
 * macro is wrapped in do { } while (0) so both steps form one statement. */
#define Sglext_leftshiftby8(valA,valB) \
    do {								\
	Shiftdouble(Sextallp1(valA),Sextallp2(valB),24,Sextallp1(valA)); \
	Sextallp2(valB) <<= 8;						\
    } while (0)
#define Sglext_leftshiftby4(valA,valB) \
    do {								\
	Shiftdouble(Sextallp1(valA),Sextallp2(valB),28,Sextallp1(valA)); \
	Sextallp2(valB) <<= 4;						\
    } while (0)
#define Sglext_leftshiftby3(valA,valB) \
    do {								\
	Shiftdouble(Sextallp1(valA),Sextallp2(valB),29,Sextallp1(valA)); \
	Sextallp2(valB) <<= 3;						\
    } while (0)
#define Sglext_leftshiftby2(valA,valB) \
    do {								\
	Shiftdouble(Sextallp1(valA),Sextallp2(valB),30,Sextallp1(valA)); \
	Sextallp2(valB) <<= 2;						\
    } while (0)
#define Sglext_leftshiftby1(valA,valB) \
    do {								\
	Shiftdouble(Sextallp1(valA),Sextallp2(valB),31,Sextallp1(valA)); \
	Sextallp2(valB) <<= 1;						\
    } while (0)
395*4882a593Smuzhiyun 
/* Fixed-count right shifts of a two-word value: the low word receives the
 * bits leaving the bottom of the high word, then the high word is shifted.
 * Each macro is wrapped in do { } while (0) so both steps form one
 * statement. */
#define Sglext_rightshiftby4(valueA,valueB) \
    do {								\
	Shiftdouble(Sextallp1(valueA),Sextallp2(valueB),4,		\
		    Sextallp2(valueB));					\
	Sextallp1(valueA) >>= 4;					\
    } while (0)
#define Sglext_rightshiftby3(valueA,valueB) \
    do {								\
	Shiftdouble(Sextallp1(valueA),Sextallp2(valueB),3,		\
		    Sextallp2(valueB));					\
	Sextallp1(valueA) >>= 3;					\
    } while (0)
#define Sglext_rightshiftby1(valueA,valueB) \
    do {								\
	Shiftdouble(Sextallp1(valueA),Sextallp2(valueB),1,		\
		    Sextallp2(valueB));					\
	Sextallp1(valueA) >>= 1;					\
    } while (0)
405*4882a593Smuzhiyun 
/* Extended-format operations that are identical to their single-precision
 * counterparts; each one forwards to the Sgl_* macro of the same name. */
#define Sglext_xortointp1(left,right,result) \
	Sgl_xortointp1(left,right,result)
#define Sglext_xorfromintp1(left,right,result) \
	Sgl_xorfromintp1(left,right,result)
#define Sglext_copytoint_exponentmantissa(src,dest) \
	Sgl_copytoint_exponentmantissa(src,dest)
#define Sglext_ismagnitudeless(signlessleft,signlessright) \
	Sgl_ismagnitudeless(signlessleft,signlessright)

#define Sglext_set_sign(sglext,sign) \
	Sgl_set_sign(sglext,sign)
#define Sglext_clear_signexponent_set_hidden(sglext) \
	Sgl_clear_signexponent_set_hidden(sglext)
#define Sglext_clear_signexponent(sglext) \
	Sgl_clear_signexponent(sglext)
#define Sglext_clear_sign(sglext) \
	Sgl_clear_sign(sglext)
#define Sglext_isone_hidden(sglext) \
	Sgl_isone_hidden(sglext)
420*4882a593Smuzhiyun 
/* Denormalize the two-word value (opndp1:opndp2) for a result exponent of
 * `exponent` (expected <= 0).
 *
 * is_tiny is set to TRUE, then to FALSE only when exponent is 0, the second
 * word is nonzero, and the rounding-mode test below finds that opndp1 + 1
 * has the hidden-overflow bit set.
 *
 * The value is then stripped of sign/exponent, given its hidden bit, and
 * shifted right by 1-exponent across both words.  If any nonzero bit is
 * shifted out, the low bit of opndp2 is set as a sticky marker.  For
 * exponent below 1-DBL_P both words become zero (plus the sticky marker).
 * exponent is set to 0 on exit, so it must be an lvalue.
 *
 * In the exponent < -31 branch the bits lost from the first word are
 * p1 << (63+exponent).  The shift count used to be 31+exponent, which is
 * negative there (undefined behaviour) and only gave the right answer on
 * hardware that reduces shift counts modulo 32.
 * The sticky local carries a private prefix so it cannot capture a caller
 * variable named sticky. */
#define Sglext_denormalize(opndp1,opndp2,exponent,is_tiny)		\
  {unsigned int sglext_dn_sticky;					\
    is_tiny = TRUE;							\
    if ((exponent) == 0 && Sextallp2(opndp2)) {				\
	switch (Rounding_mode()) {					\
	case ROUNDPLUS:							\
		if (Sgl_iszero_sign(opndp1)) {				\
			if (Sgl_isone_hiddenoverflow(opndp1 + 1))	\
				is_tiny = FALSE;			\
		}							\
		break;							\
	case ROUNDMINUS:						\
		if (Sgl_isone_sign(opndp1)) {				\
			if (Sgl_isone_hiddenoverflow(opndp1 + 1))	\
				is_tiny = FALSE;			\
		}							\
		break;							\
	case ROUNDNEAREST:						\
		if (Sglext_isone_highp2(opndp2) &&			\
		    (Sglext_isone_lowp1(opndp1) || 			\
		     Sglext_isnotzero_low31p2(opndp2))) {		\
			if (Sgl_isone_hiddenoverflow(opndp1 + 1))	\
				is_tiny = FALSE;			\
		}							\
		break;							\
	}								\
    }									\
    Sglext_clear_signexponent_set_hidden(opndp1);			\
    if ((exponent) >= (1-DBL_P)) {					\
	if ((exponent) >= -31) {					\
	    if ((exponent) > -31) {					\
		sglext_dn_sticky =					\
		    Sextallp2(opndp2) << (31+(exponent));		\
		Variable_shift_double(opndp1,opndp2,1-(exponent),opndp2); \
		Sextallp1(opndp1) >>= (1-(exponent));			\
	    }								\
	    else {							\
		sglext_dn_sticky = Sextallp2(opndp2);			\
		Sextallp2(opndp2) = Sextallp1(opndp1);			\
		Sextallp1(opndp1) = 0;					\
	    }								\
	}								\
	else {								\
	    sglext_dn_sticky =						\
		(Sextallp1(opndp1) << (63+(exponent))) |		\
		Sextallp2(opndp2);					\
	    Sextallp2(opndp2) =						\
		Sextallp1(opndp1) >> (-31-(exponent));			\
	    Sextallp1(opndp1) = 0;					\
	}								\
    }									\
    else {								\
	sglext_dn_sticky = Sextallp1(opndp1) | Sextallp2(opndp2);	\
	Sglext_setzero(opndp1,opndp2);					\
    }									\
    if (sglext_dn_sticky) Sglext_setone_lowmantissap2(opndp2);		\
    exponent = 0;							\
  }
474