/* SPDX-License-Identifier: GPL-2.0-or-later */
/*
 * Linux/PA-RISC Project (http://www.parisc-linux.org/)
 *
 * Floating-point emulation code
 *  Copyright (C) 2001 Hewlett-Packard (Paul Bame) <bame@debian.org>
 */

#ifdef __NO_PA_HDRS
    PA header file -- do not include this header file for non-PA builds.
#endif

/*
 * Single-precision helper macros.
 *
 * Everything here is a thin layer over accessor macros (Sall, Ssign,
 * Sexponent, Deposit_*, Shiftdouble, Extall, ...) that are defined outside
 * this header.  Most macros expand to a bare expression or assignment with
 * no trailing semicolon; the caller supplies it.
 */

/* 32-bit word grabbing functions */
#define Sgl_firstword(value) Sall(value)
#define Sgl_secondword(value) dummy_location
#define Sgl_thirdword(value) dummy_location
#define Sgl_fourthword(value) dummy_location

/* Field accessors: forward to the corresponding S* accessor. */
#define Sgl_sign(object) Ssign(object)
#define Sgl_exponent(object) Sexponent(object)
#define Sgl_signexponent(object) Ssignexponent(object)
#define Sgl_mantissa(object) Smantissa(object)
#define Sgl_exponentmantissa(object) Sexponentmantissa(object)
#define Sgl_all(object) Sall(object)

/* sgl_and_signs ANDs the sign bits of each argument and puts the result
 * into the first argument. sgl_or_signs ors those same sign bits */
#define Sgl_and_signs( src1dst, src2)		\
    Sall(src1dst) = (Sall(src2)|~((unsigned int)1<<31)) & Sall(src1dst)
#define Sgl_or_signs( src1dst, src2)		\
    Sall(src1dst) = (Sall(src2)&((unsigned int)1<<31)) | Sall(src1dst)

/* The hidden bit is always the low bit of the exponent */
#define Sgl_clear_exponent_set_hidden(srcdst) Deposit_sexponent(srcdst,1)
#define Sgl_clear_signexponent_set_hidden(srcdst) \
    Deposit_ssignexponent(srcdst,1)
#define Sgl_clear_sign(srcdst) Sall(srcdst) &= ~((unsigned int)1<<31)
#define Sgl_clear_signexponent(srcdst) Sall(srcdst) &= 0x007fffff

/* varamount must be less than 32 for the next three functions */
/* varamount is parenthesized so that an expression argument containing
 * operators of lower precedence than a shift is still used as one operand. */
#define Sgl_rightshift(srcdst, varamount)	\
    Sall(srcdst) >>= (varamount)
#define Sgl_leftshift(srcdst, varamount)	\
    Sall(srcdst) <<= (varamount)
/* Shift exponent+mantissa right while leaving the sign bit (bit 31 of the
 * word) where it is. */
#define Sgl_rightshift_exponentmantissa(srcdst, varamount) \
    Sall(srcdst) = \
	(Sexponentmantissa(srcdst) >> (varamount)) | \
	(Sall(srcdst) & ((unsigned int)1<<31))

#define Sgl_leftshiftby1_withextent(left,right,result) \
    Shiftdouble(Sall(left),Extall(right),31,Sall(result))

/* NOTE: the `dst' parameter is not referenced by the expansion; the result
 * of the double shift is written to Extall(right). */
#define Sgl_rightshiftby1_withextent(left,right,dst)		\
    Shiftdouble(Sall(left),Extall(right),1,Extall(right))
/* The (int) cast requests a signed right shift of the word. */
#define Sgl_arithrightshiftby1(srcdst)	\
    Sall(srcdst) = (int)Sall(srcdst) >> 1

/* Sign extend the sign bit with an integer destination */
#define Sgl_signextendedsign(value) Ssignedsign(value)

#define Sgl_isone_hidden(sgl_value) (Shidden(sgl_value))
#define Sgl_increment(sgl_value) Sall(sgl_value) += 1
/* The new mantissa is taken from (sgl_value)+1, i.e. the operand itself is
 * used arithmetically here rather than through Sall(). */
#define Sgl_increment_mantissa(sgl_value) \
    Deposit_smantissa(sgl_value,(sgl_value)+1)
#define Sgl_decrement(sgl_value) Sall(sgl_value) -= 1

/*
 * Predicates.  Each expands to a fully parenthesized comparison, so it can
 * be used directly inside a larger condition.
 */
#define Sgl_isone_sign(sgl_value) (Is_ssign(sgl_value)!=0)
#define Sgl_isone_hiddenoverflow(sgl_value) \
    (Is_shiddenoverflow(sgl_value)!=0)
#define Sgl_isone_lowmantissa(sgl_value) (Is_slow(sgl_value)!=0)
#define Sgl_isone_signaling(sgl_value) (Is_ssignaling(sgl_value)!=0)
#define Sgl_is_signalingnan(sgl_value) (Ssignalingnan(sgl_value)==0x1ff)
#define Sgl_isnotzero(sgl_value) (Sall(sgl_value)!=0)
#define Sgl_isnotzero_hiddenhigh7mantissa(sgl_value) \
    (Shiddenhigh7mantissa(sgl_value)!=0)
#define Sgl_isnotzero_low4(sgl_value) (Slow4(sgl_value)!=0)
#define Sgl_isnotzero_exponent(sgl_value) (Sexponent(sgl_value)!=0)
#define Sgl_isnotzero_mantissa(sgl_value) (Smantissa(sgl_value)!=0)
#define Sgl_isnotzero_exponentmantissa(sgl_value) \
    (Sexponentmantissa(sgl_value)!=0)
#define Sgl_iszero(sgl_value) (Sall(sgl_value)==0)
#define Sgl_iszero_signaling(sgl_value) (Is_ssignaling(sgl_value)==0)
#define Sgl_iszero_hidden(sgl_value) (Is_shidden(sgl_value)==0)
#define Sgl_iszero_hiddenoverflow(sgl_value) \
    (Is_shiddenoverflow(sgl_value)==0)
#define Sgl_iszero_hiddenhigh3mantissa(sgl_value) \
    (Shiddenhigh3mantissa(sgl_value)==0)
#define Sgl_iszero_hiddenhigh7mantissa(sgl_value) \
    (Shiddenhigh7mantissa(sgl_value)==0)
#define Sgl_iszero_sign(sgl_value) (Is_ssign(sgl_value)==0)
#define Sgl_iszero_exponent(sgl_value) (Sexponent(sgl_value)==0)
#define Sgl_iszero_mantissa(sgl_value) (Smantissa(sgl_value)==0)
#define Sgl_iszero_exponentmantissa(sgl_value) \
    (Sexponentmantissa(sgl_value)==0)
/* Infinity and NaN share the exponent SGL_INFINITY_EXPONENT; the mantissa
 * (zero vs. non-zero) tells them apart. */
#define Sgl_isinfinity_exponent(sgl_value)		\
    (Sgl_exponent(sgl_value)==SGL_INFINITY_EXPONENT)
#define Sgl_isnotinfinity_exponent(sgl_value)		\
    (Sgl_exponent(sgl_value)!=SGL_INFINITY_EXPONENT)
#define Sgl_isinfinity(sgl_value)			\
    (Sgl_exponent(sgl_value)==SGL_INFINITY_EXPONENT &&	\
    Sgl_mantissa(sgl_value)==0)
#define Sgl_isnan(sgl_value)				\
    (Sgl_exponent(sgl_value)==SGL_INFINITY_EXPONENT &&	\
    Sgl_mantissa(sgl_value)!=0)
#define Sgl_isnotnan(sgl_value)				\
    (Sgl_exponent(sgl_value)!=SGL_INFINITY_EXPONENT ||	\
    Sgl_mantissa(sgl_value)==0)
/* Whole-word comparisons of the two operands. */
#define Sgl_islessthan(sgl_op1,sgl_op2)			\
    (Sall(sgl_op1) < Sall(sgl_op2))
#define Sgl_isgreaterthan(sgl_op1,sgl_op2)		\
    (Sall(sgl_op1) > Sall(sgl_op2))
#define Sgl_isnotlessthan(sgl_op1,sgl_op2)		\
    (Sall(sgl_op1) >= Sall(sgl_op2))
#define Sgl_isequal(sgl_op1,sgl_op2)			\
    (Sall(sgl_op1) == Sall(sgl_op2))

#define Sgl_leftshiftby8(sgl_value) \
    Sall(sgl_value) <<= 8
#define Sgl_leftshiftby4(sgl_value) \
    Sall(sgl_value) <<= 4
#define Sgl_leftshiftby3(sgl_value) \
    Sall(sgl_value) <<= 3
#define Sgl_leftshiftby2(sgl_value) \
    Sall(sgl_value) <<= 2
#define Sgl_leftshiftby1(sgl_value) \
    Sall(sgl_value) <<= 1
#define Sgl_rightshiftby1(sgl_value) \
    Sall(sgl_value) >>= 1
#define Sgl_rightshiftby4(sgl_value) \
    Sall(sgl_value) >>= 4
#define Sgl_rightshiftby8(sgl_value) \
    Sall(sgl_value) >>= 8

/* Both arguments are parenthesized so that an expression argument cannot
 * re-associate with the `<' comparison. */
#define Sgl_ismagnitudeless(signlessleft,signlessright)			\
/*  unsigned int signlessleft, signlessright; */			\
      ((signlessleft) < (signlessright))


#define Sgl_copytoint_exponentmantissa(source,dest)     \
    dest = Sexponentmantissa(source)

/* A quiet NaN has the high mantissa bit clear and at least one other (in this
 * case the adjacent bit) bit set. */
#define Sgl_set_quiet(sgl_value) Deposit_shigh2mantissa(sgl_value,1)
#define Sgl_set_exponent(sgl_value,exp) Deposit_sexponent(sgl_value,exp)

#define Sgl_set_mantissa(dest,value) Deposit_smantissa(dest,value)
#define Sgl_set_exponentmantissa(dest,value) \
    Deposit_sexponentmantissa(dest,value)

/*  An infinity is represented with the max exponent and a zero mantissa */
#define Sgl_setinfinity_exponent(sgl_value) \
    Deposit_sexponent(sgl_value,SGL_INFINITY_EXPONENT)
#define Sgl_setinfinity_exponentmantissa(sgl_value)	\
    Deposit_sexponentmantissa(sgl_value, \
	(SGL_INFINITY_EXPONENT << (32-(1+SGL_EXP_LENGTH))))
#define Sgl_setinfinitypositive(sgl_value)		\
    Sall(sgl_value) = (SGL_INFINITY_EXPONENT << (32-(1+SGL_EXP_LENGTH)))
#define Sgl_setinfinitynegative(sgl_value)		\
    Sall(sgl_value) = (SGL_INFINITY_EXPONENT << (32-(1+SGL_EXP_LENGTH))) \
    | ((unsigned int)1<<31)
/* `sign' is parenthesized before the cast: without that, the cast applies
 * only to the first token of an expression argument and the shift binds to
 * the last one. */
#define Sgl_setinfinity(sgl_value,sign)					\
    Sall(sgl_value) = (SGL_INFINITY_EXPONENT << (32-(1+SGL_EXP_LENGTH))) | \
     ((unsigned int)(sign) << 31)
#define Sgl_sethigh4bits(sgl_value, extsign)  \
    Deposit_shigh4(sgl_value,extsign)
#define Sgl_set_sign(sgl_value,sign) Deposit_ssign(sgl_value,sign)
#define Sgl_invert_sign(sgl_value)  \
    Deposit_ssign(sgl_value,~Ssign(sgl_value))
#define Sgl_setone_sign(sgl_value) Deposit_ssign(sgl_value,1)
#define Sgl_setone_lowmantissa(sgl_value) Deposit_slow(sgl_value,1)
#define Sgl_setzero_sign(sgl_value)  Sall(sgl_value) &= 0x7fffffff
#define Sgl_setzero_exponent(sgl_value) Sall(sgl_value) &= 0x807fffff
#define Sgl_setzero_mantissa(sgl_value) Sall(sgl_value) &= 0xff800000
#define Sgl_setzero_exponentmantissa(sgl_value)  Sall(sgl_value) &= 0x80000000
#define Sgl_setzero(sgl_value) Sall(sgl_value) = 0
#define Sgl_setnegativezero(sgl_value) Sall(sgl_value) = (unsigned int)1 << 31

/* Use following macro for both overflow & underflow conditions */
/* `ovfl' and `unfl' expand to the operator that Sgl_setwrapped_exponent
 * places between the exponent and SGL_WRAP. */
#define ovfl -
#define unfl +
#define Sgl_setwrapped_exponent(sgl_value,exponent,op) \
    Deposit_sexponent(sgl_value,((exponent) op SGL_WRAP))

#define Sgl_setlargestpositive(sgl_value)				\
    Sall(sgl_value) = ((SGL_EMAX+SGL_BIAS) << (32-(1+SGL_EXP_LENGTH)))	\
                      | ((1<<(32-(1+SGL_EXP_LENGTH))) - 1 )
#define Sgl_setlargestnegative(sgl_value)				\
    Sall(sgl_value) = ((SGL_EMAX+SGL_BIAS) << (32-(1+SGL_EXP_LENGTH)))	\
                      | ((1<<(32-(1+SGL_EXP_LENGTH))) - 1 )		\
		      | ((unsigned int)1<<31)

/* The shifted value reaches the top bit of the word, so the shift is done
 * on an unsigned operand: shifting a signed int into its sign bit is
 * undefined behaviour in C. */
#define Sgl_setnegativeinfinity(sgl_value)	\
    Sall(sgl_value) =				\
    (unsigned int)((1<<SGL_EXP_LENGTH) | SGL_INFINITY_EXPONENT) \
	<< (32-(1+SGL_EXP_LENGTH))
/* `sign' is parenthesized before the cast so that an expression argument
 * is cast and shifted as a whole. */
#define Sgl_setlargest(sgl_value,sign)					\
    Sall(sgl_value) = ((unsigned int)(sign) << 31) |			\
        (((SGL_EMAX+SGL_BIAS) << (32-(1+SGL_EXP_LENGTH)))		\
	  | ((1 << (32-(1+SGL_EXP_LENGTH))) - 1 ))
/* Keeps the current sign bit and overwrites exponent and mantissa. */
#define Sgl_setlargest_exponentmantissa(sgl_value)			\
    Sall(sgl_value) = (Sall(sgl_value) & ((unsigned int)1<<31)) |	\
        (((SGL_EMAX+SGL_BIAS) << (32-(1+SGL_EXP_LENGTH)))		\
	  | ((1 << (32-(1+SGL_EXP_LENGTH))) - 1 ))

/* The high bit is always zero so arithmetic or logical shifts will work. */
/* NOTE: expands to a bare if/else statement (not wrapped in do/while), so
 * it must not be used as the unbraced body of another if that has an else. */
#define Sgl_right_align(srcdst,shift,extent)				\
    /* sgl_floating_point srcdst; int shift; extension extent */	\
    if ((shift) < 32) {							\
	Extall(extent) = Sall(srcdst) << (32-(shift));			\
	Sall(srcdst) >>= (shift);					\
    }									\
    else {								\
	Extall(extent) = Sall(srcdst);					\
	Sall(srcdst) = 0;						\
    }
#define Sgl_hiddenhigh3mantissa(sgl_value) Shiddenhigh3mantissa(sgl_value)
#define Sgl_hidden(sgl_value) Shidden(sgl_value)
#define Sgl_lowmantissa(sgl_value) Slow(sgl_value)

/* The left argument is never smaller than the right argument */
#define Sgl_subtract(sgl_left,sgl_right,sgl_result) \
    Sall(sgl_result) = Sall(sgl_left) - Sall(sgl_right)

/* Subtract right augmented with extension from left augmented with zeros and
 * store into result and extension. */
/* The extension is negated in place; when the negated extension is non-zero
 * one is subtracted from the result word as the borrow.  Expands to two
 * statements. */
#define Sgl_subtract_withextension(left,right,extent,result)		\
    /* sgl_floating_point left,right,result; extension extent */	\
  Sgl_subtract(left,right,result);					\
  if((Extall(extent) = 0-Extall(extent)))				\
      Sall(result) = Sall(result)-1

#define Sgl_addition(sgl_left,sgl_right,sgl_result) \
    Sall(sgl_result) = Sall(sgl_left) + Sall(sgl_right)

/* NOTE: unlike its neighbours this expansion already ends in `;'.  That is
 * kept as-is so existing call sites compile unchanged. */
#define Sgl_xortointp1(left,right,result)			\
    result = Sall(left) XOR Sall(right);

#define Sgl_xorfromintp1(left,right,result)			\
    Sall(result) = (left) XOR Sall(right)

/* Need to Initialize */
/* Both NaN builders use exponent (SGL_EMAX+SGL_BIAS)+1; they differ only in
 * which single mantissa bit is set. */
#define Sgl_makequietnan(dest)						\
    Sall(dest) = ((((SGL_EMAX+SGL_BIAS)+1)<< (32-(1+SGL_EXP_LENGTH)))	\
                 | (1<<(32-(1+SGL_EXP_LENGTH+2))))
#define Sgl_makesignalingnan(dest)					\
    Sall(dest) = ((((SGL_EMAX+SGL_BIAS)+1)<< (32-(1+SGL_EXP_LENGTH)))	\
                 | (1<<(32-(1+SGL_EXP_LENGTH+1))))

/* Shift the operand left until its hidden bit is set, decrementing
 * `exponent' by the number of positions shifted: first in steps of 8, then
 * at most one step of 4, then in steps of 1.  `exponent' must be an lvalue.
 * Expands to several statements. */
#define Sgl_normalize(sgl_opnd,exponent)			\
	while(Sgl_iszero_hiddenhigh7mantissa(sgl_opnd)) {	\
		Sgl_leftshiftby8(sgl_opnd);			\
		exponent -= 8;					\
	}							\
	if(Sgl_iszero_hiddenhigh3mantissa(sgl_opnd)) {		\
		Sgl_leftshiftby4(sgl_opnd);			\
		exponent -= 4;					\
	}							\
	while(Sgl_iszero_hidden(sgl_opnd)) {			\
		Sgl_leftshiftby1(sgl_opnd);			\
		exponent -= 1;					\
	}

/* Rounding modes other than the four listed leave sgl_opnd untouched. */
#define Sgl_setoverflow(sgl_opnd)				\
	/* set result to infinity or largest number */		\
	switch (Rounding_mode()) {				\
		case ROUNDPLUS:					\
			if (Sgl_isone_sign(sgl_opnd)) {		\
				Sgl_setlargestnegative(sgl_opnd); \
			}					\
			else {					\
				Sgl_setinfinitypositive(sgl_opnd); \
			}					\
			break;					\
		case ROUNDMINUS:				\
			if (Sgl_iszero_sign(sgl_opnd)) {	\
				Sgl_setlargestpositive(sgl_opnd); \
			}					\
			else {					\
				Sgl_setinfinitynegative(sgl_opnd); \
			}					\
			break;					\
		case ROUNDNEAREST:				\
			Sgl_setinfinity_exponentmantissa(sgl_opnd); \
			break;					\
		case ROUNDZERO:					\
			Sgl_setlargest_exponentmantissa(sgl_opnd); \
	}

/* Shift the operand right by (1 - exponent) positions, reporting the last
 * bit shifted out in `guard' and OR-ing the bits below it into `sticky';
 * `inexact' is set to guard | sticky.  When exponent is below (1 - SGL_P)
 * the operand becomes zero and all of its bits go into `sticky'.
 * guard/sticky/inexact must be lvalues; `sticky' is OR-ed into, so the
 * caller must have initialized it. */
#define Sgl_denormalize(opnd,exponent,guard,sticky,inexact)		\
	Sgl_clear_signexponent_set_hidden(opnd);			\
	if ((exponent) >= (1 - SGL_P)) {				\
		guard = (Sall(opnd) >> -(exponent)) & 1;		\
		if ((exponent) < 0) sticky |= Sall(opnd) << (32+(exponent)); \
		inexact = guard | sticky;				\
		Sall(opnd) >>= (1-(exponent));				\
	}								\
	else {								\
		guard = 0;						\
		sticky |= Sall(opnd);					\
		inexact = sticky;					\
		Sgl_setzero(opnd);					\
	}

/*
 * The fused multiply add instructions requires a single extended format,
 * with 48 bits of mantissa.
 */
#define SGLEXT_THRESHOLD 48

/* In the Sglext_* macros a value is passed as two words: the first argument
 * is accessed with Sextallp1() and the second with Sextallp2(). */
#define Sglext_setzero(valA,valB)	\
    Sextallp1(valA) = 0; Sextallp2(valB) = 0

#define Sglext_isnotzero_mantissap2(valB) (Sextallp2(valB)!=0)
#define Sglext_isone_lowp1(val) (Sextlowp1(val)!=0)
#define Sglext_isone_highp2(val) (Sexthighp2(val)!=0)
#define Sglext_isnotzero_low31p2(val) (Sextlow31p2(val)!=0)
#define Sglext_iszero(valA,valB) (Sextallp1(valA)==0 && Sextallp2(valB)==0)

#define Sgl_copytoptr(src,destptr) *(destptr) = (src)
#define Sgl_copyfromptr(srcptr,dest) dest = *(srcptr)
#define Sglext_copy(srca,srcb,desta,destb) \
    Sextallp1(desta) = Sextallp1(srca);	\
    Sextallp2(destb) = Sextallp2(srcb)
#define Sgl_copyto_sglext(src1,dest1,dest2) \
	Sextallp1(dest1) = Sall(src1); Sextallp2(dest2) = 0

/* Exchange the two second words with three XORs, without a temporary. */
#define Sglext_swap_lower(leftp2,rightp2)  \
    Sextallp2(leftp2)  = Sextallp2(leftp2) XOR Sextallp2(rightp2);  \
    Sextallp2(rightp2) = Sextallp2(leftp2) XOR Sextallp2(rightp2);  \
    Sextallp2(leftp2)  = Sextallp2(leftp2) XOR Sextallp2(rightp2)

#define Sglext_setone_lowmantissap2(value) Deposit_dlowp2(value,1)

/* The high bit is always zero so arithmetic or logical shifts will work. */
/* Right-shift the two-word value by `shift' bits.  Any non-zero bits that
 * are shifted out are recorded by setting the low bit of the second word.
 * Only shift/32 equal to 0 or 1 is handled; other values fall through the
 * switch and leave the value unchanged. */
#define Sglext_right_align(srcdstA,srcdstB,shift) \
  {int shiftamt, sticky;						\
    shiftamt = (shift) % 32;						\
    sticky = 0;								\
    switch ((shift)/32) {						\
     case 0: if (shiftamt > 0) {					\
	        sticky = Sextallp2(srcdstB) << (32 - (shiftamt));	\
                Variable_shift_double(Sextallp1(srcdstA),		\
		 Sextallp2(srcdstB),shiftamt,Sextallp2(srcdstB));	\
	        Sextallp1(srcdstA) >>= shiftamt;			\
	     }								\
	     break;							\
     case 1: if (shiftamt > 0) {					\
	        sticky = (Sextallp1(srcdstA) << (32 - (shiftamt))) |	\
			 Sextallp2(srcdstB);				\
	     }								\
	     else {							\
		sticky = Sextallp2(srcdstB);				\
	     }								\
	     Sextallp2(srcdstB) = Sextallp1(srcdstA) >> shiftamt;	\
	     Sextallp1(srcdstA) = 0;					\
	     break;							\
    }									\
    if (sticky) Sglext_setone_lowmantissap2(srcdstB);			\
  }

/* The left argument is never smaller than the right argument */
/* NOTE: when a borrow is needed the first word of the LEFT operand is
 * decremented in place before the subtraction. */
#define Sglext_subtract(lefta,leftb,righta,rightb,resulta,resultb) \
    if( Sextallp2(rightb) > Sextallp2(leftb) ) Sextallp1(lefta)--; \
    Sextallp2(resultb) = Sextallp2(leftb) - Sextallp2(rightb);	\
    Sextallp1(resulta) = Sextallp1(lefta) - Sextallp1(righta)

#define Sglext_addition(lefta,leftb,righta,rightb,resulta,resultb) \
    /* If the sum of the low words is less than either source, then \
     * an overflow into the next word occurred. */ \
    if ((Sextallp2(resultb) = Sextallp2(leftb)+Sextallp2(rightb)) < \
        Sextallp2(rightb)) \
	    Sextallp1(resulta) = Sextallp1(lefta)+Sextallp1(righta)+1; \
    else Sextallp1(resulta) = Sextallp1(lefta)+Sextallp1(righta)


#define Sglext_arithrightshiftby1(srcdstA,srcdstB)	\
    Shiftdouble(Sextallp1(srcdstA),Sextallp2(srcdstB),1,Sextallp2(srcdstB)); \
    Sextallp1(srcdstA) = (int)Sextallp1(srcdstA) >> 1

/* Two-word left shifts: Shiftdouble is given (32 - n) and writes the first
 * word, then the second word is shifted left by n. */
#define Sglext_leftshiftby8(valA,valB) \
    Shiftdouble(Sextallp1(valA),Sextallp2(valB),24,Sextallp1(valA)); \
    Sextallp2(valB) <<= 8
#define Sglext_leftshiftby4(valA,valB) \
    Shiftdouble(Sextallp1(valA),Sextallp2(valB),28,Sextallp1(valA)); \
    Sextallp2(valB) <<= 4
#define Sglext_leftshiftby3(valA,valB) \
    Shiftdouble(Sextallp1(valA),Sextallp2(valB),29,Sextallp1(valA)); \
    Sextallp2(valB) <<= 3
#define Sglext_leftshiftby2(valA,valB) \
    Shiftdouble(Sextallp1(valA),Sextallp2(valB),30,Sextallp1(valA)); \
    Sextallp2(valB) <<= 2
#define Sglext_leftshiftby1(valA,valB) \
    Shiftdouble(Sextallp1(valA),Sextallp2(valB),31,Sextallp1(valA)); \
    Sextallp2(valB) <<= 1

/* Two-word right shifts: Shiftdouble is given n and writes the second word,
 * then the first word is shifted right by n. */
#define Sglext_rightshiftby4(valueA,valueB) \
    Shiftdouble(Sextallp1(valueA),Sextallp2(valueB),4,Sextallp2(valueB)); \
    Sextallp1(valueA) >>= 4
#define Sglext_rightshiftby3(valueA,valueB) \
    Shiftdouble(Sextallp1(valueA),Sextallp2(valueB),3,Sextallp2(valueB)); \
    Sextallp1(valueA) >>= 3
#define Sglext_rightshiftby1(valueA,valueB) \
    Shiftdouble(Sextallp1(valueA),Sextallp2(valueB),1,Sextallp2(valueB)); \
    Sextallp1(valueA) >>= 1

/* The following Sglext_* names forward to the Sgl_* macro of the same
 * suffix. */
#define Sglext_xortointp1(left,right,result) Sgl_xortointp1(left,right,result)
#define Sglext_xorfromintp1(left,right,result) \
	Sgl_xorfromintp1(left,right,result)
#define Sglext_copytoint_exponentmantissa(src,dest) \
	Sgl_copytoint_exponentmantissa(src,dest)
#define Sglext_ismagnitudeless(signlessleft,signlessright) \
	Sgl_ismagnitudeless(signlessleft,signlessright)

#define Sglext_set_sign(dbl_value,sign)  Sgl_set_sign(dbl_value,sign)
#define Sglext_clear_signexponent_set_hidden(srcdst) \
	Sgl_clear_signexponent_set_hidden(srcdst)
#define Sglext_clear_signexponent(srcdst) Sgl_clear_signexponent(srcdst)
#define Sglext_clear_sign(srcdst) Sgl_clear_sign(srcdst)
#define Sglext_isone_hidden(dbl_value) Sgl_isone_hidden(dbl_value)

/* Denormalize the two-word operand for the given `exponent'.
 *
 * is_tiny starts TRUE and is cleared only when exponent is 0, the second
 * word is non-zero, and, under the current rounding mode, the test on
 * (opndp1 + 1) reports a hidden-overflow bit.  The value is then shifted
 * right by (1 - exponent) positions; any non-zero bits shifted out set the
 * low bit of the second word.  `exponent' is reset to 0 at the end, so it
 * and is_tiny must be lvalues.
 * NOTE(review): the shift-range bound below uses DBL_P rather than a
 * single-extended constant; kept as found -- confirm against the caller. */
#define Sglext_denormalize(opndp1,opndp2,exponent,is_tiny)		\
  {int sticky;								\
    is_tiny = TRUE;							\
    if ((exponent) == 0 && Sextallp2(opndp2)) {				\
	switch (Rounding_mode()) {					\
	case ROUNDPLUS:							\
		if (Sgl_iszero_sign(opndp1)) {				\
			if (Sgl_isone_hiddenoverflow(opndp1 + 1))	\
				is_tiny = FALSE;			\
		}							\
		break;							\
	case ROUNDMINUS:						\
		if (Sgl_isone_sign(opndp1)) {				\
			if (Sgl_isone_hiddenoverflow(opndp1 + 1))	\
				is_tiny = FALSE;			\
		}							\
		break;							\
	case ROUNDNEAREST:						\
		if (Sglext_isone_highp2(opndp2) &&			\
		    (Sglext_isone_lowp1(opndp1) ||			\
		     Sglext_isnotzero_low31p2(opndp2))) {		\
			if (Sgl_isone_hiddenoverflow(opndp1 + 1))	\
				is_tiny = FALSE;			\
		}							\
		break;							\
	}								\
    }									\
    Sglext_clear_signexponent_set_hidden(opndp1);			\
    if ((exponent) >= (1-DBL_P)) {					\
	if ((exponent) >= -31) {					\
	    if ((exponent) > -31) {					\
		sticky = Sextallp2(opndp2) << (31+(exponent));		\
		Variable_shift_double(opndp1,opndp2,1-(exponent),opndp2); \
		Sextallp1(opndp1) >>= 1-(exponent);			\
	    }								\
	    else {							\
		sticky = Sextallp2(opndp2);				\
		Sextallp2(opndp2) = Sextallp1(opndp1);			\
		Sextallp1(opndp1) = 0;					\
	    }								\
	}								\
	else {								\
	    sticky = (Sextallp1(opndp1) << (31+(exponent))) |		\
		     Sextallp2(opndp2);					\
	    Sextallp2(opndp2) = Sextallp1(opndp1) >> (-31-(exponent));	\
	    Sextallp1(opndp1) = 0;					\
	}								\
    }									\
    else {								\
	sticky = Sextallp1(opndp1) | Sextallp2(opndp2);			\
	Sglext_setzero(opndp1,opndp2);					\
    }									\
    if (sticky) Sglext_setone_lowmantissap2(opndp2);			\
    exponent = 0;							\
  }