1*4882a593Smuzhiyun| 2*4882a593Smuzhiyun| kernel_ex.sa 3.3 12/19/90 3*4882a593Smuzhiyun| 4*4882a593Smuzhiyun| This file contains routines to force exception status in the 5*4882a593Smuzhiyun| fpu for exceptional cases detected or reported within the 6*4882a593Smuzhiyun| transcendental functions. Typically, the t_xx routine will 7*4882a593Smuzhiyun| set the appropriate bits in the USER_FPSR word on the stack. 8*4882a593Smuzhiyun| The bits are tested in gen_except.sa to determine if an exceptional 9*4882a593Smuzhiyun| situation needs to be created on return from the FPSP. 10*4882a593Smuzhiyun| 11*4882a593Smuzhiyun 12*4882a593Smuzhiyun| Copyright (C) Motorola, Inc. 1990 13*4882a593Smuzhiyun| All Rights Reserved 14*4882a593Smuzhiyun| 15*4882a593Smuzhiyun| For details on the license for this file, please see the 16*4882a593Smuzhiyun| file, README, in this same directory. 17*4882a593Smuzhiyun 18*4882a593SmuzhiyunKERNEL_EX: |idnt 2,1 | Motorola 040 Floating Point Software Package 19*4882a593Smuzhiyun 20*4882a593Smuzhiyun |section 8 21*4882a593Smuzhiyun 22*4882a593Smuzhiyun#include "fpsp.h" 23*4882a593Smuzhiyun 24*4882a593Smuzhiyunmns_inf: .long 0xffff0000,0x00000000,0x00000000 25*4882a593Smuzhiyunpls_inf: .long 0x7fff0000,0x00000000,0x00000000 26*4882a593Smuzhiyunnan: .long 0x7fff0000,0xffffffff,0xffffffff 27*4882a593Smuzhiyunhuge: .long 0x7ffe0000,0xffffffff,0xffffffff 28*4882a593Smuzhiyun 29*4882a593Smuzhiyun |xref ovf_r_k 30*4882a593Smuzhiyun |xref unf_sub 31*4882a593Smuzhiyun |xref nrm_set 32*4882a593Smuzhiyun 33*4882a593Smuzhiyun .global t_dz 34*4882a593Smuzhiyun .global t_dz2 35*4882a593Smuzhiyun .global t_operr 36*4882a593Smuzhiyun .global t_unfl 37*4882a593Smuzhiyun .global t_ovfl 38*4882a593Smuzhiyun .global t_ovfl2 39*4882a593Smuzhiyun .global t_inx2 40*4882a593Smuzhiyun .global t_frcinx 41*4882a593Smuzhiyun .global t_extdnrm 42*4882a593Smuzhiyun .global t_resdnrm 43*4882a593Smuzhiyun .global dst_nan 44*4882a593Smuzhiyun .global src_nan 45*4882a593Smuzhiyun| 46*4882a593Smuzhiyun| DZ exception 47*4882a593Smuzhiyun| 48*4882a593Smuzhiyun| 49*4882a593Smuzhiyun| if dz trap disabled 50*4882a593Smuzhiyun| store properly signed inf (use sign of etemp) into fp0 51*4882a593Smuzhiyun| set FPSR exception status dz bit, condition code 52*4882a593Smuzhiyun| inf bit, and accrued dz bit 53*4882a593Smuzhiyun| return 54*4882a593Smuzhiyun| frestore the frame into the machine (done by unimp_hd) 55*4882a593Smuzhiyun| 56*4882a593Smuzhiyun| else dz trap enabled 57*4882a593Smuzhiyun| set exception status bit & accrued bits in FPSR 58*4882a593Smuzhiyun| set flag to disable sto_res from corrupting fp register 59*4882a593Smuzhiyun| return 60*4882a593Smuzhiyun| frestore the frame into the machine (done by unimp_hd) 61*4882a593Smuzhiyun| 62*4882a593Smuzhiyun| t_dz2 is used by monadic functions such as flogn (from do_func). 63*4882a593Smuzhiyun| t_dz is used by monadic functions such as satanh (from the 64*4882a593Smuzhiyun| transcendental function). 65*4882a593Smuzhiyun| 66*4882a593Smuzhiyunt_dz2: 67*4882a593Smuzhiyun bsetb #neg_bit,FPSR_CC(%a6) |set neg bit in FPSR 68*4882a593Smuzhiyun fmovel #0,%FPSR |clr status bits (Z set) 69*4882a593Smuzhiyun btstb #dz_bit,FPCR_ENABLE(%a6) |test FPCR for dz exc enabled 70*4882a593Smuzhiyun bnes dz_ena_end 71*4882a593Smuzhiyun bras m_inf |flogx always returns -inf 72*4882a593Smuzhiyunt_dz: 73*4882a593Smuzhiyun fmovel #0,%FPSR |clr status bits (Z set) 74*4882a593Smuzhiyun btstb #dz_bit,FPCR_ENABLE(%a6) |test FPCR for dz exc enabled 75*4882a593Smuzhiyun bnes dz_ena 76*4882a593Smuzhiyun| 77*4882a593Smuzhiyun| dz disabled 78*4882a593Smuzhiyun| 79*4882a593Smuzhiyun btstb #sign_bit,ETEMP_EX(%a6) |check sign for neg or pos 80*4882a593Smuzhiyun beqs p_inf |branch if pos sign 81*4882a593Smuzhiyun 82*4882a593Smuzhiyunm_inf: 83*4882a593Smuzhiyun fmovemx mns_inf,%fp0-%fp0 |load -inf 84*4882a593Smuzhiyun bsetb #neg_bit,FPSR_CC(%a6) |set neg bit in FPSR 85*4882a593Smuzhiyun bras set_fpsr 86*4882a593Smuzhiyunp_inf: 87*4882a593Smuzhiyun fmovemx pls_inf,%fp0-%fp0 |load +inf 88*4882a593Smuzhiyunset_fpsr: 89*4882a593Smuzhiyun orl #dzinf_mask,USER_FPSR(%a6) |set I,DZ,ADZ 90*4882a593Smuzhiyun rts 91*4882a593Smuzhiyun| 92*4882a593Smuzhiyun| dz enabled 93*4882a593Smuzhiyun| 94*4882a593Smuzhiyundz_ena: 95*4882a593Smuzhiyun btstb #sign_bit,ETEMP_EX(%a6) |check sign for neg or pos 96*4882a593Smuzhiyun beqs dz_ena_end 97*4882a593Smuzhiyun bsetb #neg_bit,FPSR_CC(%a6) |set neg bit in FPSR 98*4882a593Smuzhiyundz_ena_end: 99*4882a593Smuzhiyun orl #dzinf_mask,USER_FPSR(%a6) |set I,DZ,ADZ 100*4882a593Smuzhiyun st STORE_FLG(%a6) 101*4882a593Smuzhiyun rts 102*4882a593Smuzhiyun| 103*4882a593Smuzhiyun| OPERR exception 104*4882a593Smuzhiyun| 105*4882a593Smuzhiyun| if (operr trap disabled) 106*4882a593Smuzhiyun| set FPSR exception status operr bit, condition code 107*4882a593Smuzhiyun| nan bit; Store default NAN into fp0 108*4882a593Smuzhiyun| frestore the frame into the machine (done by unimp_hd) 109*4882a593Smuzhiyun| 110*4882a593Smuzhiyun| else (operr trap enabled) 111*4882a593Smuzhiyun| set FPSR exception status operr bit, accrued operr bit 112*4882a593Smuzhiyun| set flag to disable sto_res from corrupting fp register 113*4882a593Smuzhiyun| frestore the frame into the machine (done by unimp_hd) 114*4882a593Smuzhiyun| 115*4882a593Smuzhiyunt_operr: 116*4882a593Smuzhiyun orl #opnan_mask,USER_FPSR(%a6) |set NaN, OPERR, AIOP 117*4882a593Smuzhiyun 118*4882a593Smuzhiyun btstb #operr_bit,FPCR_ENABLE(%a6) |test FPCR for operr enabled 119*4882a593Smuzhiyun bnes op_ena 120*4882a593Smuzhiyun 121*4882a593Smuzhiyun fmovemx nan,%fp0-%fp0 |load default nan 122*4882a593Smuzhiyun rts 123*4882a593Smuzhiyunop_ena: 124*4882a593Smuzhiyun st STORE_FLG(%a6) |do not corrupt destination 125*4882a593Smuzhiyun rts 126*4882a593Smuzhiyun 127*4882a593Smuzhiyun| 128*4882a593Smuzhiyun| t_unfl --- UNFL exception 129*4882a593Smuzhiyun| 130*4882a593Smuzhiyun| This entry point is used by all routines requiring unfl, inex2, 131*4882a593Smuzhiyun| aunfl, and ainex to be set on exit. 132*4882a593Smuzhiyun| 133*4882a593Smuzhiyun| On entry, a0 points to the exceptional operand. The final exceptional 134*4882a593Smuzhiyun| operand is built in FP_SCR1 and only the sign from the original operand 135*4882a593Smuzhiyun| is used. 136*4882a593Smuzhiyun| 137*4882a593Smuzhiyunt_unfl: 138*4882a593Smuzhiyun clrl FP_SCR1(%a6) |set exceptional operand to zero 139*4882a593Smuzhiyun clrl FP_SCR1+4(%a6) 140*4882a593Smuzhiyun clrl FP_SCR1+8(%a6) 141*4882a593Smuzhiyun tstb (%a0) |extract sign from caller's exop 142*4882a593Smuzhiyun bpls unfl_signok 143*4882a593Smuzhiyun bset #sign_bit,FP_SCR1(%a6) 144*4882a593Smuzhiyununfl_signok: 145*4882a593Smuzhiyun leal FP_SCR1(%a6),%a0 146*4882a593Smuzhiyun orl #unfinx_mask,USER_FPSR(%a6) 147*4882a593Smuzhiyun| ;set UNFL, INEX2, AUNFL, AINEX 148*4882a593Smuzhiyununfl_con: 149*4882a593Smuzhiyun btstb #unfl_bit,FPCR_ENABLE(%a6) 150*4882a593Smuzhiyun beqs unfl_dis 151*4882a593Smuzhiyun 152*4882a593Smuzhiyununfl_ena: 153*4882a593Smuzhiyun bfclr STAG(%a6){#5:#3} |clear wbtm66,wbtm1,wbtm0 154*4882a593Smuzhiyun bsetb #wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15 155*4882a593Smuzhiyun bsetb #sticky_bit,STICKY(%a6) |set sticky bit 156*4882a593Smuzhiyun 157*4882a593Smuzhiyun bclrb #E1,E_BYTE(%a6) 158*4882a593Smuzhiyun 159*4882a593Smuzhiyununfl_dis: 160*4882a593Smuzhiyun bfextu FPCR_MODE(%a6){#0:#2},%d0 |get round precision 161*4882a593Smuzhiyun 162*4882a593Smuzhiyun bclrb #sign_bit,LOCAL_EX(%a0) 163*4882a593Smuzhiyun sne LOCAL_SGN(%a0) |convert to internal ext format 164*4882a593Smuzhiyun 165*4882a593Smuzhiyun bsr unf_sub |returns IEEE result at a0 166*4882a593Smuzhiyun| ;and sets FPSR_CC accordingly 167*4882a593Smuzhiyun 168*4882a593Smuzhiyun bfclr LOCAL_SGN(%a0){#0:#8} |convert back to IEEE ext format 169*4882a593Smuzhiyun beqs unfl_fin 170*4882a593Smuzhiyun 171*4882a593Smuzhiyun bsetb #sign_bit,LOCAL_EX(%a0) 172*4882a593Smuzhiyun bsetb #sign_bit,FP_SCR1(%a6) |set sign bit of exc operand 173*4882a593Smuzhiyun 174*4882a593Smuzhiyununfl_fin: 175*4882a593Smuzhiyun fmovemx (%a0),%fp0-%fp0 |store result in fp0 176*4882a593Smuzhiyun rts 177*4882a593Smuzhiyun 178*4882a593Smuzhiyun 179*4882a593Smuzhiyun| 180*4882a593Smuzhiyun| t_ovfl2 --- OVFL exception (without inex2 returned) 181*4882a593Smuzhiyun| 182*4882a593Smuzhiyun| This entry is used by scale to force catastrophic overflow. The 183*4882a593Smuzhiyun| ovfl, aovfl, and ainex bits are set, but not the inex2 bit. 184*4882a593Smuzhiyun| 185*4882a593Smuzhiyunt_ovfl2: 186*4882a593Smuzhiyun orl #ovfl_inx_mask,USER_FPSR(%a6) 187*4882a593Smuzhiyun movel ETEMP(%a6),FP_SCR1(%a6) 188*4882a593Smuzhiyun movel ETEMP_HI(%a6),FP_SCR1+4(%a6) 189*4882a593Smuzhiyun movel ETEMP_LO(%a6),FP_SCR1+8(%a6) 190*4882a593Smuzhiyun| 191*4882a593Smuzhiyun| Check for single or double round precision. If single, check if 192*4882a593Smuzhiyun| the lower 40 bits of ETEMP are zero; if not, set inex2. If double, 193*4882a593Smuzhiyun| check if the lower 21 bits are zero; if not, set inex2. 194*4882a593Smuzhiyun| 195*4882a593Smuzhiyun moveb FPCR_MODE(%a6),%d0 196*4882a593Smuzhiyun andib #0xc0,%d0 197*4882a593Smuzhiyun beq t_work |if extended, finish ovfl processing 198*4882a593Smuzhiyun cmpib #0x40,%d0 |test for single 199*4882a593Smuzhiyun bnes t_dbl 200*4882a593Smuzhiyunt_sgl: 201*4882a593Smuzhiyun tstb ETEMP_LO(%a6) 202*4882a593Smuzhiyun bnes t_setinx2 203*4882a593Smuzhiyun movel ETEMP_HI(%a6),%d0 204*4882a593Smuzhiyun andil #0xff,%d0 |look at only lower 8 bits 205*4882a593Smuzhiyun bnes t_setinx2 206*4882a593Smuzhiyun bra t_work 207*4882a593Smuzhiyunt_dbl: 208*4882a593Smuzhiyun movel ETEMP_LO(%a6),%d0 209*4882a593Smuzhiyun andil #0x7ff,%d0 |look at only lower 11 bits 210*4882a593Smuzhiyun beq t_work 211*4882a593Smuzhiyunt_setinx2: 212*4882a593Smuzhiyun orl #inex2_mask,USER_FPSR(%a6) 213*4882a593Smuzhiyun bras t_work 214*4882a593Smuzhiyun| 215*4882a593Smuzhiyun| t_ovfl --- OVFL exception 216*4882a593Smuzhiyun| 217*4882a593Smuzhiyun|** Note: the exc operand is returned in ETEMP. 218*4882a593Smuzhiyun| 219*4882a593Smuzhiyunt_ovfl: 220*4882a593Smuzhiyun orl #ovfinx_mask,USER_FPSR(%a6) 221*4882a593Smuzhiyunt_work: 222*4882a593Smuzhiyun btstb #ovfl_bit,FPCR_ENABLE(%a6) |test FPCR for ovfl enabled 223*4882a593Smuzhiyun beqs ovf_dis 224*4882a593Smuzhiyun 225*4882a593Smuzhiyunovf_ena: 226*4882a593Smuzhiyun clrl FP_SCR1(%a6) |set exceptional operand 227*4882a593Smuzhiyun clrl FP_SCR1+4(%a6) 228*4882a593Smuzhiyun clrl FP_SCR1+8(%a6) 229*4882a593Smuzhiyun 230*4882a593Smuzhiyun bfclr STAG(%a6){#5:#3} |clear wbtm66,wbtm1,wbtm0 231*4882a593Smuzhiyun bclrb #wbtemp15_bit,WB_BYTE(%a6) |clear wbtemp15 232*4882a593Smuzhiyun bsetb #sticky_bit,STICKY(%a6) |set sticky bit 233*4882a593Smuzhiyun 234*4882a593Smuzhiyun bclrb #E1,E_BYTE(%a6) 235*4882a593Smuzhiyun| ;fall through to disabled case 236*4882a593Smuzhiyun 237*4882a593Smuzhiyun| For disabled overflow call 'ovf_r_k'. This routine loads the 238*4882a593Smuzhiyun| correct result based on the rounding precision, destination 239*4882a593Smuzhiyun| format, rounding mode and sign. 240*4882a593Smuzhiyun| 241*4882a593Smuzhiyunovf_dis: 242*4882a593Smuzhiyun bsr ovf_r_k |returns unsigned ETEMP_EX 243*4882a593Smuzhiyun| ;and sets FPSR_CC accordingly. 244*4882a593Smuzhiyun bfclr ETEMP_SGN(%a6){#0:#8} |fix sign 245*4882a593Smuzhiyun beqs ovf_pos 246*4882a593Smuzhiyun bsetb #sign_bit,ETEMP_EX(%a6) 247*4882a593Smuzhiyun bsetb #sign_bit,FP_SCR1(%a6) |set exceptional operand sign 248*4882a593Smuzhiyunovf_pos: 249*4882a593Smuzhiyun fmovemx ETEMP(%a6),%fp0-%fp0 |move the result to fp0 250*4882a593Smuzhiyun rts 251*4882a593Smuzhiyun 252*4882a593Smuzhiyun 253*4882a593Smuzhiyun| 254*4882a593Smuzhiyun| INEX2 exception 255*4882a593Smuzhiyun| 256*4882a593Smuzhiyun| The inex2 and ainex bits are set. 257*4882a593Smuzhiyun| 258*4882a593Smuzhiyunt_inx2: 259*4882a593Smuzhiyun orl #inx2a_mask,USER_FPSR(%a6) |set INEX2, AINEX 260*4882a593Smuzhiyun rts 261*4882a593Smuzhiyun 262*4882a593Smuzhiyun| 263*4882a593Smuzhiyun| Force Inex2 264*4882a593Smuzhiyun| 265*4882a593Smuzhiyun| This routine is called by the transcendental routines to force 266*4882a593Smuzhiyun| the inex2 exception bits set in the FPSR. If the underflow bit 267*4882a593Smuzhiyun| is set, but the underflow trap was not taken, the aunfl bit in 268*4882a593Smuzhiyun| the FPSR must be set. 269*4882a593Smuzhiyun| 270*4882a593Smuzhiyunt_frcinx: 271*4882a593Smuzhiyun orl #inx2a_mask,USER_FPSR(%a6) |set INEX2, AINEX 272*4882a593Smuzhiyun btstb #unfl_bit,FPSR_EXCEPT(%a6) |test for unfl bit set 273*4882a593Smuzhiyun beqs no_uacc1 |if clear, do not set aunfl 274*4882a593Smuzhiyun bsetb #aunfl_bit,FPSR_AEXCEPT(%a6) 275*4882a593Smuzhiyunno_uacc1: 276*4882a593Smuzhiyun rts 277*4882a593Smuzhiyun 278*4882a593Smuzhiyun| 279*4882a593Smuzhiyun| DST_NAN 280*4882a593Smuzhiyun| 281*4882a593Smuzhiyun| Determine if the destination nan is signalling or non-signalling, 282*4882a593Smuzhiyun| and set the FPSR bits accordingly. See the MC68040 User's Manual 283*4882a593Smuzhiyun| section 3.2.2.5 NOT-A-NUMBERS. 284*4882a593Smuzhiyun| 285*4882a593Smuzhiyundst_nan: 286*4882a593Smuzhiyun btstb #sign_bit,FPTEMP_EX(%a6) |test sign of nan 287*4882a593Smuzhiyun beqs dst_pos |if clr, it was positive 288*4882a593Smuzhiyun bsetb #neg_bit,FPSR_CC(%a6) |set N bit 289*4882a593Smuzhiyundst_pos: 290*4882a593Smuzhiyun btstb #signan_bit,FPTEMP_HI(%a6) |check if signalling 291*4882a593Smuzhiyun beqs dst_snan |branch if signalling 292*4882a593Smuzhiyun 293*4882a593Smuzhiyun fmovel %d1,%fpcr |restore user's rmode/prec 294*4882a593Smuzhiyun fmovex FPTEMP(%a6),%fp0 |return the non-signalling nan 295*4882a593Smuzhiyun| 296*4882a593Smuzhiyun| Check the source nan. If it is signalling, snan will be reported. 297*4882a593Smuzhiyun| 298*4882a593Smuzhiyun moveb STAG(%a6),%d0 299*4882a593Smuzhiyun andib #0xe0,%d0 300*4882a593Smuzhiyun cmpib #0x60,%d0 301*4882a593Smuzhiyun bnes no_snan 302*4882a593Smuzhiyun btstb #signan_bit,ETEMP_HI(%a6) |check if signalling 303*4882a593Smuzhiyun bnes no_snan 304*4882a593Smuzhiyun orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP 305*4882a593Smuzhiyunno_snan: 306*4882a593Smuzhiyun rts 307*4882a593Smuzhiyun 308*4882a593Smuzhiyundst_snan: 309*4882a593Smuzhiyun btstb #snan_bit,FPCR_ENABLE(%a6) |check if trap enabled 310*4882a593Smuzhiyun beqs dst_dis |branch if disabled 311*4882a593Smuzhiyun 312*4882a593Smuzhiyun orb #nan_tag,DTAG(%a6) |set up dtag for nan 313*4882a593Smuzhiyun st STORE_FLG(%a6) |do not store a result 314*4882a593Smuzhiyun orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP 315*4882a593Smuzhiyun rts 316*4882a593Smuzhiyun 317*4882a593Smuzhiyundst_dis: 318*4882a593Smuzhiyun bsetb #signan_bit,FPTEMP_HI(%a6) |set SNAN bit in sop 319*4882a593Smuzhiyun fmovel %d1,%fpcr |restore user's rmode/prec 320*4882a593Smuzhiyun fmovex FPTEMP(%a6),%fp0 |load non-sign. nan 321*4882a593Smuzhiyun orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP 322*4882a593Smuzhiyun rts 323*4882a593Smuzhiyun 324*4882a593Smuzhiyun| 325*4882a593Smuzhiyun| SRC_NAN 326*4882a593Smuzhiyun| 327*4882a593Smuzhiyun| Determine if the source nan is signalling or non-signalling, 328*4882a593Smuzhiyun| and set the FPSR bits accordingly. See the MC68040 User's Manual 329*4882a593Smuzhiyun| section 3.2.2.5 NOT-A-NUMBERS. 330*4882a593Smuzhiyun| 331*4882a593Smuzhiyunsrc_nan: 332*4882a593Smuzhiyun btstb #sign_bit,ETEMP_EX(%a6) |test sign of nan 333*4882a593Smuzhiyun beqs src_pos |if clr, it was positive 334*4882a593Smuzhiyun bsetb #neg_bit,FPSR_CC(%a6) |set N bit 335*4882a593Smuzhiyunsrc_pos: 336*4882a593Smuzhiyun btstb #signan_bit,ETEMP_HI(%a6) |check if signalling 337*4882a593Smuzhiyun beqs src_snan |branch if signalling 338*4882a593Smuzhiyun fmovel %d1,%fpcr |restore user's rmode/prec 339*4882a593Smuzhiyun fmovex ETEMP(%a6),%fp0 |return the non-signalling nan 340*4882a593Smuzhiyun rts 341*4882a593Smuzhiyun 342*4882a593Smuzhiyunsrc_snan: 343*4882a593Smuzhiyun btstb #snan_bit,FPCR_ENABLE(%a6) |check if trap enabled 344*4882a593Smuzhiyun beqs src_dis |branch if disabled 345*4882a593Smuzhiyun bsetb #signan_bit,ETEMP_HI(%a6) |set SNAN bit in sop 346*4882a593Smuzhiyun orb #norm_tag,DTAG(%a6) |set up dtag for norm 347*4882a593Smuzhiyun orb #nan_tag,STAG(%a6) |set up stag for nan 348*4882a593Smuzhiyun st STORE_FLG(%a6) |do not store a result 349*4882a593Smuzhiyun orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP 350*4882a593Smuzhiyun rts 351*4882a593Smuzhiyun 352*4882a593Smuzhiyunsrc_dis: 353*4882a593Smuzhiyun bsetb #signan_bit,ETEMP_HI(%a6) |set SNAN bit in sop 354*4882a593Smuzhiyun fmovel %d1,%fpcr |restore user's rmode/prec 355*4882a593Smuzhiyun fmovex ETEMP(%a6),%fp0 |load non-sign. nan 356*4882a593Smuzhiyun orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP 357*4882a593Smuzhiyun rts 358*4882a593Smuzhiyun 359*4882a593Smuzhiyun| 360*4882a593Smuzhiyun| For all functions that have a denormalized input and that f(x)=x, 361*4882a593Smuzhiyun| this is the entry point 362*4882a593Smuzhiyun| 363*4882a593Smuzhiyunt_extdnrm: 364*4882a593Smuzhiyun orl #unfinx_mask,USER_FPSR(%a6) 365*4882a593Smuzhiyun| ;set UNFL, INEX2, AUNFL, AINEX 366*4882a593Smuzhiyun bras xdnrm_con 367*4882a593Smuzhiyun| 368*4882a593Smuzhiyun| Entry point for scale with extended denorm. The function does 369*4882a593Smuzhiyun| not set inex2, aunfl, or ainex. 370*4882a593Smuzhiyun| 371*4882a593Smuzhiyunt_resdnrm: 372*4882a593Smuzhiyun orl #unfl_mask,USER_FPSR(%a6) 373*4882a593Smuzhiyun 374*4882a593Smuzhiyunxdnrm_con: 375*4882a593Smuzhiyun btstb #unfl_bit,FPCR_ENABLE(%a6) 376*4882a593Smuzhiyun beqs xdnrm_dis 377*4882a593Smuzhiyun 378*4882a593Smuzhiyun| 379*4882a593Smuzhiyun| If exceptions are enabled, the additional task of setting up WBTEMP 380*4882a593Smuzhiyun| is needed so that when the underflow exception handler is entered, 381*4882a593Smuzhiyun| the user perceives no difference between what the 040 provides vs. 382*4882a593Smuzhiyun| what the FPSP provides. 383*4882a593Smuzhiyun| 384*4882a593Smuzhiyunxdnrm_ena: 385*4882a593Smuzhiyun movel %a0,-(%a7) 386*4882a593Smuzhiyun 387*4882a593Smuzhiyun movel LOCAL_EX(%a0),FP_SCR1(%a6) 388*4882a593Smuzhiyun movel LOCAL_HI(%a0),FP_SCR1+4(%a6) 389*4882a593Smuzhiyun movel LOCAL_LO(%a0),FP_SCR1+8(%a6) 390*4882a593Smuzhiyun 391*4882a593Smuzhiyun lea FP_SCR1(%a6),%a0 392*4882a593Smuzhiyun 393*4882a593Smuzhiyun bclrb #sign_bit,LOCAL_EX(%a0) 394*4882a593Smuzhiyun sne LOCAL_SGN(%a0) |convert to internal ext format 395*4882a593Smuzhiyun tstw LOCAL_EX(%a0) |check if input is denorm 396*4882a593Smuzhiyun beqs xdnrm_dn |if so, skip nrm_set 397*4882a593Smuzhiyun bsr nrm_set |normalize the result (exponent 398*4882a593Smuzhiyun| ;will be negative 399*4882a593Smuzhiyunxdnrm_dn: 400*4882a593Smuzhiyun bclrb #sign_bit,LOCAL_EX(%a0) |take off false sign 401*4882a593Smuzhiyun bfclr LOCAL_SGN(%a0){#0:#8} |change back to IEEE ext format 402*4882a593Smuzhiyun beqs xdep 403*4882a593Smuzhiyun bsetb #sign_bit,LOCAL_EX(%a0) 404*4882a593Smuzhiyunxdep: 405*4882a593Smuzhiyun bfclr STAG(%a6){#5:#3} |clear wbtm66,wbtm1,wbtm0 406*4882a593Smuzhiyun bsetb #wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15 407*4882a593Smuzhiyun bclrb #sticky_bit,STICKY(%a6) |clear sticky bit 408*4882a593Smuzhiyun bclrb #E1,E_BYTE(%a6) 409*4882a593Smuzhiyun movel (%a7)+,%a0 410*4882a593Smuzhiyunxdnrm_dis: 411*4882a593Smuzhiyun bfextu FPCR_MODE(%a6){#0:#2},%d0 |get round precision 412*4882a593Smuzhiyun bnes not_ext |if not round extended, store 413*4882a593Smuzhiyun| ;IEEE defaults 414*4882a593Smuzhiyunis_ext: 415*4882a593Smuzhiyun btstb #sign_bit,LOCAL_EX(%a0) 416*4882a593Smuzhiyun beqs xdnrm_store 417*4882a593Smuzhiyun 418*4882a593Smuzhiyun bsetb #neg_bit,FPSR_CC(%a6) |set N bit in FPSR_CC 419*4882a593Smuzhiyun 420*4882a593Smuzhiyun bras xdnrm_store 421*4882a593Smuzhiyun 422*4882a593Smuzhiyunnot_ext: 423*4882a593Smuzhiyun bclrb #sign_bit,LOCAL_EX(%a0) 424*4882a593Smuzhiyun sne LOCAL_SGN(%a0) |convert to internal ext format 425*4882a593Smuzhiyun bsr unf_sub |returns IEEE result pointed by 426*4882a593Smuzhiyun| ;a0; sets FPSR_CC accordingly 427*4882a593Smuzhiyun bfclr LOCAL_SGN(%a0){#0:#8} |convert back to IEEE ext format 428*4882a593Smuzhiyun beqs xdnrm_store 429*4882a593Smuzhiyun bsetb #sign_bit,LOCAL_EX(%a0) 430*4882a593Smuzhiyunxdnrm_store: 431*4882a593Smuzhiyun fmovemx (%a0),%fp0-%fp0 |store result in fp0 432*4882a593Smuzhiyun rts 433*4882a593Smuzhiyun 434*4882a593Smuzhiyun| 435*4882a593Smuzhiyun| This subroutine is used for dyadic operations that use an extended 436*4882a593Smuzhiyun| denorm within the kernel. The approach used is to capture the frame, 437*4882a593Smuzhiyun| fix/restore. 438*4882a593Smuzhiyun| 439*4882a593Smuzhiyun .global t_avoid_unsupp 440*4882a593Smuzhiyunt_avoid_unsupp: 441*4882a593Smuzhiyun link %a2,#-LOCAL_SIZE |so that a2 fpsp.h negative 442*4882a593Smuzhiyun| ;offsets may be used 443*4882a593Smuzhiyun fsave -(%a7) 444*4882a593Smuzhiyun tstb 1(%a7) |check if idle, exit if so 445*4882a593Smuzhiyun beq idle_end 446*4882a593Smuzhiyun btstb #E1,E_BYTE(%a2) |check for an E1 exception if 447*4882a593Smuzhiyun| ;enabled, there is an unsupp 448*4882a593Smuzhiyun beq end_avun |else, exit 449*4882a593Smuzhiyun btstb #7,DTAG(%a2) |check for denorm destination 450*4882a593Smuzhiyun beqs src_den |else, must be a source denorm 451*4882a593Smuzhiyun| 452*4882a593Smuzhiyun| handle destination denorm 453*4882a593Smuzhiyun| 454*4882a593Smuzhiyun lea FPTEMP(%a2),%a0 455*4882a593Smuzhiyun btstb #sign_bit,LOCAL_EX(%a0) 456*4882a593Smuzhiyun sne LOCAL_SGN(%a0) |convert to internal ext format 457*4882a593Smuzhiyun bclrb #7,DTAG(%a2) |set DTAG to norm 458*4882a593Smuzhiyun bsr nrm_set |normalize result, exponent 459*4882a593Smuzhiyun| ;will become negative 460*4882a593Smuzhiyun bclrb #sign_bit,LOCAL_EX(%a0) |get rid of fake sign 461*4882a593Smuzhiyun bfclr LOCAL_SGN(%a0){#0:#8} |convert back to IEEE ext format 462*4882a593Smuzhiyun beqs ck_src_den |check if source is also denorm 463*4882a593Smuzhiyun bsetb #sign_bit,LOCAL_EX(%a0) 464*4882a593Smuzhiyunck_src_den: 465*4882a593Smuzhiyun btstb #7,STAG(%a2) 466*4882a593Smuzhiyun beqs end_avun 467*4882a593Smuzhiyunsrc_den: 468*4882a593Smuzhiyun lea ETEMP(%a2),%a0 469*4882a593Smuzhiyun btstb #sign_bit,LOCAL_EX(%a0) 470*4882a593Smuzhiyun sne LOCAL_SGN(%a0) |convert to internal ext format 471*4882a593Smuzhiyun bclrb #7,STAG(%a2) |set STAG to norm 472*4882a593Smuzhiyun bsr nrm_set |normalize result, exponent 473*4882a593Smuzhiyun| ;will become negative 474*4882a593Smuzhiyun bclrb #sign_bit,LOCAL_EX(%a0) |get rid of fake sign 475*4882a593Smuzhiyun bfclr LOCAL_SGN(%a0){#0:#8} |convert back to IEEE ext format 476*4882a593Smuzhiyun beqs den_com 477*4882a593Smuzhiyun bsetb #sign_bit,LOCAL_EX(%a0) 478*4882a593Smuzhiyunden_com: 479*4882a593Smuzhiyun moveb #0xfe,CU_SAVEPC(%a2) |set continue frame 480*4882a593Smuzhiyun clrw NMNEXC(%a2) |clear NMNEXC 481*4882a593Smuzhiyun bclrb #E1,E_BYTE(%a2) 482*4882a593Smuzhiyun| fmove.l %FPSR,FPSR_SHADOW(%a2) 483*4882a593Smuzhiyun| bset.b #SFLAG,E_BYTE(%a2) 484*4882a593Smuzhiyun| bset.b #XFLAG,T_BYTE(%a2) 485*4882a593Smuzhiyunend_avun: 486*4882a593Smuzhiyun frestore (%a7)+ 487*4882a593Smuzhiyun unlk %a2 488*4882a593Smuzhiyun rts 489*4882a593Smuzhiyunidle_end: 490*4882a593Smuzhiyun addl #4,%a7 491*4882a593Smuzhiyun unlk %a2 492*4882a593Smuzhiyun rts 493*4882a593Smuzhiyun |end 494