xref: /optee_os/lib/libutils/isoc/arch/arm/softfloat/source/extF80_rem.c (revision 1bb929836182ecb96d2d9d268daa807c67596396)
1*1bb92983SJerome Forissier // SPDX-License-Identifier: BSD-3-Clause
29403c583SJens Wiklander 
39403c583SJens Wiklander /*============================================================================
49403c583SJens Wiklander 
59403c583SJens Wiklander This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic
69403c583SJens Wiklander Package, Release 3a, by John R. Hauser.
79403c583SJens Wiklander 
89403c583SJens Wiklander Copyright 2011, 2012, 2013, 2014 The Regents of the University of California.
99403c583SJens Wiklander All rights reserved.
109403c583SJens Wiklander 
119403c583SJens Wiklander Redistribution and use in source and binary forms, with or without
129403c583SJens Wiklander modification, are permitted provided that the following conditions are met:
139403c583SJens Wiklander 
149403c583SJens Wiklander  1. Redistributions of source code must retain the above copyright notice,
159403c583SJens Wiklander     this list of conditions, and the following disclaimer.
169403c583SJens Wiklander 
179403c583SJens Wiklander  2. Redistributions in binary form must reproduce the above copyright notice,
189403c583SJens Wiklander     this list of conditions, and the following disclaimer in the documentation
199403c583SJens Wiklander     and/or other materials provided with the distribution.
209403c583SJens Wiklander 
219403c583SJens Wiklander  3. Neither the name of the University nor the names of its contributors may
229403c583SJens Wiklander     be used to endorse or promote products derived from this software without
239403c583SJens Wiklander     specific prior written permission.
249403c583SJens Wiklander 
259403c583SJens Wiklander THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY
269403c583SJens Wiklander EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
279403c583SJens Wiklander WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE
289403c583SJens Wiklander DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
299403c583SJens Wiklander DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
309403c583SJens Wiklander (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
319403c583SJens Wiklander LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
329403c583SJens Wiklander ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
339403c583SJens Wiklander (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
349403c583SJens Wiklander SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
359403c583SJens Wiklander 
369403c583SJens Wiklander =============================================================================*/
379403c583SJens Wiklander 
389403c583SJens Wiklander #include <stdbool.h>
399403c583SJens Wiklander #include <stdint.h>
409403c583SJens Wiklander #include "platform.h"
419403c583SJens Wiklander #include "internals.h"
429403c583SJens Wiklander #include "specialize.h"
439403c583SJens Wiklander #include "softfloat.h"
449403c583SJens Wiklander 
extF80_rem(extFloat80_t a,extFloat80_t b)459403c583SJens Wiklander extFloat80_t extF80_rem( extFloat80_t a, extFloat80_t b )
469403c583SJens Wiklander {
479403c583SJens Wiklander     union { struct extFloat80M s; extFloat80_t f; } uA;
489403c583SJens Wiklander     uint_fast16_t uiA64;
499403c583SJens Wiklander     uint_fast64_t uiA0;
509403c583SJens Wiklander     bool signA;
519403c583SJens Wiklander     int_fast32_t expA;
529403c583SJens Wiklander     uint_fast64_t sigA;
539403c583SJens Wiklander     union { struct extFloat80M s; extFloat80_t f; } uB;
549403c583SJens Wiklander     uint_fast16_t uiB64;
559403c583SJens Wiklander     uint_fast64_t uiB0;
569403c583SJens Wiklander     bool signB;
579403c583SJens Wiklander     int_fast32_t expB;
589403c583SJens Wiklander     uint_fast64_t sigB;
599403c583SJens Wiklander     struct exp32_sig64 normExpSig;
609403c583SJens Wiklander     int_fast32_t expDiff;
619403c583SJens Wiklander     struct uint128 rem, shiftedSigB;
629403c583SJens Wiklander     uint_fast32_t q, recip32;
639403c583SJens Wiklander     uint_fast64_t q64;
649403c583SJens Wiklander     struct uint128 term, altRem, meanRem;
659403c583SJens Wiklander     bool signRem;
669403c583SJens Wiklander     struct uint128 uiZ;
679403c583SJens Wiklander     uint_fast16_t uiZ64;
689403c583SJens Wiklander     uint_fast64_t uiZ0;
699403c583SJens Wiklander     union { struct extFloat80M s; extFloat80_t f; } uZ;
709403c583SJens Wiklander 
719403c583SJens Wiklander     /*------------------------------------------------------------------------
729403c583SJens Wiklander     *------------------------------------------------------------------------*/
739403c583SJens Wiklander     uA.f = a;
749403c583SJens Wiklander     uiA64 = uA.s.signExp;
759403c583SJens Wiklander     uiA0  = uA.s.signif;
769403c583SJens Wiklander     signA = signExtF80UI64( uiA64 );
779403c583SJens Wiklander     expA  = expExtF80UI64( uiA64 );
789403c583SJens Wiklander     sigA  = uiA0;
799403c583SJens Wiklander     uB.f = b;
809403c583SJens Wiklander     uiB64 = uB.s.signExp;
819403c583SJens Wiklander     uiB0  = uB.s.signif;
829403c583SJens Wiklander     signB = signExtF80UI64( uiB64 );
839403c583SJens Wiklander     expB  = expExtF80UI64( uiB64 );
849403c583SJens Wiklander     sigB  = uiB0;
859403c583SJens Wiklander     /*------------------------------------------------------------------------
869403c583SJens Wiklander     *------------------------------------------------------------------------*/
879403c583SJens Wiklander     if ( expA == 0x7FFF ) {
889403c583SJens Wiklander         if (
899403c583SJens Wiklander                (sigA & UINT64_C( 0x7FFFFFFFFFFFFFFF ))
909403c583SJens Wiklander             || ((expB == 0x7FFF) && (sigB & UINT64_C( 0x7FFFFFFFFFFFFFFF )))
919403c583SJens Wiklander         ) {
929403c583SJens Wiklander             goto propagateNaN;
939403c583SJens Wiklander         }
949403c583SJens Wiklander         goto invalid;
959403c583SJens Wiklander     }
969403c583SJens Wiklander     if ( expB == 0x7FFF ) {
979403c583SJens Wiklander         if ( sigB & UINT64_C( 0x7FFFFFFFFFFFFFFF ) ) goto propagateNaN;
989403c583SJens Wiklander         /*--------------------------------------------------------------------
999403c583SJens Wiklander         | Argument b is an infinity.  Doubling `expB' is an easy way to ensure
1009403c583SJens Wiklander         | that `expDiff' later is less than -1, which will result in returning
1019403c583SJens Wiklander         | a canonicalized version of argument a.
1029403c583SJens Wiklander         *--------------------------------------------------------------------*/
1039403c583SJens Wiklander         expB += expB;
1049403c583SJens Wiklander     }
1059403c583SJens Wiklander     /*------------------------------------------------------------------------
1069403c583SJens Wiklander     *------------------------------------------------------------------------*/
1079403c583SJens Wiklander     if ( ! expB ) expB = 1;
1089403c583SJens Wiklander     if ( ! (sigB & UINT64_C( 0x8000000000000000 )) ) {
1099403c583SJens Wiklander         if ( ! sigB ) goto invalid;
1109403c583SJens Wiklander         normExpSig = softfloat_normSubnormalExtF80Sig( sigB );
1119403c583SJens Wiklander         expB += normExpSig.exp;
1129403c583SJens Wiklander         sigB = normExpSig.sig;
1139403c583SJens Wiklander     }
1149403c583SJens Wiklander     if ( ! expA ) expA = 1;
1159403c583SJens Wiklander     if ( ! (sigA & UINT64_C( 0x8000000000000000 )) ) {
1169403c583SJens Wiklander         if ( ! sigA ) {
1179403c583SJens Wiklander             expA = 0;
1189403c583SJens Wiklander             goto copyA;
1199403c583SJens Wiklander         }
1209403c583SJens Wiklander         normExpSig = softfloat_normSubnormalExtF80Sig( sigA );
1219403c583SJens Wiklander         expA += normExpSig.exp;
1229403c583SJens Wiklander         sigA = normExpSig.sig;
1239403c583SJens Wiklander     }
1249403c583SJens Wiklander     /*------------------------------------------------------------------------
1259403c583SJens Wiklander     *------------------------------------------------------------------------*/
1269403c583SJens Wiklander     expDiff = expA - expB;
1279403c583SJens Wiklander     if ( expDiff < -1 ) goto copyA;
1289403c583SJens Wiklander     rem = softfloat_shortShiftLeft128( 0, sigA, 32 );
1299403c583SJens Wiklander     shiftedSigB = softfloat_shortShiftLeft128( 0, sigB, 32 );
1309403c583SJens Wiklander     if ( expDiff < 1 ) {
1319403c583SJens Wiklander         if ( expDiff ) {
1329403c583SJens Wiklander             --expB;
1339403c583SJens Wiklander             shiftedSigB = softfloat_shortShiftLeft128( 0, sigB, 33 );
1349403c583SJens Wiklander             q = 0;
1359403c583SJens Wiklander         } else {
1369403c583SJens Wiklander             q = (sigB <= sigA);
1379403c583SJens Wiklander             if ( q ) {
1389403c583SJens Wiklander                 rem =
1399403c583SJens Wiklander                     softfloat_sub128(
1409403c583SJens Wiklander                         rem.v64, rem.v0, shiftedSigB.v64, shiftedSigB.v0 );
1419403c583SJens Wiklander             }
1429403c583SJens Wiklander         }
1439403c583SJens Wiklander     } else {
1449403c583SJens Wiklander         recip32 = softfloat_approxRecip32_1( sigB>>32 );
1459403c583SJens Wiklander         expDiff -= 30;
1469403c583SJens Wiklander         for (;;) {
1479403c583SJens Wiklander             q64 = (uint_fast64_t) (uint32_t) (rem.v64>>2) * recip32;
1489403c583SJens Wiklander             if ( expDiff < 0 ) break;
1499403c583SJens Wiklander             q = (q64 + 0x80000000)>>32;
1509403c583SJens Wiklander             rem = softfloat_shortShiftLeft128( rem.v64, rem.v0, 29 );
1519403c583SJens Wiklander             term = softfloat_mul64ByShifted32To128( sigB, q );
1529403c583SJens Wiklander             rem = softfloat_sub128( rem.v64, rem.v0, term.v64, term.v0 );
1539403c583SJens Wiklander             if ( rem.v64 & UINT64_C( 0x8000000000000000 ) ) {
1549403c583SJens Wiklander                 rem =
1559403c583SJens Wiklander                     softfloat_add128(
1569403c583SJens Wiklander                         rem.v64, rem.v0, shiftedSigB.v64, shiftedSigB.v0 );
1579403c583SJens Wiklander             }
1589403c583SJens Wiklander             expDiff -= 29;
1599403c583SJens Wiklander         }
1609403c583SJens Wiklander         /*--------------------------------------------------------------------
1619403c583SJens Wiklander         | (`expDiff' cannot be less than -29 here.)
1629403c583SJens Wiklander         *--------------------------------------------------------------------*/
1639403c583SJens Wiklander         q = (uint32_t) (q64>>32)>>(~expDiff & 31);
1649403c583SJens Wiklander         rem = softfloat_shortShiftLeft128( rem.v64, rem.v0, expDiff + 30 );
1659403c583SJens Wiklander         term = softfloat_mul64ByShifted32To128( sigB, q );
1669403c583SJens Wiklander         rem = softfloat_sub128( rem.v64, rem.v0, term.v64, term.v0 );
1679403c583SJens Wiklander         if ( rem.v64 & UINT64_C( 0x8000000000000000 ) ) {
1689403c583SJens Wiklander             altRem =
1699403c583SJens Wiklander                 softfloat_add128(
1709403c583SJens Wiklander                     rem.v64, rem.v0, shiftedSigB.v64, shiftedSigB.v0 );
1719403c583SJens Wiklander             goto selectRem;
1729403c583SJens Wiklander         }
1739403c583SJens Wiklander     }
1749403c583SJens Wiklander     /*------------------------------------------------------------------------
1759403c583SJens Wiklander     *------------------------------------------------------------------------*/
1769403c583SJens Wiklander     do {
1779403c583SJens Wiklander         altRem = rem;
1789403c583SJens Wiklander         ++q;
1799403c583SJens Wiklander         rem =
1809403c583SJens Wiklander             softfloat_sub128(
1819403c583SJens Wiklander                 rem.v64, rem.v0, shiftedSigB.v64, shiftedSigB.v0 );
1829403c583SJens Wiklander     } while ( ! (rem.v64 & UINT64_C( 0x8000000000000000 )) );
1839403c583SJens Wiklander  selectRem:
1849403c583SJens Wiklander     meanRem = softfloat_add128( rem.v64, rem.v0, altRem.v64, altRem.v0 );
1859403c583SJens Wiklander     if (
1869403c583SJens Wiklander         (meanRem.v64 & UINT64_C( 0x8000000000000000 ))
1879403c583SJens Wiklander             || (! (meanRem.v64 | meanRem.v0) && (q & 1))
1889403c583SJens Wiklander     ) {
1899403c583SJens Wiklander         rem = altRem;
1909403c583SJens Wiklander     }
1919403c583SJens Wiklander     signRem = signA;
1929403c583SJens Wiklander     if ( rem.v64 & UINT64_C( 0x8000000000000000 ) ) {
1939403c583SJens Wiklander         signRem = ! signRem;
1949403c583SJens Wiklander         rem = softfloat_sub128( 0, 0, rem.v64, rem.v0 );
1959403c583SJens Wiklander     }
1969403c583SJens Wiklander     return
1979403c583SJens Wiklander         softfloat_normRoundPackToExtF80(
1989403c583SJens Wiklander             signRem, expB + 32, rem.v64, rem.v0, 80 );
1999403c583SJens Wiklander     /*------------------------------------------------------------------------
2009403c583SJens Wiklander     *------------------------------------------------------------------------*/
2019403c583SJens Wiklander  propagateNaN:
2029403c583SJens Wiklander     uiZ = softfloat_propagateNaNExtF80UI( uiA64, uiA0, uiB64, uiB0 );
2039403c583SJens Wiklander     uiZ64 = uiZ.v64;
2049403c583SJens Wiklander     uiZ0  = uiZ.v0;
2059403c583SJens Wiklander     goto uiZ;
2069403c583SJens Wiklander     /*------------------------------------------------------------------------
2079403c583SJens Wiklander     *------------------------------------------------------------------------*/
2089403c583SJens Wiklander  invalid:
2099403c583SJens Wiklander     softfloat_raiseFlags( softfloat_flag_invalid );
2109403c583SJens Wiklander     uiZ64 = defaultNaNExtF80UI64;
2119403c583SJens Wiklander     uiZ0  = defaultNaNExtF80UI0;
2129403c583SJens Wiklander     goto uiZ;
2139403c583SJens Wiklander     /*------------------------------------------------------------------------
2149403c583SJens Wiklander     *------------------------------------------------------------------------*/
2159403c583SJens Wiklander  copyA:
2169403c583SJens Wiklander     if ( expA < 1 ) {
2179403c583SJens Wiklander         sigA >>= 1 - expA;
2189403c583SJens Wiklander         expA = 0;
2199403c583SJens Wiklander     }
2209403c583SJens Wiklander     uiZ64 = packToExtF80UI64( signA, expA );
2219403c583SJens Wiklander     uiZ0  = sigA;
2229403c583SJens Wiklander  uiZ:
2239403c583SJens Wiklander     uZ.s.signExp = uiZ64;
2249403c583SJens Wiklander     uZ.s.signif  = uiZ0;
2259403c583SJens Wiklander     return uZ.f;
2269403c583SJens Wiklander 
2279403c583SJens Wiklander }
2289403c583SJens Wiklander 
229