// SPDX-License-Identifier: BSD-3-Clause

/*============================================================================

This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic
Package, Release 3a, by John R. Hauser.

Copyright 2011, 2012, 2013, 2014 The Regents of the University of California.
All rights reserved.

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:

 1. Redistributions of source code must retain the above copyright notice,
    this list of conditions, and the following disclaimer.

 2. Redistributions in binary form must reproduce the above copyright notice,
    this list of conditions, and the following disclaimer in the documentation
    and/or other materials provided with the distribution.

 3. Neither the name of the University nor the names of its contributors may
    be used to endorse or promote products derived from this software without
    specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY
EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE
DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

=============================================================================*/
379403c583SJens Wiklander
389403c583SJens Wiklander #include <stdbool.h>
399403c583SJens Wiklander #include <stdint.h>
409403c583SJens Wiklander #include "platform.h"
419403c583SJens Wiklander #include "internals.h"
429403c583SJens Wiklander #include "specialize.h"
439403c583SJens Wiklander #include "softfloat.h"
449403c583SJens Wiklander
/*----------------------------------------------------------------------------
| Returns the quotient `a' / `b' of two 128-bit floating-point values.
|
| Special cases, as decided by the code below:
|   - either operand NaN          -> result of softfloat_propagateNaNF128UI
|   - infinity / infinity, 0 / 0  -> default NaN, `softfloat_flag_invalid'
|                                    raised
|   - infinity / finite           -> infinity (no flag raised here)
|   - finite nonzero / 0          -> infinity, `softfloat_flag_infinite'
|                                    raised
|   - finite / infinity           -> zero
|   - 0 / finite nonzero          -> zero
| The sign of an infinity or zero result is the XOR of the operand signs.
| Every other case is rounded and packed by softfloat_roundPackToF128.
*----------------------------------------------------------------------------*/
float128_t f128_div( float128_t a, float128_t b )
{
    union ui128_f128 uA;
    uint_fast64_t uiA64, uiA0;
    bool signA;
    int_fast32_t expA;
    struct uint128 sigA;
    union ui128_f128 uB;
    uint_fast64_t uiB64, uiB0;
    bool signB;
    int_fast32_t expB;
    struct uint128 sigB;
    bool signZ;
    struct exp32_sig128 normExpSig;
    int_fast32_t expZ;
    struct uint128 rem;
    uint_fast32_t recip32;
    int ix;
    uint_fast64_t q64;
    uint_fast32_t q;
    struct uint128 term;
    uint_fast32_t qs[3];
    uint_fast64_t sigZExtra;
    struct uint128 sigZ, uiZ;
    union ui128_f128 uZ;

    /*------------------------------------------------------------------------
    | Unpack both operands into sign, biased exponent and fraction.
    *------------------------------------------------------------------------*/
    uA.f = a;
    uiA64 = uA.ui.v64;
    uiA0  = uA.ui.v0;
    signA = signF128UI64( uiA64 );
    expA  = expF128UI64( uiA64 );
    sigA.v64 = fracF128UI64( uiA64 );
    sigA.v0  = uiA0;
    uB.f = b;
    uiB64 = uB.ui.v64;
    uiB0  = uB.ui.v0;
    signB = signF128UI64( uiB64 );
    expB  = expF128UI64( uiB64 );
    sigB.v64 = fracF128UI64( uiB64 );
    sigB.v0  = uiB0;
    signZ = signA ^ signB;
    /*------------------------------------------------------------------------
    | Exponent 0x7FFF: a nonzero fraction is a NaN, a zero fraction is an
    | infinity.
    *------------------------------------------------------------------------*/
    if ( expA == 0x7FFF ) {
        if ( sigA.v64 | sigA.v0 ) goto propagateNaN;
        if ( expB == 0x7FFF ) {
            if ( sigB.v64 | sigB.v0 ) goto propagateNaN;
            /* infinity / infinity */
            goto invalid;
        }
        goto infinity;
    }
    if ( expB == 0x7FFF ) {
        if ( sigB.v64 | sigB.v0 ) goto propagateNaN;
        /* finite / infinity */
        goto zero;
    }
    /*------------------------------------------------------------------------
    | Exponent 0: the operand is either zero or subnormal.  Subnormals are
    | normalized so the main path sees only normalized significands.
    *------------------------------------------------------------------------*/
    if ( ! expB ) {
        if ( ! (sigB.v64 | sigB.v0) ) {
            /* Divisor is zero: 0 / 0 is invalid, otherwise divide-by-zero. */
            if ( ! (expA | sigA.v64 | sigA.v0) ) goto invalid;
            softfloat_raiseFlags( softfloat_flag_infinite );
            goto infinity;
        }
        normExpSig = softfloat_normSubnormalF128Sig( sigB.v64, sigB.v0 );
        expB = normExpSig.exp;
        sigB = normExpSig.sig;
    }
    if ( ! expA ) {
        if ( ! (sigA.v64 | sigA.v0) ) goto zero;
        normExpSig = softfloat_normSubnormalF128Sig( sigA.v64, sigA.v0 );
        expA = normExpSig.exp;
        sigA = normExpSig.sig;
    }
    /*------------------------------------------------------------------------
    | Set the bit just above the 48-bit upper fraction field in both
    | significands (the implicit leading 1), then scale the dividend so that
    | the running remainder starts out no smaller than the divisor: if
    | sigA < sigB, the remainder starts at 2 * sigA and the result exponent
    | is decremented to compensate.
    *------------------------------------------------------------------------*/
    expZ = expA - expB + 0x3FFE;
    sigA.v64 |= UINT64_C( 0x0001000000000000 );
    sigB.v64 |= UINT64_C( 0x0001000000000000 );
    rem = sigA;
    if ( softfloat_lt128( sigA.v64, sigA.v0, sigB.v64, sigB.v0 ) ) {
        --expZ;
        rem = softfloat_add128( sigA.v64, sigA.v0, sigA.v64, sigA.v0 );
    }
    /*------------------------------------------------------------------------
    | Quotient digits are estimated by multiplying the top bits of the
    | remainder by a 32-bit approximate reciprocal of the divisor.  The first
    | three passes store their digit in qs[2], qs[1], qs[0] (in that order)
    | and update the remainder; the fourth pass only computes the estimate
    | `q' and leaves the loop before touching the remainder.
    *------------------------------------------------------------------------*/
    recip32 = softfloat_approxRecip32_1( sigB.v64>>17 );
    ix = 3;
    for (;;) {
        q64 = (uint_fast64_t) (uint32_t) (rem.v64>>19) * recip32;
        q = (q64 + 0x80000000)>>32;
        --ix;
        if ( ix < 0 ) break;
        rem = softfloat_shortShiftLeft128( rem.v64, rem.v0, 29 );
        term = softfloat_mul128By32( sigB.v64, sigB.v0, q );
        rem = softfloat_sub128( rem.v64, rem.v0, term.v64, term.v0 );
        if ( rem.v64 & UINT64_C( 0x8000000000000000 ) ) {
            /* Remainder went negative: the estimate was one too large. */
            --q;
            rem = softfloat_add128( rem.v64, rem.v0, sigB.v64, sigB.v0 );
        }
        qs[ix] = q;
    }
    /*------------------------------------------------------------------------
    | When the low three bits of the final estimate are 0b111 or 0b000, run
    | one more exact remainder step, correcting `q' by one in either
    | direction, and OR a sticky bit into `q' if the remainder is nonzero.
    | NOTE(review): presumably these are the estimates too close to a
    | rounding boundary to be trusted as-is -- confirm against the SoftFloat
    | design notes.
    *------------------------------------------------------------------------*/
    if ( ((q + 1) & 7) < 2 ) {
        rem = softfloat_shortShiftLeft128( rem.v64, rem.v0, 29 );
        term = softfloat_mul128By32( sigB.v64, sigB.v0, q );
        rem = softfloat_sub128( rem.v64, rem.v0, term.v64, term.v0 );
        if ( rem.v64 & UINT64_C( 0x8000000000000000 ) ) {
            --q;
            rem = softfloat_add128( rem.v64, rem.v0, sigB.v64, sigB.v0 );
        } else if ( softfloat_le128( sigB.v64, sigB.v0, rem.v64, rem.v0 ) ) {
            ++q;
            rem = softfloat_sub128( rem.v64, rem.v0, sigB.v64, sigB.v0 );
        }
        if ( rem.v64 | rem.v0 ) q |= 1;
    }
    /*------------------------------------------------------------------------
    | Assemble the result significand from the digits.  The low four bits of
    | `q' become the top bits of the 64-bit extra word; the rest of `q' is
    | added below qs[0] in the low word.  qs[1] straddles the two 64-bit
    | halves, so it is positioned with a 128-bit shift and added in.
    *------------------------------------------------------------------------*/
    sigZExtra = (uint64_t) ((uint_fast64_t) q<<60);
    term = softfloat_shortShiftLeft128( 0, qs[1], 54 );
    sigZ =
        softfloat_add128(
            (uint_fast64_t) qs[2]<<19, ((uint_fast64_t) qs[0]<<25) + (q>>4),
            term.v64, term.v0
        );
    return
        softfloat_roundPackToF128( signZ, expZ, sigZ.v64, sigZ.v0, sigZExtra );
    /*------------------------------------------------------------------------
    | At least one operand is a NaN.
    *------------------------------------------------------------------------*/
 propagateNaN:
    uiZ = softfloat_propagateNaNF128UI( uiA64, uiA0, uiB64, uiB0 );
    goto uiZ;
    /*------------------------------------------------------------------------
    | infinity / infinity or 0 / 0.
    *------------------------------------------------------------------------*/
 invalid:
    softfloat_raiseFlags( softfloat_flag_invalid );
    uiZ.v64 = defaultNaNF128UI64;
    uiZ.v0  = defaultNaNF128UI0;
    goto uiZ;
    /*------------------------------------------------------------------------
    | Signed infinity result.
    *------------------------------------------------------------------------*/
 infinity:
    uiZ.v64 = packToF128UI64( signZ, 0x7FFF, 0 );
    goto uiZ0;
    /*------------------------------------------------------------------------
    | Signed zero result; falls through to clear the low word and return.
    *------------------------------------------------------------------------*/
 zero:
    uiZ.v64 = packToF128UI64( signZ, 0, 0 );
 uiZ0:
    uiZ.v0 = 0;
 uiZ:
    uZ.ui = uiZ;
    return uZ.f;

}
2009403c583SJens Wiklander
201