xref: /optee_os/lib/libutils/isoc/arch/arm/softfloat/source/extF80M_sqrt.c (revision 1bb929836182ecb96d2d9d268daa807c67596396)
// SPDX-License-Identifier: BSD-3-Clause

/*============================================================================

This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic
Package, Release 3a, by John R. Hauser.

Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of
California.  All rights reserved.

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:

 1. Redistributions of source code must retain the above copyright notice,
    this list of conditions, and the following disclaimer.

 2. Redistributions in binary form must reproduce the above copyright notice,
    this list of conditions, and the following disclaimer in the documentation
    and/or other materials provided with the distribution.

 3. Neither the name of the University nor the names of its contributors may
    be used to endorse or promote products derived from this software without
    specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY
EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE
DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

=============================================================================*/

#include <stdbool.h>
#include <stdint.h>
#include "platform.h"
#include "internals.h"
#include "specialize.h"
#include "softfloat.h"

#ifdef SOFTFLOAT_FAST_INT64

/*----------------------------------------------------------------------------
| Stores at `zPtr' the result of `extF80_sqrt' applied to the extFloat80_t
| value at `aPtr'.  This definition is the one compiled when
| SOFTFLOAT_FAST_INT64 is defined; it only forwards to the by-value routine.
*----------------------------------------------------------------------------*/
void extF80M_sqrt( const extFloat80_t *aPtr, extFloat80_t *zPtr )
{

    *zPtr = extF80_sqrt( *aPtr );

}

#else

/*----------------------------------------------------------------------------
| Square root of the extFloat80_t value at `aPtr', stored at `zPtr'.  This is
| the definition compiled when SOFTFLOAT_FAST_INT64 is not defined; the
| intermediate remainder, term, and result significand are kept in arrays of
| 32-bit words (`rem', `term', `extSigZ').
|   Special cases, as coded below:
|     - exponent 0x7FFF with any of the low 63 significand bits set:  handed
|       to `softfloat_propagateNaNExtF80M';
|     - exponent 0x7FFF otherwise:  `softfloat_invalidExtF80M' if the sign bit
|       is set, else the input's sign/exponent word is copied and the
|       significand is set to 0x8000000000000000;
|     - significand equal to zero (exponent other than 0x7FFF):  the result
|       has only the input's sign bit in its sign/exponent word and a zero
|       significand;
|     - any remaining input with the sign bit set:
|       `softfloat_invalidExtF80M'.
*----------------------------------------------------------------------------*/
void extF80M_sqrt( const extFloat80_t *aPtr, extFloat80_t *zPtr )
{
    const struct extFloat80M *aSPtr;
    struct extFloat80M *zSPtr;
    uint_fast16_t uiA64, signUI64;
    int32_t expA;
    uint64_t rem64;
    int32_t expZ;
    uint32_t rem[4], sig32A, recipSqrt32, sig32Z, q;
    uint64_t sig64Z, x64;
    uint32_t term[4], extSigZ[3];

    /*------------------------------------------------------------------------
    | View the operand and the destination through `struct extFloat80M' so
    | that the `signExp' and `signif' members can be accessed.
    *------------------------------------------------------------------------*/
    aSPtr = (const struct extFloat80M *) aPtr;
    zSPtr = (struct extFloat80M *) zPtr;
    /*------------------------------------------------------------------------
    | Unpack the operand.  `signUI64' keeps only the bits selected by
    | `packToExtF80UI64( 1, 0 )' (presumably just the sign bit).  `rem64'
    | starts out as the operand's significand and is reused further down for
    | the running remainder.
    *------------------------------------------------------------------------*/
    uiA64 = aSPtr->signExp;
    signUI64 = uiA64 & packToExtF80UI64( 1, 0 );
    expA = expExtF80UI64( uiA64 );
    rem64 = aSPtr->signif;
    /*------------------------------------------------------------------------
    | Exponent 0x7FFF:  NaN if any bit below the top significand bit is set,
    | otherwise an infinity.  A negative infinity is invalid; a positive one
    | is returned with significand 0x8000000000000000.
    *------------------------------------------------------------------------*/
    if ( expA == 0x7FFF ) {
        if ( rem64 & UINT64_C( 0x7FFFFFFFFFFFFFFF ) ) {
            softfloat_propagateNaNExtF80M( aSPtr, 0, zSPtr );
            return;
        }
        if ( signUI64 ) goto invalid;
        rem64 = UINT64_C( 0x8000000000000000 );
        goto copyA;
    }
    /*------------------------------------------------------------------------
    | A zero exponent field is treated as exponent 1.  If the top significand
    | bit is clear, the operand is either zero (returned with its sign bit
    | only) or is normalized by `softfloat_normExtF80SigM', whose return value
    | is added to the exponent.  The sign test comes after the zero test, so a
    | negative zero is returned rather than reported as invalid.
    *------------------------------------------------------------------------*/
    if ( ! expA ) expA = 1;
    if ( ! (rem64 & UINT64_C( 0x8000000000000000 )) ) {
        if ( ! rem64 ) {
            uiA64 = signUI64;
            goto copyA;
        }
        expA += softfloat_normExtF80SigM( &rem64 );
    }
    if ( signUI64 ) goto invalid;
    /*------------------------------------------------------------------------
    | Result exponent:  half of the unbiased input exponent, rebiased by
    | 0x3FFF.  From here on `expA' holds only the low bit of the input
    | exponent.  The significand is shifted left by 30 or 29 bits (depending
    | on that bit) into the upper three words of `rem'.  A first 32-bit result
    | estimate `sig32Z' is formed from the top 32 significand bits and the
    | value returned by `softfloat_approxRecipSqrt32_1', and its square is
    | subtracted from the top 64 bits of `rem'.
    | NOTE(review): `(expA - 0x3FFF)>>1' right-shifts a possibly negative
    | signed value, which is implementation-defined in ISO C; the code
    | presumably relies on an arithmetic shift.
    *------------------------------------------------------------------------*/
    expZ = ((expA - 0x3FFF)>>1) + 0x3FFF;
    expA &= 1;
    softfloat_shortShiftLeft64To96M(
        rem64, 30 - expA, &rem[indexMultiwordHi( 4, 3 )] );
    sig32A = rem64>>32;
    recipSqrt32 = softfloat_approxRecipSqrt32_1( expA, sig32A );
    sig32Z = ((uint64_t) sig32A * recipSqrt32)>>32;
    if ( expA ) sig32Z >>= 1;
    rem64 =
        ((uint64_t) rem[indexWord( 4, 3 )]<<32 | rem[indexWord( 4, 2 )])
            - (uint64_t) sig32Z * sig32Z;
    rem[indexWord( 4, 3 )] = rem64>>32;
    rem[indexWord( 4, 2 )] = rem64;
    /*------------------------------------------------------------------------
    | Second step:  `q' is a correction derived from the current remainder and
    | the reciprocal-square-root estimate.  It is added, shifted left by 3,
    | below `sig32Z' to give `sig64Z', and the 96-bit remainder is updated by
    | `softfloat_remStep96MBy32' using `term' and `q'.
    *------------------------------------------------------------------------*/
    q = ((uint32_t) (rem64>>2) * (uint64_t) recipSqrt32)>>32;
    sig64Z = ((uint64_t) sig32Z<<32) + ((uint64_t) q<<3);
    x64 = ((uint64_t) sig32Z<<32) + sig64Z;
    term[indexWord( 3, 2 )] = 0;
    term[indexWord( 3, 1 )] = x64>>32;
    term[indexWord( 3, 0 )] = x64;
    softfloat_remStep96MBy32(
        &rem[indexMultiwordHi( 4, 3 )],
        29,
        term,
        q,
        &rem[indexMultiwordHi( 4, 3 )]
    );
    rem64 = (uint64_t) rem[indexWord( 4, 3 )]<<32 | rem[indexWord( 4, 2 )];
    /*------------------------------------------------------------------------
    | Third step:  a further correction `q' (with 2 added) is merged, shifted
    | left by 7, with `sig64Z<<1' to build the three-word significand
    | `extSigZ'.
    *------------------------------------------------------------------------*/
    q = (((uint32_t) (rem64>>2) * (uint64_t) recipSqrt32)>>32) + 2;
    x64 = (uint64_t) q<<7;
    extSigZ[indexWord( 3, 0 )] = x64;
    x64 = (sig64Z<<1) + (x64>>32);
    extSigZ[indexWord( 3, 2 )] = x64>>32;
    extSigZ[indexWord( 3, 1 )] = x64;
    /*------------------------------------------------------------------------
    | When the low 24 bits of `q' are at most 2 (presumably the case where the
    | estimate is too close to a rounding boundary to be trusted), the low 16
    | bits of `q' are cleared and a 128-bit remainder step is performed.  A
    | negative remainder (top bit of the high word set) makes
    | `softfloat_sub1X96M' adjust `extSigZ'; a nonzero remainder sets the
    | lowest bit of `extSigZ'.  `q' is reused to hold the high remainder word.
    *------------------------------------------------------------------------*/
    if ( (q & 0xFFFFFF) <= 2 ) {
        q &= ~(uint32_t) 0xFFFF;
        extSigZ[indexWordLo( 3 )] = q<<7;
        x64 = sig64Z + (q>>27);
        term[indexWord( 4, 3 )] = 0;
        term[indexWord( 4, 2 )] = x64>>32;
        term[indexWord( 4, 1 )] = x64;
        term[indexWord( 4, 0 )] = q<<5;
        rem[indexWord( 4, 0 )] = 0;
        softfloat_remStep128MBy32( rem, 28, term, q, rem );
        q = rem[indexWordHi( 4 )];
        if ( q & 0x80000000 ) {
            softfloat_sub1X96M( extSigZ );
        } else {
            if ( q || rem[indexWord( 4, 1 )] || rem[indexWord( 4, 2 )] ) {
                extSigZ[indexWordLo( 3 )] |= 1;
            }
        }
    }
    /*------------------------------------------------------------------------
    | Round and pack at the current `extF80_roundingPrecision'.  The leading
    | 0 argument is presumably the sign of the result.
    *------------------------------------------------------------------------*/
    softfloat_roundPackMToExtF80M(
        0, expZ, extSigZ, extF80_roundingPrecision, zSPtr );
    return;
    /*------------------------------------------------------------------------
    | Negative nonzero operand (including negative infinity).
    *------------------------------------------------------------------------*/
 invalid:
    softfloat_invalidExtF80M( zSPtr );
    return;
    /*------------------------------------------------------------------------
    | Results written directly:  zero and positive infinity.
    *------------------------------------------------------------------------*/
 copyA:
    zSPtr->signExp = uiA64;
    zSPtr->signif  = rem64;

}

#endif
