softfloat/bits32/softfloat.c

*2cec0187Schristos/* $NetBSD: softfloat.c,v 1.2 2012/03/21 14:17:54 christos Exp $ */
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21 * This version hacked for use with gcc -msoft-float by bjh21.
936b7f4cSbjh21 * (Mostly a case of #ifdefing out things GCC doesn't need or provides
936b7f4cSbjh21 *  itself).
936b7f4cSbjh21 */
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21 * Things you may want to define:
936b7f4cSbjh21 *
936b7f4cSbjh21 * SOFTFLOAT_FOR_GCC - build only those functions necessary for GCC (with
936b7f4cSbjh21 *   -msoft-float) to work.  Include "softfloat-for-gcc.h" to get them
936b7f4cSbjh21 *   properly renamed.
936b7f4cSbjh21 */
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21 * This differs from the standard bits32/softfloat.c in that float64
936b7f4cSbjh21 * is defined to be a 64-bit integer rather than a structure.  The
936b7f4cSbjh21 * structure is float64s, with translation between the two going via
936b7f4cSbjh21 * float64u.
936b7f4cSbjh21 */
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21===============================================================================
936b7f4cSbjh21
936b7f4cSbjh21This C source file is part of the SoftFloat IEC/IEEE Floating-Point
936b7f4cSbjh21Arithmetic Package, Release 2a.
936b7f4cSbjh21
936b7f4cSbjh21Written by John R. Hauser.  This work was made possible in part by the
936b7f4cSbjh21International Computer Science Institute, located at Suite 600, 1947 Center
936b7f4cSbjh21Street, Berkeley, California 94704.  Funding was partially provided by the
936b7f4cSbjh21National Science Foundation under grant MIP-9311980.  The original version
936b7f4cSbjh21of this code was written as part of a project to build a fixed-point vector
936b7f4cSbjh21processor in collaboration with the University of California at Berkeley,
936b7f4cSbjh21overseen by Profs. Nelson Morgan and John Wawrzynek.  More information
936b7f4cSbjh21is available through the Web page `http://HTTP.CS.Berkeley.EDU/~jhauser/
936b7f4cSbjh21arithmetic/SoftFloat.html'.
936b7f4cSbjh21
936b7f4cSbjh21THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE.  Although reasonable effort
936b7f4cSbjh21has been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT
936b7f4cSbjh21TIMES RESULT IN INCORRECT BEHAVIOR.  USE OF THIS SOFTWARE IS RESTRICTED TO
936b7f4cSbjh21PERSONS AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ANY
936b7f4cSbjh21AND ALL LOSSES, COSTS, OR OTHER PROBLEMS ARISING FROM ITS USE.
936b7f4cSbjh21
936b7f4cSbjh21Derivative works are acceptable, even for commercial purposes, so long as
936b7f4cSbjh21(1) they include prominent notice that the work is derivative, and (2) they
936b7f4cSbjh21include prominent notice akin to these four paragraphs for those parts of
936b7f4cSbjh21this code that are retained.
936b7f4cSbjh21
936b7f4cSbjh21===============================================================================
936b7f4cSbjh21*/
936b7f4cSbjh21
936b7f4cSbjh21#include <sys/cdefs.h>
936b7f4cSbjh21#if defined(LIBC_SCCS) && !defined(lint)
*2cec0187Schristos__RCSID("$NetBSD: softfloat.c,v 1.2 2012/03/21 14:17:54 christos Exp $");
936b7f4cSbjh21#endif /* LIBC_SCCS and not lint */
936b7f4cSbjh21
936b7f4cSbjh21#ifdef SOFTFLOAT_FOR_GCC
936b7f4cSbjh21#include "softfloat-for-gcc.h"
936b7f4cSbjh21#endif
936b7f4cSbjh21
936b7f4cSbjh21#include "milieu.h"
936b7f4cSbjh21#include "softfloat.h"
936b7f4cSbjh21
/*
 * Hooks that translate a float64 between the form it has in memory and
 * the form the routines in this file operate on.  Each hook defaults to
 * the identity unless it has already been defined before this point.
 */
#if !defined(FLOAT64_DEMANGLE)
#define FLOAT64_DEMANGLE(a)	(a)
#endif
#if !defined(FLOAT64_MANGLE)
#define FLOAT64_MANGLE(a)	(a)
#endif
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Floating-point rounding mode and exception flags.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21fp_rnd float_rounding_mode = float_round_nearest_even;
936b7f4cSbjh21fp_except float_exception_flags = 0;
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Primitive arithmetic functions, including multi-word arithmetic, and
936b7f4cSbjh21division and square root approximations.  (Can be specialized to target if
936b7f4cSbjh21desired.)
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21#include "softfloat-macros"
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Functions and definitions to determine:  (1) whether tininess for underflow
936b7f4cSbjh21is detected before or after rounding by default, (2) what (if anything)
936b7f4cSbjh21happens when exceptions are raised, (3) how signaling NaNs are distinguished
936b7f4cSbjh21from quiet NaNs, (4) the default generated quiet NaNs, and (5) how NaNs
936b7f4cSbjh21are propagated from function inputs to output.  These details are target-
936b7f4cSbjh21specific.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21#include "softfloat-specialize"
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the fraction bits of the single-precision floating-point value `a'.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21INLINE bits32 extractFloat32Frac( float32 a )
936b7f4cSbjh21{
936b7f4cSbjh21
936b7f4cSbjh21    return a & 0x007FFFFF;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the exponent bits of the single-precision floating-point value `a'.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21INLINE int16 extractFloat32Exp( float32 a )
936b7f4cSbjh21{
936b7f4cSbjh21
936b7f4cSbjh21    return ( a>>23 ) & 0xFF;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the sign bit of the single-precision floating-point value `a'.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21INLINE flag extractFloat32Sign( float32 a )
936b7f4cSbjh21{
936b7f4cSbjh21
936b7f4cSbjh21    return a>>31;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Normalizes the subnormal single-precision floating-point value represented
936b7f4cSbjh21by the denormalized significand `aSig'.  The normalized exponent and
936b7f4cSbjh21significand are stored at the locations pointed to by `zExpPtr' and
936b7f4cSbjh21`zSigPtr', respectively.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static void
936b7f4cSbjh21 normalizeFloat32Subnormal( bits32 aSig, int16 *zExpPtr, bits32 *zSigPtr )
936b7f4cSbjh21{
936b7f4cSbjh21    int8 shiftCount;
936b7f4cSbjh21
936b7f4cSbjh21    shiftCount = countLeadingZeros32( aSig ) - 8;
936b7f4cSbjh21    *zSigPtr = aSig<<shiftCount;
936b7f4cSbjh21    *zExpPtr = 1 - shiftCount;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Packs the sign `zSign', exponent `zExp', and significand `zSig' into a
936b7f4cSbjh21single-precision floating-point value, returning the result.  After being
936b7f4cSbjh21shifted into the proper positions, the three fields are simply added
936b7f4cSbjh21together to form the result.  This means that any integer portion of `zSig'
936b7f4cSbjh21will be added into the exponent.  Since a properly normalized significand
936b7f4cSbjh21will have an integer portion equal to 1, the `zExp' input should be 1 less
936b7f4cSbjh21than the desired result exponent whenever `zSig' is a complete, normalized
936b7f4cSbjh21significand.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21INLINE float32 packFloat32( flag zSign, int16 zExp, bits32 zSig )
936b7f4cSbjh21{
936b7f4cSbjh21
936b7f4cSbjh21    return ( ( (bits32) zSign )<<31 ) + ( ( (bits32) zExp )<<23 ) + zSig;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Takes an abstract floating-point value having sign `zSign', exponent `zExp',
936b7f4cSbjh21and significand `zSig', and returns the proper single-precision floating-
936b7f4cSbjh21point value corresponding to the abstract input.  Ordinarily, the abstract
936b7f4cSbjh21value is simply rounded and packed into the single-precision format, with
936b7f4cSbjh21the inexact exception raised if the abstract input cannot be represented
936b7f4cSbjh21exactly.  However, if the abstract value is too large, the overflow and
936b7f4cSbjh21inexact exceptions are raised and an infinity or maximal finite value is
936b7f4cSbjh21returned.  If the abstract value is too small, the input value is rounded to
936b7f4cSbjh21a subnormal number, and the underflow and inexact exceptions are raised if
936b7f4cSbjh21the abstract input cannot be represented exactly as a subnormal single-
936b7f4cSbjh21precision floating-point number.
936b7f4cSbjh21    The input significand `zSig' has its binary point between bits 30
936b7f4cSbjh21and 29, which is 7 bits to the left of the usual location.  This shifted
936b7f4cSbjh21significand must be normalized or smaller.  If `zSig' is not normalized,
936b7f4cSbjh21`zExp' must be 0; in that case, the result returned is a subnormal number,
936b7f4cSbjh21and it must not require rounding.  In the usual case that `zSig' is
936b7f4cSbjh21normalized, `zExp' must be 1 less than the ``true'' floating-point exponent.
936b7f4cSbjh21The handling of underflow and overflow follows the IEC/IEEE Standard for
936b7f4cSbjh21Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static float32 roundAndPackFloat32( flag zSign, int16 zExp, bits32 zSig )
936b7f4cSbjh21{
936b7f4cSbjh21    int8 roundingMode;
936b7f4cSbjh21    flag roundNearestEven;
936b7f4cSbjh21    int8 roundIncrement, roundBits;
936b7f4cSbjh21    flag isTiny;
936b7f4cSbjh21
936b7f4cSbjh21    roundingMode = float_rounding_mode;
936b7f4cSbjh21    roundNearestEven = roundingMode == float_round_nearest_even;
936b7f4cSbjh21    roundIncrement = 0x40;
936b7f4cSbjh21    if ( ! roundNearestEven ) {
936b7f4cSbjh21        if ( roundingMode == float_round_to_zero ) {
936b7f4cSbjh21            roundIncrement = 0;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            roundIncrement = 0x7F;
936b7f4cSbjh21            if ( zSign ) {
936b7f4cSbjh21                if ( roundingMode == float_round_up ) roundIncrement = 0;
936b7f4cSbjh21            }
936b7f4cSbjh21            else {
936b7f4cSbjh21                if ( roundingMode == float_round_down ) roundIncrement = 0;
936b7f4cSbjh21            }
936b7f4cSbjh21        }
936b7f4cSbjh21    }
936b7f4cSbjh21    roundBits = zSig & 0x7F;
936b7f4cSbjh21    if ( 0xFD <= (bits16) zExp ) {
936b7f4cSbjh21        if (    ( 0xFD < zExp )
936b7f4cSbjh21             || (    ( zExp == 0xFD )
936b7f4cSbjh21                  && ( (sbits32) ( zSig + roundIncrement ) < 0 ) )
936b7f4cSbjh21           ) {
936b7f4cSbjh21            float_raise( float_flag_overflow | float_flag_inexact );
936b7f4cSbjh21            return packFloat32( zSign, 0xFF, 0 ) - ( roundIncrement == 0 );
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( zExp < 0 ) {
936b7f4cSbjh21            isTiny =
936b7f4cSbjh21                   ( float_detect_tininess == float_tininess_before_rounding )
936b7f4cSbjh21                || ( zExp < -1 )
*2cec0187Schristos                || ( zSig + roundIncrement < (uint32)0x80000000 );
936b7f4cSbjh21            shift32RightJamming( zSig, - zExp, &zSig );
936b7f4cSbjh21            zExp = 0;
936b7f4cSbjh21            roundBits = zSig & 0x7F;
936b7f4cSbjh21            if ( isTiny && roundBits ) float_raise( float_flag_underflow );
936b7f4cSbjh21        }
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( roundBits ) float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21    zSig = ( zSig + roundIncrement )>>7;
936b7f4cSbjh21    zSig &= ~ ( ( ( roundBits ^ 0x40 ) == 0 ) & roundNearestEven );
936b7f4cSbjh21    if ( zSig == 0 ) zExp = 0;
936b7f4cSbjh21    return packFloat32( zSign, zExp, zSig );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Takes an abstract floating-point value having sign `zSign', exponent `zExp',
936b7f4cSbjh21and significand `zSig', and returns the proper single-precision floating-
936b7f4cSbjh21point value corresponding to the abstract input.  This routine is just like
936b7f4cSbjh21`roundAndPackFloat32' except that `zSig' does not have to be normalized.
936b7f4cSbjh21Bit 31 of `zSig' must be zero, and `zExp' must be 1 less than the ``true''
936b7f4cSbjh21floating-point exponent.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static float32
936b7f4cSbjh21 normalizeRoundAndPackFloat32( flag zSign, int16 zExp, bits32 zSig )
936b7f4cSbjh21{
936b7f4cSbjh21    int8 shiftCount;
936b7f4cSbjh21
936b7f4cSbjh21    shiftCount = countLeadingZeros32( zSig ) - 1;
936b7f4cSbjh21    return roundAndPackFloat32( zSign, zExp - shiftCount, zSig<<shiftCount );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the least-significant 32 fraction bits of the double-precision
936b7f4cSbjh21floating-point value `a'.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21INLINE bits32 extractFloat64Frac1( float64 a )
936b7f4cSbjh21{
936b7f4cSbjh21
*2cec0187Schristos    return (bits32)(FLOAT64_DEMANGLE(a) & LIT64(0x00000000FFFFFFFF));
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the most-significant 20 fraction bits of the double-precision
936b7f4cSbjh21floating-point value `a'.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21INLINE bits32 extractFloat64Frac0( float64 a )
936b7f4cSbjh21{
936b7f4cSbjh21
*2cec0187Schristos    return (bits32)((FLOAT64_DEMANGLE(a) >> 32) & 0x000FFFFF);
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the exponent bits of the double-precision floating-point value `a'.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21INLINE int16 extractFloat64Exp( float64 a )
936b7f4cSbjh21{
936b7f4cSbjh21
*2cec0187Schristos    return (int16)((FLOAT64_DEMANGLE(a) >> 52) & 0x7FF);
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the sign bit of the double-precision floating-point value `a'.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21INLINE flag extractFloat64Sign( float64 a )
936b7f4cSbjh21{
936b7f4cSbjh21
*2cec0187Schristos    return (flag)(FLOAT64_DEMANGLE(a) >> 63);
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Normalizes the subnormal double-precision floating-point value represented
936b7f4cSbjh21by the denormalized significand formed by the concatenation of `aSig0' and
936b7f4cSbjh21`aSig1'.  The normalized exponent is stored at the location pointed to by
936b7f4cSbjh21`zExpPtr'.  The most significant 21 bits of the normalized significand are
936b7f4cSbjh21stored at the location pointed to by `zSig0Ptr', and the least significant
936b7f4cSbjh2132 bits of the normalized significand are stored at the location pointed to
936b7f4cSbjh21by `zSig1Ptr'.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static void
936b7f4cSbjh21 normalizeFloat64Subnormal(
936b7f4cSbjh21     bits32 aSig0,
936b7f4cSbjh21     bits32 aSig1,
936b7f4cSbjh21     int16 *zExpPtr,
936b7f4cSbjh21     bits32 *zSig0Ptr,
936b7f4cSbjh21     bits32 *zSig1Ptr
936b7f4cSbjh21 )
936b7f4cSbjh21{
936b7f4cSbjh21    int8 shiftCount;
936b7f4cSbjh21
936b7f4cSbjh21    if ( aSig0 == 0 ) {
936b7f4cSbjh21        shiftCount = countLeadingZeros32( aSig1 ) - 11;
936b7f4cSbjh21        if ( shiftCount < 0 ) {
936b7f4cSbjh21            *zSig0Ptr = aSig1>>( - shiftCount );
936b7f4cSbjh21            *zSig1Ptr = aSig1<<( shiftCount & 31 );
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            *zSig0Ptr = aSig1<<shiftCount;
936b7f4cSbjh21            *zSig1Ptr = 0;
936b7f4cSbjh21        }
936b7f4cSbjh21        *zExpPtr = - shiftCount - 31;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        shiftCount = countLeadingZeros32( aSig0 ) - 11;
936b7f4cSbjh21        shortShift64Left( aSig0, aSig1, shiftCount, zSig0Ptr, zSig1Ptr );
936b7f4cSbjh21        *zExpPtr = 1 - shiftCount;
936b7f4cSbjh21    }
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Packs the sign `zSign', the exponent `zExp', and the significand formed by
936b7f4cSbjh21the concatenation of `zSig0' and `zSig1' into a double-precision floating-
936b7f4cSbjh21point value, returning the result.  After being shifted into the proper
936b7f4cSbjh21positions, the three fields `zSign', `zExp', and `zSig0' are simply added
936b7f4cSbjh21together to form the most significant 32 bits of the result.  This means
936b7f4cSbjh21that any integer portion of `zSig0' will be added into the exponent.  Since
936b7f4cSbjh21a properly normalized significand will have an integer portion equal to 1,
936b7f4cSbjh21the `zExp' input should be 1 less than the desired result exponent whenever
936b7f4cSbjh21`zSig0' and `zSig1' concatenated form a complete, normalized significand.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21INLINE float64
936b7f4cSbjh21 packFloat64( flag zSign, int16 zExp, bits32 zSig0, bits32 zSig1 )
936b7f4cSbjh21{
936b7f4cSbjh21
936b7f4cSbjh21    return FLOAT64_MANGLE( ( ( (bits64) zSign )<<63 ) +
936b7f4cSbjh21			   ( ( (bits64) zExp )<<52 ) +
936b7f4cSbjh21			   ( ( (bits64) zSig0 )<<32 ) + zSig1 );
936b7f4cSbjh21
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Takes an abstract floating-point value having sign `zSign', exponent `zExp',
936b7f4cSbjh21and extended significand formed by the concatenation of `zSig0', `zSig1',
936b7f4cSbjh21and `zSig2', and returns the proper double-precision floating-point value
936b7f4cSbjh21corresponding to the abstract input.  Ordinarily, the abstract value is
936b7f4cSbjh21simply rounded and packed into the double-precision format, with the inexact
936b7f4cSbjh21exception raised if the abstract input cannot be represented exactly.
936b7f4cSbjh21However, if the abstract value is too large, the overflow and inexact
936b7f4cSbjh21exceptions are raised and an infinity or maximal finite value is returned.
936b7f4cSbjh21If the abstract value is too small, the input value is rounded to a
936b7f4cSbjh21subnormal number, and the underflow and inexact exceptions are raised if the
936b7f4cSbjh21abstract input cannot be represented exactly as a subnormal double-precision
936b7f4cSbjh21floating-point number.
936b7f4cSbjh21    The input significand must be normalized or smaller.  If the input
936b7f4cSbjh21significand is not normalized, `zExp' must be 0; in that case, the result
936b7f4cSbjh21returned is a subnormal number, and it must not require rounding.  In the
936b7f4cSbjh21usual case that the input significand is normalized, `zExp' must be 1 less
936b7f4cSbjh21than the ``true'' floating-point exponent.  The handling of underflow and
936b7f4cSbjh21overflow follows the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static float64
936b7f4cSbjh21 roundAndPackFloat64(
936b7f4cSbjh21     flag zSign, int16 zExp, bits32 zSig0, bits32 zSig1, bits32 zSig2 )
936b7f4cSbjh21{
936b7f4cSbjh21    int8 roundingMode;
936b7f4cSbjh21    flag roundNearestEven, increment, isTiny;
936b7f4cSbjh21
936b7f4cSbjh21    roundingMode = float_rounding_mode;
936b7f4cSbjh21    roundNearestEven = ( roundingMode == float_round_nearest_even );
936b7f4cSbjh21    increment = ( (sbits32) zSig2 < 0 );
936b7f4cSbjh21    if ( ! roundNearestEven ) {
936b7f4cSbjh21        if ( roundingMode == float_round_to_zero ) {
936b7f4cSbjh21            increment = 0;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            if ( zSign ) {
936b7f4cSbjh21                increment = ( roundingMode == float_round_down ) && zSig2;
936b7f4cSbjh21            }
936b7f4cSbjh21            else {
936b7f4cSbjh21                increment = ( roundingMode == float_round_up ) && zSig2;
936b7f4cSbjh21            }
936b7f4cSbjh21        }
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( 0x7FD <= (bits16) zExp ) {
936b7f4cSbjh21        if (    ( 0x7FD < zExp )
936b7f4cSbjh21             || (    ( zExp == 0x7FD )
936b7f4cSbjh21                  && eq64( 0x001FFFFF, 0xFFFFFFFF, zSig0, zSig1 )
936b7f4cSbjh21                  && increment
936b7f4cSbjh21                )
936b7f4cSbjh21           ) {
936b7f4cSbjh21            float_raise( float_flag_overflow | float_flag_inexact );
936b7f4cSbjh21            if (    ( roundingMode == float_round_to_zero )
936b7f4cSbjh21                 || ( zSign && ( roundingMode == float_round_up ) )
936b7f4cSbjh21                 || ( ! zSign && ( roundingMode == float_round_down ) )
936b7f4cSbjh21               ) {
936b7f4cSbjh21                return packFloat64( zSign, 0x7FE, 0x000FFFFF, 0xFFFFFFFF );
936b7f4cSbjh21            }
936b7f4cSbjh21            return packFloat64( zSign, 0x7FF, 0, 0 );
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( zExp < 0 ) {
936b7f4cSbjh21            isTiny =
936b7f4cSbjh21                   ( float_detect_tininess == float_tininess_before_rounding )
936b7f4cSbjh21                || ( zExp < -1 )
936b7f4cSbjh21                || ! increment
936b7f4cSbjh21                || lt64( zSig0, zSig1, 0x001FFFFF, 0xFFFFFFFF );
936b7f4cSbjh21            shift64ExtraRightJamming(
936b7f4cSbjh21                zSig0, zSig1, zSig2, - zExp, &zSig0, &zSig1, &zSig2 );
936b7f4cSbjh21            zExp = 0;
936b7f4cSbjh21            if ( isTiny && zSig2 ) float_raise( float_flag_underflow );
936b7f4cSbjh21            if ( roundNearestEven ) {
936b7f4cSbjh21                increment = ( (sbits32) zSig2 < 0 );
936b7f4cSbjh21            }
936b7f4cSbjh21            else {
936b7f4cSbjh21                if ( zSign ) {
936b7f4cSbjh21                    increment = ( roundingMode == float_round_down ) && zSig2;
936b7f4cSbjh21                }
936b7f4cSbjh21                else {
936b7f4cSbjh21                    increment = ( roundingMode == float_round_up ) && zSig2;
936b7f4cSbjh21                }
936b7f4cSbjh21            }
936b7f4cSbjh21        }
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( zSig2 ) float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21    if ( increment ) {
936b7f4cSbjh21        add64( zSig0, zSig1, 0, 1, &zSig0, &zSig1 );
936b7f4cSbjh21        zSig1 &= ~ ( ( zSig2 + zSig2 == 0 ) & roundNearestEven );
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        if ( ( zSig0 | zSig1 ) == 0 ) zExp = 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    return packFloat64( zSign, zExp, zSig0, zSig1 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Takes an abstract floating-point value having sign `zSign', exponent `zExp',
936b7f4cSbjh21and significand formed by the concatenation of `zSig0' and `zSig1', and
936b7f4cSbjh21returns the proper double-precision floating-point value corresponding
936b7f4cSbjh21to the abstract input.  This routine is just like `roundAndPackFloat64'
936b7f4cSbjh21except that the input significand has fewer bits and does not have to be
936b7f4cSbjh21normalized.  In all cases, `zExp' must be 1 less than the ``true'' floating-
936b7f4cSbjh21point exponent.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static float64
936b7f4cSbjh21 normalizeRoundAndPackFloat64(
936b7f4cSbjh21     flag zSign, int16 zExp, bits32 zSig0, bits32 zSig1 )
936b7f4cSbjh21{
936b7f4cSbjh21    int8 shiftCount;
936b7f4cSbjh21    bits32 zSig2;
936b7f4cSbjh21
936b7f4cSbjh21    if ( zSig0 == 0 ) {
936b7f4cSbjh21        zSig0 = zSig1;
936b7f4cSbjh21        zSig1 = 0;
936b7f4cSbjh21        zExp -= 32;
936b7f4cSbjh21    }
936b7f4cSbjh21    shiftCount = countLeadingZeros32( zSig0 ) - 11;
936b7f4cSbjh21    if ( 0 <= shiftCount ) {
936b7f4cSbjh21        zSig2 = 0;
936b7f4cSbjh21        shortShift64Left( zSig0, zSig1, shiftCount, &zSig0, &zSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        shift64ExtraRightJamming(
936b7f4cSbjh21            zSig0, zSig1, 0, - shiftCount, &zSig0, &zSig1, &zSig2 );
936b7f4cSbjh21    }
936b7f4cSbjh21    zExp -= shiftCount;
936b7f4cSbjh21    return roundAndPackFloat64( zSign, zExp, zSig0, zSig1, zSig2 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of converting the 32-bit two's complement integer `a' to
936b7f4cSbjh21the single-precision floating-point format.  The conversion is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float32 int32_to_float32( int32 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag zSign;
936b7f4cSbjh21
936b7f4cSbjh21    if ( a == 0 ) return 0;
936b7f4cSbjh21    if ( a == (sbits32) 0x80000000 ) return packFloat32( 1, 0x9E, 0 );
936b7f4cSbjh21    zSign = ( a < 0 );
*2cec0187Schristos    return normalizeRoundAndPackFloat32(zSign, 0x9C, (uint32)(zSign ? - a : a));
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of converting the 32-bit two's complement integer `a' to
936b7f4cSbjh21the double-precision floating-point format.  The conversion is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float64 int32_to_float64( int32 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag zSign;
936b7f4cSbjh21    bits32 absA;
936b7f4cSbjh21    int8 shiftCount;
936b7f4cSbjh21    bits32 zSig0, zSig1;
936b7f4cSbjh21
936b7f4cSbjh21    if ( a == 0 ) return packFloat64( 0, 0, 0, 0 );
936b7f4cSbjh21    zSign = ( a < 0 );
936b7f4cSbjh21    absA = zSign ? - a : a;
936b7f4cSbjh21    shiftCount = countLeadingZeros32( absA ) - 11;
936b7f4cSbjh21    if ( 0 <= shiftCount ) {
936b7f4cSbjh21        zSig0 = absA<<shiftCount;
936b7f4cSbjh21        zSig1 = 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        shift64Right( absA, 0, - shiftCount, &zSig0, &zSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    return packFloat64( zSign, 0x412 - shiftCount, zSig0, zSig1 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of converting the single-precision floating-point value
936b7f4cSbjh21`a' to the 32-bit two's complement integer format.  The conversion is
936b7f4cSbjh21performed according to the IEC/IEEE Standard for Binary Floating-Point
936b7f4cSbjh21Arithmetic---which means in particular that the conversion is rounded
936b7f4cSbjh21according to the current rounding mode.  If `a' is a NaN, the largest
936b7f4cSbjh21positive integer is returned.  Otherwise, if the conversion overflows, the
936b7f4cSbjh21largest integer with the same sign as `a' is returned.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21int32 float32_to_int32( float32 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp, shiftCount;
936b7f4cSbjh21    bits32 aSig, aSigExtra;
936b7f4cSbjh21    int32 z;
936b7f4cSbjh21    int8 roundingMode;
936b7f4cSbjh21
936b7f4cSbjh21    aSig = extractFloat32Frac( a );
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    shiftCount = aExp - 0x96;
936b7f4cSbjh21    if ( 0 <= shiftCount ) {
936b7f4cSbjh21        if ( 0x9E <= aExp ) {
936b7f4cSbjh21            if ( a != 0xCF000000 ) {
936b7f4cSbjh21                float_raise( float_flag_invalid );
936b7f4cSbjh21                if ( ! aSign || ( ( aExp == 0xFF ) && aSig ) ) {
936b7f4cSbjh21                    return 0x7FFFFFFF;
936b7f4cSbjh21                }
936b7f4cSbjh21            }
936b7f4cSbjh21            return (sbits32) 0x80000000;
936b7f4cSbjh21        }
936b7f4cSbjh21        z = ( aSig | 0x00800000 )<<shiftCount;
936b7f4cSbjh21        if ( aSign ) z = - z;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        if ( aExp < 0x7E ) {
936b7f4cSbjh21            aSigExtra = aExp | aSig;
936b7f4cSbjh21            z = 0;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            aSig |= 0x00800000;
936b7f4cSbjh21            aSigExtra = aSig<<( shiftCount & 31 );
936b7f4cSbjh21            z = aSig>>( - shiftCount );
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( aSigExtra ) float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21        roundingMode = float_rounding_mode;
936b7f4cSbjh21        if ( roundingMode == float_round_nearest_even ) {
936b7f4cSbjh21            if ( (sbits32) aSigExtra < 0 ) {
936b7f4cSbjh21                ++z;
936b7f4cSbjh21                if ( (bits32) ( aSigExtra<<1 ) == 0 ) z &= ~1;
936b7f4cSbjh21            }
936b7f4cSbjh21            if ( aSign ) z = - z;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            aSigExtra = ( aSigExtra != 0 );
936b7f4cSbjh21            if ( aSign ) {
936b7f4cSbjh21                z += ( roundingMode == float_round_down ) & aSigExtra;
936b7f4cSbjh21                z = - z;
936b7f4cSbjh21            }
936b7f4cSbjh21            else {
936b7f4cSbjh21                z += ( roundingMode == float_round_up ) & aSigExtra;
936b7f4cSbjh21            }
936b7f4cSbjh21        }
936b7f4cSbjh21    }
936b7f4cSbjh21    return z;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21#endif
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of converting the single-precision floating-point value
936b7f4cSbjh21`a' to the 32-bit two's complement integer format.  The conversion is
936b7f4cSbjh21performed according to the IEC/IEEE Standard for Binary Floating-Point
936b7f4cSbjh21Arithmetic, except that the conversion is always rounded toward zero.
936b7f4cSbjh21If `a' is a NaN, the largest positive integer is returned.  Otherwise, if
936b7f4cSbjh21the conversion overflows, the largest integer with the same sign as `a' is
936b7f4cSbjh21returned.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21int32 float32_to_int32_round_to_zero( float32 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp, shiftCount;
936b7f4cSbjh21    bits32 aSig;
936b7f4cSbjh21    int32 z;
936b7f4cSbjh21
936b7f4cSbjh21    aSig = extractFloat32Frac( a );
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    shiftCount = aExp - 0x9E;
936b7f4cSbjh21    if ( 0 <= shiftCount ) {
936b7f4cSbjh21        if ( a != 0xCF000000 ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21            if ( ! aSign || ( ( aExp == 0xFF ) && aSig ) ) return 0x7FFFFFFF;
936b7f4cSbjh21        }
936b7f4cSbjh21        return (sbits32) 0x80000000;
936b7f4cSbjh21    }
936b7f4cSbjh21    else if ( aExp <= 0x7E ) {
936b7f4cSbjh21        if ( aExp | aSig ) float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSig = ( aSig | 0x00800000 )<<8;
936b7f4cSbjh21    z = aSig>>( - shiftCount );
936b7f4cSbjh21    if ( (bits32) ( aSig<<( shiftCount & 31 ) ) ) {
936b7f4cSbjh21        float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aSign ) z = - z;
936b7f4cSbjh21    return z;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of converting the single-precision floating-point value
936b7f4cSbjh21`a' to the double-precision floating-point format.  The conversion is
936b7f4cSbjh21performed according to the IEC/IEEE Standard for Binary Floating-Point
936b7f4cSbjh21Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float64 float32_to_float64( float32 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp;
936b7f4cSbjh21    bits32 aSig, zSig0, zSig1;
936b7f4cSbjh21
936b7f4cSbjh21    aSig = extractFloat32Frac( a );
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    if ( aExp == 0xFF ) {
936b7f4cSbjh21        if ( aSig ) return commonNaNToFloat64( float32ToCommonNaN( a ) );
936b7f4cSbjh21        return packFloat64( aSign, 0x7FF, 0, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        if ( aSig == 0 ) return packFloat64( aSign, 0, 0, 0 );
936b7f4cSbjh21        normalizeFloat32Subnormal( aSig, &aExp, &aSig );
936b7f4cSbjh21        --aExp;
936b7f4cSbjh21    }
936b7f4cSbjh21    shift64Right( aSig, 0, 3, &zSig0, &zSig1 );
936b7f4cSbjh21    return packFloat64( aSign, aExp + 0x380, zSig0, zSig1 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Rounds the single-precision floating-point value `a' to an integer,
936b7f4cSbjh21and returns the result as a single-precision floating-point value.  The
936b7f4cSbjh21operation is performed according to the IEC/IEEE Standard for Binary
936b7f4cSbjh21Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float32 float32_round_to_int( float32 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp;
936b7f4cSbjh21    bits32 lastBitMask, roundBitsMask;
936b7f4cSbjh21    int8 roundingMode;
936b7f4cSbjh21    float32 z;
936b7f4cSbjh21
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    if ( 0x96 <= aExp ) {
936b7f4cSbjh21        if ( ( aExp == 0xFF ) && extractFloat32Frac( a ) ) {
936b7f4cSbjh21            return propagateFloat32NaN( a, a );
936b7f4cSbjh21        }
936b7f4cSbjh21        return a;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp <= 0x7E ) {
936b7f4cSbjh21        if ( (bits32) ( a<<1 ) == 0 ) return a;
936b7f4cSbjh21        float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21        aSign = extractFloat32Sign( a );
936b7f4cSbjh21        switch ( float_rounding_mode ) {
936b7f4cSbjh21         case float_round_nearest_even:
936b7f4cSbjh21            if ( ( aExp == 0x7E ) && extractFloat32Frac( a ) ) {
936b7f4cSbjh21                return packFloat32( aSign, 0x7F, 0 );
936b7f4cSbjh21            }
936b7f4cSbjh21            break;
936b7f4cSbjh21	 case float_round_to_zero:
936b7f4cSbjh21	    break;
936b7f4cSbjh21         case float_round_down:
936b7f4cSbjh21            return aSign ? 0xBF800000 : 0;
936b7f4cSbjh21         case float_round_up:
936b7f4cSbjh21            return aSign ? 0x80000000 : 0x3F800000;
936b7f4cSbjh21        }
936b7f4cSbjh21        return packFloat32( aSign, 0, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    lastBitMask = 1;
936b7f4cSbjh21    lastBitMask <<= 0x96 - aExp;
936b7f4cSbjh21    roundBitsMask = lastBitMask - 1;
936b7f4cSbjh21    z = a;
936b7f4cSbjh21    roundingMode = float_rounding_mode;
936b7f4cSbjh21    if ( roundingMode == float_round_nearest_even ) {
936b7f4cSbjh21        z += lastBitMask>>1;
936b7f4cSbjh21        if ( ( z & roundBitsMask ) == 0 ) z &= ~ lastBitMask;
936b7f4cSbjh21    }
936b7f4cSbjh21    else if ( roundingMode != float_round_to_zero ) {
936b7f4cSbjh21        if ( extractFloat32Sign( z ) ^ ( roundingMode == float_round_up ) ) {
936b7f4cSbjh21            z += roundBitsMask;
936b7f4cSbjh21        }
936b7f4cSbjh21    }
936b7f4cSbjh21    z &= ~ roundBitsMask;
936b7f4cSbjh21    if ( z != a ) float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21    return z;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21#endif
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of adding the absolute values of the single-precision
936b7f4cSbjh21floating-point values `a' and `b'.  If `zSign' is 1, the sum is negated
936b7f4cSbjh21before being returned.  `zSign' is ignored if the result is a NaN.
936b7f4cSbjh21The addition is performed according to the IEC/IEEE Standard for Binary
936b7f4cSbjh21Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static float32 addFloat32Sigs( float32 a, float32 b, flag zSign )
936b7f4cSbjh21{
936b7f4cSbjh21    int16 aExp, bExp, zExp;
936b7f4cSbjh21    bits32 aSig, bSig, zSig;
936b7f4cSbjh21    int16 expDiff;
936b7f4cSbjh21
936b7f4cSbjh21    aSig = extractFloat32Frac( a );
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    bSig = extractFloat32Frac( b );
936b7f4cSbjh21    bExp = extractFloat32Exp( b );
936b7f4cSbjh21    expDiff = aExp - bExp;
936b7f4cSbjh21    aSig <<= 6;
936b7f4cSbjh21    bSig <<= 6;
936b7f4cSbjh21    if ( 0 < expDiff ) {
936b7f4cSbjh21        if ( aExp == 0xFF ) {
936b7f4cSbjh21            if ( aSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21            return a;
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( bExp == 0 ) {
936b7f4cSbjh21            --expDiff;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            bSig |= 0x20000000;
936b7f4cSbjh21        }
936b7f4cSbjh21        shift32RightJamming( bSig, expDiff, &bSig );
936b7f4cSbjh21        zExp = aExp;
936b7f4cSbjh21    }
936b7f4cSbjh21    else if ( expDiff < 0 ) {
936b7f4cSbjh21        if ( bExp == 0xFF ) {
936b7f4cSbjh21            if ( bSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21            return packFloat32( zSign, 0xFF, 0 );
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( aExp == 0 ) {
936b7f4cSbjh21            ++expDiff;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            aSig |= 0x20000000;
936b7f4cSbjh21        }
936b7f4cSbjh21        shift32RightJamming( aSig, - expDiff, &aSig );
936b7f4cSbjh21        zExp = bExp;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        if ( aExp == 0xFF ) {
936b7f4cSbjh21            if ( aSig | bSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21            return a;
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( aExp == 0 ) return packFloat32( zSign, 0, ( aSig + bSig )>>6 );
936b7f4cSbjh21        zSig = 0x40000000 + aSig + bSig;
936b7f4cSbjh21        zExp = aExp;
936b7f4cSbjh21        goto roundAndPack;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSig |= 0x20000000;
936b7f4cSbjh21    zSig = ( aSig + bSig )<<1;
936b7f4cSbjh21    --zExp;
936b7f4cSbjh21    if ( (sbits32) zSig < 0 ) {
936b7f4cSbjh21        zSig = aSig + bSig;
936b7f4cSbjh21        ++zExp;
936b7f4cSbjh21    }
936b7f4cSbjh21 roundAndPack:
936b7f4cSbjh21    return roundAndPackFloat32( zSign, zExp, zSig );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of subtracting the absolute values of the single-
936b7f4cSbjh21precision floating-point values `a' and `b'.  If `zSign' is 1, the
936b7f4cSbjh21difference is negated before being returned.  `zSign' is ignored if the
936b7f4cSbjh21result is a NaN.  The subtraction is performed according to the IEC/IEEE
936b7f4cSbjh21Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static float32 subFloat32Sigs( float32 a, float32 b, flag zSign )
936b7f4cSbjh21{
936b7f4cSbjh21    int16 aExp, bExp, zExp;
936b7f4cSbjh21    bits32 aSig, bSig, zSig;
936b7f4cSbjh21    int16 expDiff;
936b7f4cSbjh21
936b7f4cSbjh21    aSig = extractFloat32Frac( a );
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    bSig = extractFloat32Frac( b );
936b7f4cSbjh21    bExp = extractFloat32Exp( b );
936b7f4cSbjh21    expDiff = aExp - bExp;
936b7f4cSbjh21    aSig <<= 7;
936b7f4cSbjh21    bSig <<= 7;
936b7f4cSbjh21    if ( 0 < expDiff ) goto aExpBigger;
936b7f4cSbjh21    if ( expDiff < 0 ) goto bExpBigger;
936b7f4cSbjh21    if ( aExp == 0xFF ) {
936b7f4cSbjh21        if ( aSig | bSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return float32_default_nan;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        aExp = 1;
936b7f4cSbjh21        bExp = 1;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bSig < aSig ) goto aBigger;
936b7f4cSbjh21    if ( aSig < bSig ) goto bBigger;
936b7f4cSbjh21    return packFloat32( float_rounding_mode == float_round_down, 0, 0 );
936b7f4cSbjh21 bExpBigger:
936b7f4cSbjh21    if ( bExp == 0xFF ) {
936b7f4cSbjh21        if ( bSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21        return packFloat32( zSign ^ 1, 0xFF, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        ++expDiff;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        aSig |= 0x40000000;
936b7f4cSbjh21    }
936b7f4cSbjh21    shift32RightJamming( aSig, - expDiff, &aSig );
936b7f4cSbjh21    bSig |= 0x40000000;
936b7f4cSbjh21 bBigger:
936b7f4cSbjh21    zSig = bSig - aSig;
936b7f4cSbjh21    zExp = bExp;
936b7f4cSbjh21    zSign ^= 1;
936b7f4cSbjh21    goto normalizeRoundAndPack;
936b7f4cSbjh21 aExpBigger:
936b7f4cSbjh21    if ( aExp == 0xFF ) {
936b7f4cSbjh21        if ( aSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21        return a;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0 ) {
936b7f4cSbjh21        --expDiff;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        bSig |= 0x40000000;
936b7f4cSbjh21    }
936b7f4cSbjh21    shift32RightJamming( bSig, expDiff, &bSig );
936b7f4cSbjh21    aSig |= 0x40000000;
936b7f4cSbjh21 aBigger:
936b7f4cSbjh21    zSig = aSig - bSig;
936b7f4cSbjh21    zExp = aExp;
936b7f4cSbjh21 normalizeRoundAndPack:
936b7f4cSbjh21    --zExp;
936b7f4cSbjh21    return normalizeRoundAndPackFloat32( zSign, zExp, zSig );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of adding the single-precision floating-point values `a'
936b7f4cSbjh21and `b'.  The operation is performed according to the IEC/IEEE Standard for
936b7f4cSbjh21Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float32 float32_add( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    bSign = extractFloat32Sign( b );
936b7f4cSbjh21    if ( aSign == bSign ) {
936b7f4cSbjh21        return addFloat32Sigs( a, b, aSign );
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        return subFloat32Sigs( a, b, aSign );
936b7f4cSbjh21    }
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of subtracting the single-precision floating-point values
936b7f4cSbjh21`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
936b7f4cSbjh21for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float32 float32_sub( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    bSign = extractFloat32Sign( b );
936b7f4cSbjh21    if ( aSign == bSign ) {
936b7f4cSbjh21        return subFloat32Sigs( a, b, aSign );
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        return addFloat32Sigs( a, b, aSign );
936b7f4cSbjh21    }
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of multiplying the single-precision floating-point values
936b7f4cSbjh21`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
936b7f4cSbjh21for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float32 float32_mul( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign, zSign;
936b7f4cSbjh21    int16 aExp, bExp, zExp;
936b7f4cSbjh21    bits32 aSig, bSig, zSig0, zSig1;
936b7f4cSbjh21
936b7f4cSbjh21    aSig = extractFloat32Frac( a );
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    bSig = extractFloat32Frac( b );
936b7f4cSbjh21    bExp = extractFloat32Exp( b );
936b7f4cSbjh21    bSign = extractFloat32Sign( b );
936b7f4cSbjh21    zSign = aSign ^ bSign;
936b7f4cSbjh21    if ( aExp == 0xFF ) {
936b7f4cSbjh21        if ( aSig || ( ( bExp == 0xFF ) && bSig ) ) {
936b7f4cSbjh21            return propagateFloat32NaN( a, b );
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( ( bExp | bSig ) == 0 ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21            return float32_default_nan;
936b7f4cSbjh21        }
936b7f4cSbjh21        return packFloat32( zSign, 0xFF, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0xFF ) {
936b7f4cSbjh21        if ( bSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21        if ( ( aExp | aSig ) == 0 ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21            return float32_default_nan;
936b7f4cSbjh21        }
936b7f4cSbjh21        return packFloat32( zSign, 0xFF, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        if ( aSig == 0 ) return packFloat32( zSign, 0, 0 );
936b7f4cSbjh21        normalizeFloat32Subnormal( aSig, &aExp, &aSig );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0 ) {
936b7f4cSbjh21        if ( bSig == 0 ) return packFloat32( zSign, 0, 0 );
936b7f4cSbjh21        normalizeFloat32Subnormal( bSig, &bExp, &bSig );
936b7f4cSbjh21    }
936b7f4cSbjh21    zExp = aExp + bExp - 0x7F;
936b7f4cSbjh21    aSig = ( aSig | 0x00800000 )<<7;
936b7f4cSbjh21    bSig = ( bSig | 0x00800000 )<<8;
936b7f4cSbjh21    mul32To64( aSig, bSig, &zSig0, &zSig1 );
936b7f4cSbjh21    zSig0 |= ( zSig1 != 0 );
936b7f4cSbjh21    if ( 0 <= (sbits32) ( zSig0<<1 ) ) {
936b7f4cSbjh21        zSig0 <<= 1;
936b7f4cSbjh21        --zExp;
936b7f4cSbjh21    }
936b7f4cSbjh21    return roundAndPackFloat32( zSign, zExp, zSig0 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of dividing the single-precision floating-point value `a'
936b7f4cSbjh21by the corresponding value `b'.  The operation is performed according to the
936b7f4cSbjh21IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float32 float32_div( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign, zSign;
936b7f4cSbjh21    int16 aExp, bExp, zExp;
936b7f4cSbjh21    bits32 aSig, bSig, zSig, rem0, rem1, term0, term1;
936b7f4cSbjh21
936b7f4cSbjh21    aSig = extractFloat32Frac( a );
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    bSig = extractFloat32Frac( b );
936b7f4cSbjh21    bExp = extractFloat32Exp( b );
936b7f4cSbjh21    bSign = extractFloat32Sign( b );
936b7f4cSbjh21    zSign = aSign ^ bSign;
936b7f4cSbjh21    if ( aExp == 0xFF ) {
936b7f4cSbjh21        if ( aSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21        if ( bExp == 0xFF ) {
936b7f4cSbjh21            if ( bSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21            return float32_default_nan;
936b7f4cSbjh21        }
936b7f4cSbjh21        return packFloat32( zSign, 0xFF, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0xFF ) {
936b7f4cSbjh21        if ( bSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21        return packFloat32( zSign, 0, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0 ) {
936b7f4cSbjh21        if ( bSig == 0 ) {
936b7f4cSbjh21            if ( ( aExp | aSig ) == 0 ) {
936b7f4cSbjh21                float_raise( float_flag_invalid );
936b7f4cSbjh21                return float32_default_nan;
936b7f4cSbjh21            }
936b7f4cSbjh21            float_raise( float_flag_divbyzero );
936b7f4cSbjh21            return packFloat32( zSign, 0xFF, 0 );
936b7f4cSbjh21        }
936b7f4cSbjh21        normalizeFloat32Subnormal( bSig, &bExp, &bSig );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        if ( aSig == 0 ) return packFloat32( zSign, 0, 0 );
936b7f4cSbjh21        normalizeFloat32Subnormal( aSig, &aExp, &aSig );
936b7f4cSbjh21    }
936b7f4cSbjh21    zExp = aExp - bExp + 0x7D;
936b7f4cSbjh21    aSig = ( aSig | 0x00800000 )<<7;
936b7f4cSbjh21    bSig = ( bSig | 0x00800000 )<<8;
936b7f4cSbjh21    if ( bSig <= ( aSig + aSig ) ) {
936b7f4cSbjh21        aSig >>= 1;
936b7f4cSbjh21        ++zExp;
936b7f4cSbjh21    }
936b7f4cSbjh21    zSig = estimateDiv64To32( aSig, 0, bSig );
936b7f4cSbjh21    if ( ( zSig & 0x3F ) <= 2 ) {
936b7f4cSbjh21        mul32To64( bSig, zSig, &term0, &term1 );
936b7f4cSbjh21        sub64( aSig, 0, term0, term1, &rem0, &rem1 );
936b7f4cSbjh21        while ( (sbits32) rem0 < 0 ) {
936b7f4cSbjh21            --zSig;
936b7f4cSbjh21            add64( rem0, rem1, 0, bSig, &rem0, &rem1 );
936b7f4cSbjh21        }
936b7f4cSbjh21        zSig |= ( rem1 != 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    return roundAndPackFloat32( zSign, zExp, zSig );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the remainder of the single-precision floating-point value `a'
936b7f4cSbjh21with respect to the corresponding value `b'.  The operation is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float32 float32_rem( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign, zSign;
936b7f4cSbjh21    int16 aExp, bExp, expDiff;
936b7f4cSbjh21    bits32 aSig, bSig, q, allZero, alternateASig;
936b7f4cSbjh21    sbits32 sigMean;
936b7f4cSbjh21
936b7f4cSbjh21    aSig = extractFloat32Frac( a );
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    bSig = extractFloat32Frac( b );
936b7f4cSbjh21    bExp = extractFloat32Exp( b );
936b7f4cSbjh21    bSign = extractFloat32Sign( b );
936b7f4cSbjh21    if ( aExp == 0xFF ) {
936b7f4cSbjh21        if ( aSig || ( ( bExp == 0xFF ) && bSig ) ) {
936b7f4cSbjh21            return propagateFloat32NaN( a, b );
936b7f4cSbjh21        }
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return float32_default_nan;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0xFF ) {
936b7f4cSbjh21        if ( bSig ) return propagateFloat32NaN( a, b );
936b7f4cSbjh21        return a;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0 ) {
936b7f4cSbjh21        if ( bSig == 0 ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21            return float32_default_nan;
936b7f4cSbjh21        }
936b7f4cSbjh21        normalizeFloat32Subnormal( bSig, &bExp, &bSig );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        if ( aSig == 0 ) return a;
936b7f4cSbjh21        normalizeFloat32Subnormal( aSig, &aExp, &aSig );
936b7f4cSbjh21    }
936b7f4cSbjh21    expDiff = aExp - bExp;
936b7f4cSbjh21    aSig = ( aSig | 0x00800000 )<<8;
936b7f4cSbjh21    bSig = ( bSig | 0x00800000 )<<8;
936b7f4cSbjh21    if ( expDiff < 0 ) {
936b7f4cSbjh21        if ( expDiff < -1 ) return a;
936b7f4cSbjh21        aSig >>= 1;
936b7f4cSbjh21    }
936b7f4cSbjh21    q = ( bSig <= aSig );
936b7f4cSbjh21    if ( q ) aSig -= bSig;
936b7f4cSbjh21    expDiff -= 32;
936b7f4cSbjh21    while ( 0 < expDiff ) {
936b7f4cSbjh21        q = estimateDiv64To32( aSig, 0, bSig );
936b7f4cSbjh21        q = ( 2 < q ) ? q - 2 : 0;
936b7f4cSbjh21        aSig = - ( ( bSig>>2 ) * q );
936b7f4cSbjh21        expDiff -= 30;
936b7f4cSbjh21    }
936b7f4cSbjh21    expDiff += 32;
936b7f4cSbjh21    if ( 0 < expDiff ) {
936b7f4cSbjh21        q = estimateDiv64To32( aSig, 0, bSig );
936b7f4cSbjh21        q = ( 2 < q ) ? q - 2 : 0;
936b7f4cSbjh21        q >>= 32 - expDiff;
936b7f4cSbjh21        bSig >>= 2;
936b7f4cSbjh21        aSig = ( ( aSig>>1 )<<( expDiff - 1 ) ) - bSig * q;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        aSig >>= 2;
936b7f4cSbjh21        bSig >>= 2;
936b7f4cSbjh21    }
936b7f4cSbjh21    do {
936b7f4cSbjh21        alternateASig = aSig;
936b7f4cSbjh21        ++q;
936b7f4cSbjh21        aSig -= bSig;
936b7f4cSbjh21    } while ( 0 <= (sbits32) aSig );
936b7f4cSbjh21    sigMean = aSig + alternateASig;
936b7f4cSbjh21    if ( ( sigMean < 0 ) || ( ( sigMean == 0 ) && ( q & 1 ) ) ) {
936b7f4cSbjh21        aSig = alternateASig;
936b7f4cSbjh21    }
936b7f4cSbjh21    zSign = ( (sbits32) aSig < 0 );
936b7f4cSbjh21    if ( zSign ) aSig = - aSig;
936b7f4cSbjh21    return normalizeRoundAndPackFloat32( aSign ^ zSign, bExp, aSig );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21#endif
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the square root of the single-precision floating-point value `a'.
936b7f4cSbjh21The operation is performed according to the IEC/IEEE Standard for Binary
936b7f4cSbjh21Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float32 float32_sqrt( float32 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp, zExp;
936b7f4cSbjh21    bits32 aSig, zSig, rem0, rem1, term0, term1;
936b7f4cSbjh21
936b7f4cSbjh21    aSig = extractFloat32Frac( a );
936b7f4cSbjh21    aExp = extractFloat32Exp( a );
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    if ( aExp == 0xFF ) {
936b7f4cSbjh21        if ( aSig ) return propagateFloat32NaN( a, 0 );
936b7f4cSbjh21        if ( ! aSign ) return a;
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return float32_default_nan;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aSign ) {
936b7f4cSbjh21        if ( ( aExp | aSig ) == 0 ) return a;
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return float32_default_nan;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        if ( aSig == 0 ) return 0;
936b7f4cSbjh21        normalizeFloat32Subnormal( aSig, &aExp, &aSig );
936b7f4cSbjh21    }
936b7f4cSbjh21    zExp = ( ( aExp - 0x7F )>>1 ) + 0x7E;
936b7f4cSbjh21    aSig = ( aSig | 0x00800000 )<<8;
936b7f4cSbjh21    zSig = estimateSqrt32( aExp, aSig ) + 2;
936b7f4cSbjh21    if ( ( zSig & 0x7F ) <= 5 ) {
936b7f4cSbjh21        if ( zSig < 2 ) {
936b7f4cSbjh21            zSig = 0x7FFFFFFF;
936b7f4cSbjh21            goto roundAndPack;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            aSig >>= aExp & 1;
936b7f4cSbjh21            mul32To64( zSig, zSig, &term0, &term1 );
936b7f4cSbjh21            sub64( aSig, 0, term0, term1, &rem0, &rem1 );
936b7f4cSbjh21            while ( (sbits32) rem0 < 0 ) {
936b7f4cSbjh21                --zSig;
936b7f4cSbjh21                shortShift64Left( 0, zSig, 1, &term0, &term1 );
936b7f4cSbjh21                term1 |= 1;
936b7f4cSbjh21                add64( rem0, rem1, term0, term1, &rem0, &rem1 );
936b7f4cSbjh21            }
936b7f4cSbjh21            zSig |= ( ( rem0 | rem1 ) != 0 );
936b7f4cSbjh21        }
936b7f4cSbjh21    }
936b7f4cSbjh21    shift32RightJamming( zSig, 1, &zSig );
936b7f4cSbjh21 roundAndPack:
936b7f4cSbjh21    return roundAndPackFloat32( 0, zExp, zSig );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21#endif
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the single-precision floating-point value `a' is equal to
936b7f4cSbjh21the corresponding value `b', and 0 otherwise.  The comparison is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float32_eq( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21
936b7f4cSbjh21    if (    ( ( extractFloat32Exp( a ) == 0xFF ) && extractFloat32Frac( a ) )
936b7f4cSbjh21         || ( ( extractFloat32Exp( b ) == 0xFF ) && extractFloat32Frac( b ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        if ( float32_is_signaling_nan( a ) || float32_is_signaling_nan( b ) ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21        }
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    return ( a == b ) || ( (bits32) ( ( a | b )<<1 ) == 0 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the single-precision floating-point value `a' is less than
936b7f4cSbjh21or equal to the corresponding value `b', and 0 otherwise.  The comparison
936b7f4cSbjh21is performed according to the IEC/IEEE Standard for Binary Floating-Point
936b7f4cSbjh21Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float32_le( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    if (    ( ( extractFloat32Exp( a ) == 0xFF ) && extractFloat32Frac( a ) )
936b7f4cSbjh21         || ( ( extractFloat32Exp( b ) == 0xFF ) && extractFloat32Frac( b ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    bSign = extractFloat32Sign( b );
936b7f4cSbjh21    if ( aSign != bSign ) return aSign || ( (bits32) ( ( a | b )<<1 ) == 0 );
936b7f4cSbjh21    return ( a == b ) || ( aSign ^ ( a < b ) );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the single-precision floating-point value `a' is less than
936b7f4cSbjh21the corresponding value `b', and 0 otherwise.  The comparison is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float32_lt( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    if (    ( ( extractFloat32Exp( a ) == 0xFF ) && extractFloat32Frac( a ) )
936b7f4cSbjh21         || ( ( extractFloat32Exp( b ) == 0xFF ) && extractFloat32Frac( b ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    bSign = extractFloat32Sign( b );
936b7f4cSbjh21    if ( aSign != bSign ) return aSign && ( (bits32) ( ( a | b )<<1 ) != 0 );
936b7f4cSbjh21    return ( a != b ) && ( aSign ^ ( a < b ) );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC /* Not needed */
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the single-precision floating-point value `a' is equal to
936b7f4cSbjh21the corresponding value `b', and 0 otherwise.  The invalid exception is
936b7f4cSbjh21raised if either operand is a NaN.  Otherwise, the comparison is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float32_eq_signaling( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21
936b7f4cSbjh21    if (    ( ( extractFloat32Exp( a ) == 0xFF ) && extractFloat32Frac( a ) )
936b7f4cSbjh21         || ( ( extractFloat32Exp( b ) == 0xFF ) && extractFloat32Frac( b ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    return ( a == b ) || ( (bits32) ( ( a | b )<<1 ) == 0 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the single-precision floating-point value `a' is less than or
936b7f4cSbjh21equal to the corresponding value `b', and 0 otherwise.  Quiet NaNs do not
936b7f4cSbjh21cause an exception.  Otherwise, the comparison is performed according to the
936b7f4cSbjh21IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float32_le_quiet( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21    int16 aExp, bExp;
936b7f4cSbjh21
936b7f4cSbjh21    if (    ( ( extractFloat32Exp( a ) == 0xFF ) && extractFloat32Frac( a ) )
936b7f4cSbjh21         || ( ( extractFloat32Exp( b ) == 0xFF ) && extractFloat32Frac( b ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        if ( float32_is_signaling_nan( a ) || float32_is_signaling_nan( b ) ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21        }
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    bSign = extractFloat32Sign( b );
936b7f4cSbjh21    if ( aSign != bSign ) return aSign || ( (bits32) ( ( a | b )<<1 ) == 0 );
936b7f4cSbjh21    return ( a == b ) || ( aSign ^ ( a < b ) );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the single-precision floating-point value `a' is less than
936b7f4cSbjh21the corresponding value `b', and 0 otherwise.  Quiet NaNs do not cause an
936b7f4cSbjh21exception.  Otherwise, the comparison is performed according to the IEC/IEEE
936b7f4cSbjh21Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float32_lt_quiet( float32 a, float32 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    if (    ( ( extractFloat32Exp( a ) == 0xFF ) && extractFloat32Frac( a ) )
936b7f4cSbjh21         || ( ( extractFloat32Exp( b ) == 0xFF ) && extractFloat32Frac( b ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        if ( float32_is_signaling_nan( a ) || float32_is_signaling_nan( b ) ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21        }
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSign = extractFloat32Sign( a );
936b7f4cSbjh21    bSign = extractFloat32Sign( b );
936b7f4cSbjh21    if ( aSign != bSign ) return aSign && ( (bits32) ( ( a | b )<<1 ) != 0 );
936b7f4cSbjh21    return ( a != b ) && ( aSign ^ ( a < b ) );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21#endif /* !SOFTFLOAT_FOR_GCC */
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC /* Not needed */
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of converting the double-precision floating-point value
936b7f4cSbjh21`a' to the 32-bit two's complement integer format.  The conversion is
936b7f4cSbjh21performed according to the IEC/IEEE Standard for Binary Floating-Point
936b7f4cSbjh21Arithmetic---which means in particular that the conversion is rounded
936b7f4cSbjh21according to the current rounding mode.  If `a' is a NaN, the largest
936b7f4cSbjh21positive integer is returned.  Otherwise, if the conversion overflows, the
936b7f4cSbjh21largest integer with the same sign as `a' is returned.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21int32 float64_to_int32( float64 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp, shiftCount;
936b7f4cSbjh21    bits32 aSig0, aSig1, absZ, aSigExtra;
936b7f4cSbjh21    int32 z;
936b7f4cSbjh21    int8 roundingMode;
936b7f4cSbjh21
936b7f4cSbjh21    aSig1 = extractFloat64Frac1( a );
936b7f4cSbjh21    aSig0 = extractFloat64Frac0( a );
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    shiftCount = aExp - 0x413;
936b7f4cSbjh21    if ( 0 <= shiftCount ) {
936b7f4cSbjh21        if ( 0x41E < aExp ) {
936b7f4cSbjh21            if ( ( aExp == 0x7FF ) && ( aSig0 | aSig1 ) ) aSign = 0;
936b7f4cSbjh21            goto invalid;
936b7f4cSbjh21        }
936b7f4cSbjh21        shortShift64Left(
936b7f4cSbjh21            aSig0 | 0x00100000, aSig1, shiftCount, &absZ, &aSigExtra );
936b7f4cSbjh21        if ( 0x80000000 < absZ ) goto invalid;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        aSig1 = ( aSig1 != 0 );
936b7f4cSbjh21        if ( aExp < 0x3FE ) {
936b7f4cSbjh21            aSigExtra = aExp | aSig0 | aSig1;
936b7f4cSbjh21            absZ = 0;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            aSig0 |= 0x00100000;
936b7f4cSbjh21            aSigExtra = ( aSig0<<( shiftCount & 31 ) ) | aSig1;
936b7f4cSbjh21            absZ = aSig0>>( - shiftCount );
936b7f4cSbjh21        }
936b7f4cSbjh21    }
936b7f4cSbjh21    roundingMode = float_rounding_mode;
936b7f4cSbjh21    if ( roundingMode == float_round_nearest_even ) {
936b7f4cSbjh21        if ( (sbits32) aSigExtra < 0 ) {
936b7f4cSbjh21            ++absZ;
936b7f4cSbjh21            if ( (bits32) ( aSigExtra<<1 ) == 0 ) absZ &= ~1;
936b7f4cSbjh21        }
936b7f4cSbjh21        z = aSign ? - absZ : absZ;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        aSigExtra = ( aSigExtra != 0 );
936b7f4cSbjh21        if ( aSign ) {
936b7f4cSbjh21            z = - (   absZ
936b7f4cSbjh21                    + ( ( roundingMode == float_round_down ) & aSigExtra ) );
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            z = absZ + ( ( roundingMode == float_round_up ) & aSigExtra );
936b7f4cSbjh21        }
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( ( aSign ^ ( z < 0 ) ) && z ) {
936b7f4cSbjh21 invalid:
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return aSign ? (sbits32) 0x80000000 : 0x7FFFFFFF;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aSigExtra ) float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21    return z;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21#endif /* !SOFTFLOAT_FOR_GCC */
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of converting the double-precision floating-point value
936b7f4cSbjh21`a' to the 32-bit two's complement integer format.  The conversion is
936b7f4cSbjh21performed according to the IEC/IEEE Standard for Binary Floating-Point
936b7f4cSbjh21Arithmetic, except that the conversion is always rounded toward zero.
936b7f4cSbjh21If `a' is a NaN, the largest positive integer is returned.  Otherwise, if
936b7f4cSbjh21the conversion overflows, the largest integer with the same sign as `a' is
936b7f4cSbjh21returned.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21int32 float64_to_int32_round_to_zero( float64 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp, shiftCount;
936b7f4cSbjh21    bits32 aSig0, aSig1, absZ, aSigExtra;
936b7f4cSbjh21    int32 z;
936b7f4cSbjh21
936b7f4cSbjh21    aSig1 = extractFloat64Frac1( a );
936b7f4cSbjh21    aSig0 = extractFloat64Frac0( a );
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    shiftCount = aExp - 0x413;
936b7f4cSbjh21    if ( 0 <= shiftCount ) {
936b7f4cSbjh21        if ( 0x41E < aExp ) {
936b7f4cSbjh21            if ( ( aExp == 0x7FF ) && ( aSig0 | aSig1 ) ) aSign = 0;
936b7f4cSbjh21            goto invalid;
936b7f4cSbjh21        }
936b7f4cSbjh21        shortShift64Left(
936b7f4cSbjh21            aSig0 | 0x00100000, aSig1, shiftCount, &absZ, &aSigExtra );
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        if ( aExp < 0x3FF ) {
936b7f4cSbjh21            if ( aExp | aSig0 | aSig1 ) {
936b7f4cSbjh21                float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21            }
936b7f4cSbjh21            return 0;
936b7f4cSbjh21        }
936b7f4cSbjh21        aSig0 |= 0x00100000;
936b7f4cSbjh21        aSigExtra = ( aSig0<<( shiftCount & 31 ) ) | aSig1;
936b7f4cSbjh21        absZ = aSig0>>( - shiftCount );
936b7f4cSbjh21    }
936b7f4cSbjh21    z = aSign ? - absZ : absZ;
936b7f4cSbjh21    if ( ( aSign ^ ( z < 0 ) ) && z ) {
936b7f4cSbjh21 invalid:
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return aSign ? (sbits32) 0x80000000 : 0x7FFFFFFF;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aSigExtra ) float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21    return z;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of converting the double-precision floating-point value
936b7f4cSbjh21`a' to the single-precision floating-point format.  The conversion is
936b7f4cSbjh21performed according to the IEC/IEEE Standard for Binary Floating-Point
936b7f4cSbjh21Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float32 float64_to_float32( float64 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp;
936b7f4cSbjh21    bits32 aSig0, aSig1, zSig;
936b7f4cSbjh21    bits32 allZero;
936b7f4cSbjh21
936b7f4cSbjh21    aSig1 = extractFloat64Frac1( a );
936b7f4cSbjh21    aSig0 = extractFloat64Frac0( a );
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    if ( aExp == 0x7FF ) {
936b7f4cSbjh21        if ( aSig0 | aSig1 ) {
936b7f4cSbjh21            return commonNaNToFloat32( float64ToCommonNaN( a ) );
936b7f4cSbjh21        }
936b7f4cSbjh21        return packFloat32( aSign, 0xFF, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    shift64RightJamming( aSig0, aSig1, 22, &allZero, &zSig );
936b7f4cSbjh21    if ( aExp ) zSig |= 0x40000000;
936b7f4cSbjh21    return roundAndPackFloat32( aSign, aExp - 0x381, zSig );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Rounds the double-precision floating-point value `a' to an integer,
936b7f4cSbjh21and returns the result as a double-precision floating-point value.  The
936b7f4cSbjh21operation is performed according to the IEC/IEEE Standard for Binary
936b7f4cSbjh21Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float64 float64_round_to_int( float64 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp;
936b7f4cSbjh21    bits32 lastBitMask, roundBitsMask;
936b7f4cSbjh21    int8 roundingMode;
936b7f4cSbjh21    float64 z;
936b7f4cSbjh21
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    if ( 0x413 <= aExp ) {
936b7f4cSbjh21        if ( 0x433 <= aExp ) {
936b7f4cSbjh21            if (    ( aExp == 0x7FF )
936b7f4cSbjh21                 && ( extractFloat64Frac0( a ) | extractFloat64Frac1( a ) ) ) {
936b7f4cSbjh21                return propagateFloat64NaN( a, a );
936b7f4cSbjh21            }
936b7f4cSbjh21            return a;
936b7f4cSbjh21        }
936b7f4cSbjh21        lastBitMask = 1;
936b7f4cSbjh21        lastBitMask = ( lastBitMask<<( 0x432 - aExp ) )<<1;
936b7f4cSbjh21        roundBitsMask = lastBitMask - 1;
936b7f4cSbjh21        z = a;
936b7f4cSbjh21        roundingMode = float_rounding_mode;
936b7f4cSbjh21        if ( roundingMode == float_round_nearest_even ) {
936b7f4cSbjh21            if ( lastBitMask ) {
936b7f4cSbjh21                add64( z.high, z.low, 0, lastBitMask>>1, &z.high, &z.low );
936b7f4cSbjh21                if ( ( z.low & roundBitsMask ) == 0 ) z.low &= ~ lastBitMask;
936b7f4cSbjh21            }
936b7f4cSbjh21            else {
936b7f4cSbjh21                if ( (sbits32) z.low < 0 ) {
936b7f4cSbjh21                    ++z.high;
936b7f4cSbjh21                    if ( (bits32) ( z.low<<1 ) == 0 ) z.high &= ~1;
936b7f4cSbjh21                }
936b7f4cSbjh21            }
936b7f4cSbjh21        }
936b7f4cSbjh21        else if ( roundingMode != float_round_to_zero ) {
936b7f4cSbjh21            if (   extractFloat64Sign( z )
936b7f4cSbjh21                 ^ ( roundingMode == float_round_up ) ) {
936b7f4cSbjh21                add64( z.high, z.low, 0, roundBitsMask, &z.high, &z.low );
936b7f4cSbjh21            }
936b7f4cSbjh21        }
936b7f4cSbjh21        z.low &= ~ roundBitsMask;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        if ( aExp <= 0x3FE ) {
936b7f4cSbjh21            if ( ( ( (bits32) ( a.high<<1 ) ) | a.low ) == 0 ) return a;
936b7f4cSbjh21            float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21            aSign = extractFloat64Sign( a );
936b7f4cSbjh21            switch ( float_rounding_mode ) {
936b7f4cSbjh21             case float_round_nearest_even:
936b7f4cSbjh21                if (    ( aExp == 0x3FE )
936b7f4cSbjh21                     && ( extractFloat64Frac0( a ) | extractFloat64Frac1( a ) )
936b7f4cSbjh21                   ) {
936b7f4cSbjh21                    return packFloat64( aSign, 0x3FF, 0, 0 );
936b7f4cSbjh21                }
936b7f4cSbjh21                break;
936b7f4cSbjh21             case float_round_down:
936b7f4cSbjh21                return
936b7f4cSbjh21                      aSign ? packFloat64( 1, 0x3FF, 0, 0 )
936b7f4cSbjh21                    : packFloat64( 0, 0, 0, 0 );
936b7f4cSbjh21             case float_round_up:
936b7f4cSbjh21                return
936b7f4cSbjh21                      aSign ? packFloat64( 1, 0, 0, 0 )
936b7f4cSbjh21                    : packFloat64( 0, 0x3FF, 0, 0 );
936b7f4cSbjh21            }
936b7f4cSbjh21            return packFloat64( aSign, 0, 0, 0 );
936b7f4cSbjh21        }
936b7f4cSbjh21        lastBitMask = 1;
936b7f4cSbjh21        lastBitMask <<= 0x413 - aExp;
936b7f4cSbjh21        roundBitsMask = lastBitMask - 1;
936b7f4cSbjh21        z.low = 0;
936b7f4cSbjh21        z.high = a.high;
936b7f4cSbjh21        roundingMode = float_rounding_mode;
936b7f4cSbjh21        if ( roundingMode == float_round_nearest_even ) {
936b7f4cSbjh21            z.high += lastBitMask>>1;
936b7f4cSbjh21            if ( ( ( z.high & roundBitsMask ) | a.low ) == 0 ) {
936b7f4cSbjh21                z.high &= ~ lastBitMask;
936b7f4cSbjh21            }
936b7f4cSbjh21        }
936b7f4cSbjh21        else if ( roundingMode != float_round_to_zero ) {
936b7f4cSbjh21            if (   extractFloat64Sign( z )
936b7f4cSbjh21                 ^ ( roundingMode == float_round_up ) ) {
936b7f4cSbjh21                z.high |= ( a.low != 0 );
936b7f4cSbjh21                z.high += roundBitsMask;
936b7f4cSbjh21            }
936b7f4cSbjh21        }
936b7f4cSbjh21        z.high &= ~ roundBitsMask;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( ( z.low != a.low ) || ( z.high != a.high ) ) {
936b7f4cSbjh21        float_exception_flags |= float_flag_inexact;
936b7f4cSbjh21    }
936b7f4cSbjh21    return z;
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21#endif
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of adding the absolute values of the double-precision
936b7f4cSbjh21floating-point values `a' and `b'.  If `zSign' is 1, the sum is negated
936b7f4cSbjh21before being returned.  `zSign' is ignored if the result is a NaN.
936b7f4cSbjh21The addition is performed according to the IEC/IEEE Standard for Binary
936b7f4cSbjh21Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static float64 addFloat64Sigs( float64 a, float64 b, flag zSign )
936b7f4cSbjh21{
936b7f4cSbjh21    int16 aExp, bExp, zExp;
936b7f4cSbjh21    bits32 aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2;
936b7f4cSbjh21    int16 expDiff;
936b7f4cSbjh21
936b7f4cSbjh21    aSig1 = extractFloat64Frac1( a );
936b7f4cSbjh21    aSig0 = extractFloat64Frac0( a );
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    bSig1 = extractFloat64Frac1( b );
936b7f4cSbjh21    bSig0 = extractFloat64Frac0( b );
936b7f4cSbjh21    bExp = extractFloat64Exp( b );
936b7f4cSbjh21    expDiff = aExp - bExp;
936b7f4cSbjh21    if ( 0 < expDiff ) {
936b7f4cSbjh21        if ( aExp == 0x7FF ) {
936b7f4cSbjh21            if ( aSig0 | aSig1 ) return propagateFloat64NaN( a, b );
936b7f4cSbjh21            return a;
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( bExp == 0 ) {
936b7f4cSbjh21            --expDiff;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            bSig0 |= 0x00100000;
936b7f4cSbjh21        }
936b7f4cSbjh21        shift64ExtraRightJamming(
936b7f4cSbjh21            bSig0, bSig1, 0, expDiff, &bSig0, &bSig1, &zSig2 );
936b7f4cSbjh21        zExp = aExp;
936b7f4cSbjh21    }
936b7f4cSbjh21    else if ( expDiff < 0 ) {
936b7f4cSbjh21        if ( bExp == 0x7FF ) {
936b7f4cSbjh21            if ( bSig0 | bSig1 ) return propagateFloat64NaN( a, b );
936b7f4cSbjh21            return packFloat64( zSign, 0x7FF, 0, 0 );
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( aExp == 0 ) {
936b7f4cSbjh21            ++expDiff;
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            aSig0 |= 0x00100000;
936b7f4cSbjh21        }
936b7f4cSbjh21        shift64ExtraRightJamming(
936b7f4cSbjh21            aSig0, aSig1, 0, - expDiff, &aSig0, &aSig1, &zSig2 );
936b7f4cSbjh21        zExp = bExp;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        if ( aExp == 0x7FF ) {
936b7f4cSbjh21            if ( aSig0 | aSig1 | bSig0 | bSig1 ) {
936b7f4cSbjh21                return propagateFloat64NaN( a, b );
936b7f4cSbjh21            }
936b7f4cSbjh21            return a;
936b7f4cSbjh21        }
936b7f4cSbjh21        add64( aSig0, aSig1, bSig0, bSig1, &zSig0, &zSig1 );
936b7f4cSbjh21        if ( aExp == 0 ) return packFloat64( zSign, 0, zSig0, zSig1 );
936b7f4cSbjh21        zSig2 = 0;
936b7f4cSbjh21        zSig0 |= 0x00200000;
936b7f4cSbjh21        zExp = aExp;
936b7f4cSbjh21        goto shiftRight1;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSig0 |= 0x00100000;
936b7f4cSbjh21    add64( aSig0, aSig1, bSig0, bSig1, &zSig0, &zSig1 );
936b7f4cSbjh21    --zExp;
936b7f4cSbjh21    if ( zSig0 < 0x00200000 ) goto roundAndPack;
936b7f4cSbjh21    ++zExp;
936b7f4cSbjh21 shiftRight1:
936b7f4cSbjh21    shift64ExtraRightJamming( zSig0, zSig1, zSig2, 1, &zSig0, &zSig1, &zSig2 );
936b7f4cSbjh21 roundAndPack:
936b7f4cSbjh21    return roundAndPackFloat64( zSign, zExp, zSig0, zSig1, zSig2 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of subtracting the absolute values of the double-
936b7f4cSbjh21precision floating-point values `a' and `b'.  If `zSign' is 1, the
936b7f4cSbjh21difference is negated before being returned.  `zSign' is ignored if the
936b7f4cSbjh21result is a NaN.  The subtraction is performed according to the IEC/IEEE
936b7f4cSbjh21Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21static float64 subFloat64Sigs( float64 a, float64 b, flag zSign )
936b7f4cSbjh21{
936b7f4cSbjh21    int16 aExp, bExp, zExp;
936b7f4cSbjh21    bits32 aSig0, aSig1, bSig0, bSig1, zSig0, zSig1;
936b7f4cSbjh21    int16 expDiff;
936b7f4cSbjh21
936b7f4cSbjh21    aSig1 = extractFloat64Frac1( a );
936b7f4cSbjh21    aSig0 = extractFloat64Frac0( a );
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    bSig1 = extractFloat64Frac1( b );
936b7f4cSbjh21    bSig0 = extractFloat64Frac0( b );
936b7f4cSbjh21    bExp = extractFloat64Exp( b );
936b7f4cSbjh21    expDiff = aExp - bExp;
936b7f4cSbjh21    shortShift64Left( aSig0, aSig1, 10, &aSig0, &aSig1 );
936b7f4cSbjh21    shortShift64Left( bSig0, bSig1, 10, &bSig0, &bSig1 );
936b7f4cSbjh21    if ( 0 < expDiff ) goto aExpBigger;
936b7f4cSbjh21    if ( expDiff < 0 ) goto bExpBigger;
936b7f4cSbjh21    if ( aExp == 0x7FF ) {
936b7f4cSbjh21        if ( aSig0 | aSig1 | bSig0 | bSig1 ) {
936b7f4cSbjh21            return propagateFloat64NaN( a, b );
936b7f4cSbjh21        }
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return float64_default_nan;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        aExp = 1;
936b7f4cSbjh21        bExp = 1;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bSig0 < aSig0 ) goto aBigger;
936b7f4cSbjh21    if ( aSig0 < bSig0 ) goto bBigger;
936b7f4cSbjh21    if ( bSig1 < aSig1 ) goto aBigger;
936b7f4cSbjh21    if ( aSig1 < bSig1 ) goto bBigger;
936b7f4cSbjh21    return packFloat64( float_rounding_mode == float_round_down, 0, 0, 0 );
936b7f4cSbjh21 bExpBigger:
936b7f4cSbjh21    if ( bExp == 0x7FF ) {
936b7f4cSbjh21        if ( bSig0 | bSig1 ) return propagateFloat64NaN( a, b );
936b7f4cSbjh21        return packFloat64( zSign ^ 1, 0x7FF, 0, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        ++expDiff;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        aSig0 |= 0x40000000;
936b7f4cSbjh21    }
936b7f4cSbjh21    shift64RightJamming( aSig0, aSig1, - expDiff, &aSig0, &aSig1 );
936b7f4cSbjh21    bSig0 |= 0x40000000;
936b7f4cSbjh21 bBigger:
936b7f4cSbjh21    sub64( bSig0, bSig1, aSig0, aSig1, &zSig0, &zSig1 );
936b7f4cSbjh21    zExp = bExp;
936b7f4cSbjh21    zSign ^= 1;
936b7f4cSbjh21    goto normalizeRoundAndPack;
936b7f4cSbjh21 aExpBigger:
936b7f4cSbjh21    if ( aExp == 0x7FF ) {
936b7f4cSbjh21        if ( aSig0 | aSig1 ) return propagateFloat64NaN( a, b );
936b7f4cSbjh21        return a;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0 ) {
936b7f4cSbjh21        --expDiff;
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        bSig0 |= 0x40000000;
936b7f4cSbjh21    }
936b7f4cSbjh21    shift64RightJamming( bSig0, bSig1, expDiff, &bSig0, &bSig1 );
936b7f4cSbjh21    aSig0 |= 0x40000000;
936b7f4cSbjh21 aBigger:
936b7f4cSbjh21    sub64( aSig0, aSig1, bSig0, bSig1, &zSig0, &zSig1 );
936b7f4cSbjh21    zExp = aExp;
936b7f4cSbjh21 normalizeRoundAndPack:
936b7f4cSbjh21    --zExp;
936b7f4cSbjh21    return normalizeRoundAndPackFloat64( zSign, zExp - 10, zSig0, zSig1 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of adding the double-precision floating-point values `a'
936b7f4cSbjh21and `b'.  The operation is performed according to the IEC/IEEE Standard for
936b7f4cSbjh21Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float64 float64_add( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    bSign = extractFloat64Sign( b );
936b7f4cSbjh21    if ( aSign == bSign ) {
936b7f4cSbjh21        return addFloat64Sigs( a, b, aSign );
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        return subFloat64Sigs( a, b, aSign );
936b7f4cSbjh21    }
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of subtracting the double-precision floating-point values
936b7f4cSbjh21`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
936b7f4cSbjh21for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float64 float64_sub( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    bSign = extractFloat64Sign( b );
936b7f4cSbjh21    if ( aSign == bSign ) {
936b7f4cSbjh21        return subFloat64Sigs( a, b, aSign );
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        return addFloat64Sigs( a, b, aSign );
936b7f4cSbjh21    }
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of multiplying the double-precision floating-point values
936b7f4cSbjh21`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
936b7f4cSbjh21for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float64 float64_mul( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign, zSign;
936b7f4cSbjh21    int16 aExp, bExp, zExp;
936b7f4cSbjh21    bits32 aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2, zSig3;
936b7f4cSbjh21
936b7f4cSbjh21    aSig1 = extractFloat64Frac1( a );
936b7f4cSbjh21    aSig0 = extractFloat64Frac0( a );
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    bSig1 = extractFloat64Frac1( b );
936b7f4cSbjh21    bSig0 = extractFloat64Frac0( b );
936b7f4cSbjh21    bExp = extractFloat64Exp( b );
936b7f4cSbjh21    bSign = extractFloat64Sign( b );
936b7f4cSbjh21    zSign = aSign ^ bSign;
936b7f4cSbjh21    if ( aExp == 0x7FF ) {
936b7f4cSbjh21        if (    ( aSig0 | aSig1 )
936b7f4cSbjh21             || ( ( bExp == 0x7FF ) && ( bSig0 | bSig1 ) ) ) {
936b7f4cSbjh21            return propagateFloat64NaN( a, b );
936b7f4cSbjh21        }
936b7f4cSbjh21        if ( ( bExp | bSig0 | bSig1 ) == 0 ) goto invalid;
936b7f4cSbjh21        return packFloat64( zSign, 0x7FF, 0, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0x7FF ) {
936b7f4cSbjh21        if ( bSig0 | bSig1 ) return propagateFloat64NaN( a, b );
936b7f4cSbjh21        if ( ( aExp | aSig0 | aSig1 ) == 0 ) {
936b7f4cSbjh21 invalid:
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21            return float64_default_nan;
936b7f4cSbjh21        }
936b7f4cSbjh21        return packFloat64( zSign, 0x7FF, 0, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        if ( ( aSig0 | aSig1 ) == 0 ) return packFloat64( zSign, 0, 0, 0 );
936b7f4cSbjh21        normalizeFloat64Subnormal( aSig0, aSig1, &aExp, &aSig0, &aSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0 ) {
936b7f4cSbjh21        if ( ( bSig0 | bSig1 ) == 0 ) return packFloat64( zSign, 0, 0, 0 );
936b7f4cSbjh21        normalizeFloat64Subnormal( bSig0, bSig1, &bExp, &bSig0, &bSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    zExp = aExp + bExp - 0x400;
936b7f4cSbjh21    aSig0 |= 0x00100000;
936b7f4cSbjh21    shortShift64Left( bSig0, bSig1, 12, &bSig0, &bSig1 );
936b7f4cSbjh21    mul64To128( aSig0, aSig1, bSig0, bSig1, &zSig0, &zSig1, &zSig2, &zSig3 );
936b7f4cSbjh21    add64( zSig0, zSig1, aSig0, aSig1, &zSig0, &zSig1 );
936b7f4cSbjh21    zSig2 |= ( zSig3 != 0 );
936b7f4cSbjh21    if ( 0x00200000 <= zSig0 ) {
936b7f4cSbjh21        shift64ExtraRightJamming(
936b7f4cSbjh21            zSig0, zSig1, zSig2, 1, &zSig0, &zSig1, &zSig2 );
936b7f4cSbjh21        ++zExp;
936b7f4cSbjh21    }
936b7f4cSbjh21    return roundAndPackFloat64( zSign, zExp, zSig0, zSig1, zSig2 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the result of dividing the double-precision floating-point value `a'
936b7f4cSbjh21by the corresponding value `b'.  The operation is performed according to the
936b7f4cSbjh21IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float64 float64_div( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign, zSign;
936b7f4cSbjh21    int16 aExp, bExp, zExp;
936b7f4cSbjh21    bits32 aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2;
936b7f4cSbjh21    bits32 rem0, rem1, rem2, rem3, term0, term1, term2, term3;
936b7f4cSbjh21
936b7f4cSbjh21    aSig1 = extractFloat64Frac1( a );
936b7f4cSbjh21    aSig0 = extractFloat64Frac0( a );
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    bSig1 = extractFloat64Frac1( b );
936b7f4cSbjh21    bSig0 = extractFloat64Frac0( b );
936b7f4cSbjh21    bExp = extractFloat64Exp( b );
936b7f4cSbjh21    bSign = extractFloat64Sign( b );
936b7f4cSbjh21    zSign = aSign ^ bSign;
936b7f4cSbjh21    if ( aExp == 0x7FF ) {
936b7f4cSbjh21        if ( aSig0 | aSig1 ) return propagateFloat64NaN( a, b );
936b7f4cSbjh21        if ( bExp == 0x7FF ) {
936b7f4cSbjh21            if ( bSig0 | bSig1 ) return propagateFloat64NaN( a, b );
936b7f4cSbjh21            goto invalid;
936b7f4cSbjh21        }
936b7f4cSbjh21        return packFloat64( zSign, 0x7FF, 0, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0x7FF ) {
936b7f4cSbjh21        if ( bSig0 | bSig1 ) return propagateFloat64NaN( a, b );
936b7f4cSbjh21        return packFloat64( zSign, 0, 0, 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0 ) {
936b7f4cSbjh21        if ( ( bSig0 | bSig1 ) == 0 ) {
936b7f4cSbjh21            if ( ( aExp | aSig0 | aSig1 ) == 0 ) {
936b7f4cSbjh21 invalid:
936b7f4cSbjh21                float_raise( float_flag_invalid );
936b7f4cSbjh21                return float64_default_nan;
936b7f4cSbjh21            }
936b7f4cSbjh21            float_raise( float_flag_divbyzero );
936b7f4cSbjh21            return packFloat64( zSign, 0x7FF, 0, 0 );
936b7f4cSbjh21        }
936b7f4cSbjh21        normalizeFloat64Subnormal( bSig0, bSig1, &bExp, &bSig0, &bSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        if ( ( aSig0 | aSig1 ) == 0 ) return packFloat64( zSign, 0, 0, 0 );
936b7f4cSbjh21        normalizeFloat64Subnormal( aSig0, aSig1, &aExp, &aSig0, &aSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    zExp = aExp - bExp + 0x3FD;
936b7f4cSbjh21    shortShift64Left( aSig0 | 0x00100000, aSig1, 11, &aSig0, &aSig1 );
936b7f4cSbjh21    shortShift64Left( bSig0 | 0x00100000, bSig1, 11, &bSig0, &bSig1 );
936b7f4cSbjh21    if ( le64( bSig0, bSig1, aSig0, aSig1 ) ) {
936b7f4cSbjh21        shift64Right( aSig0, aSig1, 1, &aSig0, &aSig1 );
936b7f4cSbjh21        ++zExp;
936b7f4cSbjh21    }
936b7f4cSbjh21    zSig0 = estimateDiv64To32( aSig0, aSig1, bSig0 );
936b7f4cSbjh21    mul64By32To96( bSig0, bSig1, zSig0, &term0, &term1, &term2 );
936b7f4cSbjh21    sub96( aSig0, aSig1, 0, term0, term1, term2, &rem0, &rem1, &rem2 );
936b7f4cSbjh21    while ( (sbits32) rem0 < 0 ) {
936b7f4cSbjh21        --zSig0;
936b7f4cSbjh21        add96( rem0, rem1, rem2, 0, bSig0, bSig1, &rem0, &rem1, &rem2 );
936b7f4cSbjh21    }
936b7f4cSbjh21    zSig1 = estimateDiv64To32( rem1, rem2, bSig0 );
936b7f4cSbjh21    if ( ( zSig1 & 0x3FF ) <= 4 ) {
936b7f4cSbjh21        mul64By32To96( bSig0, bSig1, zSig1, &term1, &term2, &term3 );
936b7f4cSbjh21        sub96( rem1, rem2, 0, term1, term2, term3, &rem1, &rem2, &rem3 );
936b7f4cSbjh21        while ( (sbits32) rem1 < 0 ) {
936b7f4cSbjh21            --zSig1;
936b7f4cSbjh21            add96( rem1, rem2, rem3, 0, bSig0, bSig1, &rem1, &rem2, &rem3 );
936b7f4cSbjh21        }
936b7f4cSbjh21        zSig1 |= ( ( rem1 | rem2 | rem3 ) != 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    shift64ExtraRightJamming( zSig0, zSig1, 0, 11, &zSig0, &zSig1, &zSig2 );
936b7f4cSbjh21    return roundAndPackFloat64( zSign, zExp, zSig0, zSig1, zSig2 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the remainder of the double-precision floating-point value `a'
936b7f4cSbjh21with respect to the corresponding value `b'.  The operation is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float64 float64_rem( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign, zSign;
936b7f4cSbjh21    int16 aExp, bExp, expDiff;
936b7f4cSbjh21    bits32 aSig0, aSig1, bSig0, bSig1, q, term0, term1, term2;
936b7f4cSbjh21    bits32 allZero, alternateASig0, alternateASig1, sigMean1;
936b7f4cSbjh21    sbits32 sigMean0;
936b7f4cSbjh21    float64 z;
936b7f4cSbjh21
936b7f4cSbjh21    aSig1 = extractFloat64Frac1( a );
936b7f4cSbjh21    aSig0 = extractFloat64Frac0( a );
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    bSig1 = extractFloat64Frac1( b );
936b7f4cSbjh21    bSig0 = extractFloat64Frac0( b );
936b7f4cSbjh21    bExp = extractFloat64Exp( b );
936b7f4cSbjh21    bSign = extractFloat64Sign( b );
936b7f4cSbjh21    if ( aExp == 0x7FF ) {
936b7f4cSbjh21        if (    ( aSig0 | aSig1 )
936b7f4cSbjh21             || ( ( bExp == 0x7FF ) && ( bSig0 | bSig1 ) ) ) {
936b7f4cSbjh21            return propagateFloat64NaN( a, b );
936b7f4cSbjh21        }
936b7f4cSbjh21        goto invalid;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0x7FF ) {
936b7f4cSbjh21        if ( bSig0 | bSig1 ) return propagateFloat64NaN( a, b );
936b7f4cSbjh21        return a;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( bExp == 0 ) {
936b7f4cSbjh21        if ( ( bSig0 | bSig1 ) == 0 ) {
936b7f4cSbjh21 invalid:
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21            return float64_default_nan;
936b7f4cSbjh21        }
936b7f4cSbjh21        normalizeFloat64Subnormal( bSig0, bSig1, &bExp, &bSig0, &bSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        if ( ( aSig0 | aSig1 ) == 0 ) return a;
936b7f4cSbjh21        normalizeFloat64Subnormal( aSig0, aSig1, &aExp, &aSig0, &aSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    expDiff = aExp - bExp;
936b7f4cSbjh21    if ( expDiff < -1 ) return a;
936b7f4cSbjh21    shortShift64Left(
936b7f4cSbjh21        aSig0 | 0x00100000, aSig1, 11 - ( expDiff < 0 ), &aSig0, &aSig1 );
936b7f4cSbjh21    shortShift64Left( bSig0 | 0x00100000, bSig1, 11, &bSig0, &bSig1 );
936b7f4cSbjh21    q = le64( bSig0, bSig1, aSig0, aSig1 );
936b7f4cSbjh21    if ( q ) sub64( aSig0, aSig1, bSig0, bSig1, &aSig0, &aSig1 );
936b7f4cSbjh21    expDiff -= 32;
936b7f4cSbjh21    while ( 0 < expDiff ) {
936b7f4cSbjh21        q = estimateDiv64To32( aSig0, aSig1, bSig0 );
936b7f4cSbjh21        q = ( 4 < q ) ? q - 4 : 0;
936b7f4cSbjh21        mul64By32To96( bSig0, bSig1, q, &term0, &term1, &term2 );
936b7f4cSbjh21        shortShift96Left( term0, term1, term2, 29, &term1, &term2, &allZero );
936b7f4cSbjh21        shortShift64Left( aSig0, aSig1, 29, &aSig0, &allZero );
936b7f4cSbjh21        sub64( aSig0, 0, term1, term2, &aSig0, &aSig1 );
936b7f4cSbjh21        expDiff -= 29;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( -32 < expDiff ) {
936b7f4cSbjh21        q = estimateDiv64To32( aSig0, aSig1, bSig0 );
936b7f4cSbjh21        q = ( 4 < q ) ? q - 4 : 0;
936b7f4cSbjh21        q >>= - expDiff;
936b7f4cSbjh21        shift64Right( bSig0, bSig1, 8, &bSig0, &bSig1 );
936b7f4cSbjh21        expDiff += 24;
936b7f4cSbjh21        if ( expDiff < 0 ) {
936b7f4cSbjh21            shift64Right( aSig0, aSig1, - expDiff, &aSig0, &aSig1 );
936b7f4cSbjh21        }
936b7f4cSbjh21        else {
936b7f4cSbjh21            shortShift64Left( aSig0, aSig1, expDiff, &aSig0, &aSig1 );
936b7f4cSbjh21        }
936b7f4cSbjh21        mul64By32To96( bSig0, bSig1, q, &term0, &term1, &term2 );
936b7f4cSbjh21        sub64( aSig0, aSig1, term1, term2, &aSig0, &aSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    else {
936b7f4cSbjh21        shift64Right( aSig0, aSig1, 8, &aSig0, &aSig1 );
936b7f4cSbjh21        shift64Right( bSig0, bSig1, 8, &bSig0, &bSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    do {
936b7f4cSbjh21        alternateASig0 = aSig0;
936b7f4cSbjh21        alternateASig1 = aSig1;
936b7f4cSbjh21        ++q;
936b7f4cSbjh21        sub64( aSig0, aSig1, bSig0, bSig1, &aSig0, &aSig1 );
936b7f4cSbjh21    } while ( 0 <= (sbits32) aSig0 );
936b7f4cSbjh21    add64(
936b7f4cSbjh21        aSig0, aSig1, alternateASig0, alternateASig1, &sigMean0, &sigMean1 );
936b7f4cSbjh21    if (    ( sigMean0 < 0 )
936b7f4cSbjh21         || ( ( ( sigMean0 | sigMean1 ) == 0 ) && ( q & 1 ) ) ) {
936b7f4cSbjh21        aSig0 = alternateASig0;
936b7f4cSbjh21        aSig1 = alternateASig1;
936b7f4cSbjh21    }
936b7f4cSbjh21    zSign = ( (sbits32) aSig0 < 0 );
936b7f4cSbjh21    if ( zSign ) sub64( 0, 0, aSig0, aSig1, &aSig0, &aSig1 );
936b7f4cSbjh21    return
936b7f4cSbjh21        normalizeRoundAndPackFloat64( aSign ^ zSign, bExp - 4, aSig0, aSig1 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21#endif
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns the square root of the double-precision floating-point value `a'.
936b7f4cSbjh21The operation is performed according to the IEC/IEEE Standard for Binary
936b7f4cSbjh21Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21float64 float64_sqrt( float64 a )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign;
936b7f4cSbjh21    int16 aExp, zExp;
936b7f4cSbjh21    bits32 aSig0, aSig1, zSig0, zSig1, zSig2, doubleZSig0;
936b7f4cSbjh21    bits32 rem0, rem1, rem2, rem3, term0, term1, term2, term3;
936b7f4cSbjh21    float64 z;
936b7f4cSbjh21
936b7f4cSbjh21    aSig1 = extractFloat64Frac1( a );
936b7f4cSbjh21    aSig0 = extractFloat64Frac0( a );
936b7f4cSbjh21    aExp = extractFloat64Exp( a );
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    if ( aExp == 0x7FF ) {
936b7f4cSbjh21        if ( aSig0 | aSig1 ) return propagateFloat64NaN( a, a );
936b7f4cSbjh21        if ( ! aSign ) return a;
936b7f4cSbjh21        goto invalid;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aSign ) {
936b7f4cSbjh21        if ( ( aExp | aSig0 | aSig1 ) == 0 ) return a;
936b7f4cSbjh21 invalid:
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return float64_default_nan;
936b7f4cSbjh21    }
936b7f4cSbjh21    if ( aExp == 0 ) {
936b7f4cSbjh21        if ( ( aSig0 | aSig1 ) == 0 ) return packFloat64( 0, 0, 0, 0 );
936b7f4cSbjh21        normalizeFloat64Subnormal( aSig0, aSig1, &aExp, &aSig0, &aSig1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    zExp = ( ( aExp - 0x3FF )>>1 ) + 0x3FE;
936b7f4cSbjh21    aSig0 |= 0x00100000;
936b7f4cSbjh21    shortShift64Left( aSig0, aSig1, 11, &term0, &term1 );
936b7f4cSbjh21    zSig0 = ( estimateSqrt32( aExp, term0 )>>1 ) + 1;
936b7f4cSbjh21    if ( zSig0 == 0 ) zSig0 = 0x7FFFFFFF;
936b7f4cSbjh21    doubleZSig0 = zSig0 + zSig0;
936b7f4cSbjh21    shortShift64Left( aSig0, aSig1, 9 - ( aExp & 1 ), &aSig0, &aSig1 );
936b7f4cSbjh21    mul32To64( zSig0, zSig0, &term0, &term1 );
936b7f4cSbjh21    sub64( aSig0, aSig1, term0, term1, &rem0, &rem1 );
936b7f4cSbjh21    while ( (sbits32) rem0 < 0 ) {
936b7f4cSbjh21        --zSig0;
936b7f4cSbjh21        doubleZSig0 -= 2;
936b7f4cSbjh21        add64( rem0, rem1, 0, doubleZSig0 | 1, &rem0, &rem1 );
936b7f4cSbjh21    }
936b7f4cSbjh21    zSig1 = estimateDiv64To32( rem1, 0, doubleZSig0 );
936b7f4cSbjh21    if ( ( zSig1 & 0x1FF ) <= 5 ) {
936b7f4cSbjh21        if ( zSig1 == 0 ) zSig1 = 1;
936b7f4cSbjh21        mul32To64( doubleZSig0, zSig1, &term1, &term2 );
936b7f4cSbjh21        sub64( rem1, 0, term1, term2, &rem1, &rem2 );
936b7f4cSbjh21        mul32To64( zSig1, zSig1, &term2, &term3 );
936b7f4cSbjh21        sub96( rem1, rem2, 0, 0, term2, term3, &rem1, &rem2, &rem3 );
936b7f4cSbjh21        while ( (sbits32) rem1 < 0 ) {
936b7f4cSbjh21            --zSig1;
936b7f4cSbjh21            shortShift64Left( 0, zSig1, 1, &term2, &term3 );
936b7f4cSbjh21            term3 |= 1;
936b7f4cSbjh21            term2 |= doubleZSig0;
936b7f4cSbjh21            add96( rem1, rem2, rem3, 0, term2, term3, &rem1, &rem2, &rem3 );
936b7f4cSbjh21        }
936b7f4cSbjh21        zSig1 |= ( ( rem1 | rem2 | rem3 ) != 0 );
936b7f4cSbjh21    }
936b7f4cSbjh21    shift64ExtraRightJamming( zSig0, zSig1, 0, 10, &zSig0, &zSig1, &zSig2 );
936b7f4cSbjh21    return roundAndPackFloat64( 0, zExp, zSig0, zSig1, zSig2 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21#endif
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the double-precision floating-point value `a' is equal to
936b7f4cSbjh21the corresponding value `b', and 0 otherwise.  The comparison is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float64_eq( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21
936b7f4cSbjh21    if (    (    ( extractFloat64Exp( a ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( a ) | extractFloat64Frac1( a ) ) )
936b7f4cSbjh21         || (    ( extractFloat64Exp( b ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( b ) | extractFloat64Frac1( b ) ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        if ( float64_is_signaling_nan( a ) || float64_is_signaling_nan( b ) ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21        }
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    return ( a == b ) ||
936b7f4cSbjh21	( (bits64) ( ( FLOAT64_DEMANGLE(a) | FLOAT64_DEMANGLE(b) )<<1 ) == 0 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the double-precision floating-point value `a' is less than
936b7f4cSbjh21or equal to the corresponding value `b', and 0 otherwise.  The comparison
936b7f4cSbjh21is performed according to the IEC/IEEE Standard for Binary Floating-Point
936b7f4cSbjh21Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float64_le( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    if (    (    ( extractFloat64Exp( a ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( a ) | extractFloat64Frac1( a ) ) )
936b7f4cSbjh21         || (    ( extractFloat64Exp( b ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( b ) | extractFloat64Frac1( b ) ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    bSign = extractFloat64Sign( b );
936b7f4cSbjh21    if ( aSign != bSign )
936b7f4cSbjh21	return aSign ||
936b7f4cSbjh21	    ( (bits64) ( ( FLOAT64_DEMANGLE(a) | FLOAT64_DEMANGLE(b) )<<1 ) ==
936b7f4cSbjh21	      0 );
936b7f4cSbjh21    return ( a == b ) ||
936b7f4cSbjh21	( aSign ^ ( FLOAT64_DEMANGLE(a) < FLOAT64_DEMANGLE(b) ) );
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the double-precision floating-point value `a' is less than
936b7f4cSbjh21the corresponding value `b', and 0 otherwise.  The comparison is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float64_lt( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    if (    (    ( extractFloat64Exp( a ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( a ) | extractFloat64Frac1( a ) ) )
936b7f4cSbjh21         || (    ( extractFloat64Exp( b ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( b ) | extractFloat64Frac1( b ) ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    bSign = extractFloat64Sign( b );
936b7f4cSbjh21    if ( aSign != bSign )
936b7f4cSbjh21	return aSign &&
936b7f4cSbjh21	    ( (bits64) ( ( FLOAT64_DEMANGLE(a) | FLOAT64_DEMANGLE(b) )<<1 ) !=
936b7f4cSbjh21	      0 );
936b7f4cSbjh21    return ( a != b ) &&
936b7f4cSbjh21	( aSign ^ ( FLOAT64_DEMANGLE(a) < FLOAT64_DEMANGLE(b) ) );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21#ifndef SOFTFLOAT_FOR_GCC
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the double-precision floating-point value `a' is equal to
936b7f4cSbjh21the corresponding value `b', and 0 otherwise.  The invalid exception is
936b7f4cSbjh21raised if either operand is a NaN.  Otherwise, the comparison is performed
936b7f4cSbjh21according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float64_eq_signaling( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21
936b7f4cSbjh21    if (    (    ( extractFloat64Exp( a ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( a ) | extractFloat64Frac1( a ) ) )
936b7f4cSbjh21         || (    ( extractFloat64Exp( b ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( b ) | extractFloat64Frac1( b ) ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        float_raise( float_flag_invalid );
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    return ( a == b ) || ( (bits64) ( ( a | b )<<1 ) == 0 );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the double-precision floating-point value `a' is less than or
936b7f4cSbjh21equal to the corresponding value `b', and 0 otherwise.  Quiet NaNs do not
936b7f4cSbjh21cause an exception.  Otherwise, the comparison is performed according to the
936b7f4cSbjh21IEC/IEEE Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float64_le_quiet( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    if (    (    ( extractFloat64Exp( a ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( a ) | extractFloat64Frac1( a ) ) )
936b7f4cSbjh21         || (    ( extractFloat64Exp( b ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( b ) | extractFloat64Frac1( b ) ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        if ( float64_is_signaling_nan( a ) || float64_is_signaling_nan( b ) ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21        }
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    bSign = extractFloat64Sign( b );
936b7f4cSbjh21    if ( aSign != bSign ) return aSign || ( (bits64) ( ( a | b )<<1 ) == 0 );
936b7f4cSbjh21    return ( a == b ) || ( aSign ^ ( a < b ) );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21/*
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21Returns 1 if the double-precision floating-point value `a' is less than
936b7f4cSbjh21the corresponding value `b', and 0 otherwise.  Quiet NaNs do not cause an
936b7f4cSbjh21exception.  Otherwise, the comparison is performed according to the IEC/IEEE
936b7f4cSbjh21Standard for Binary Floating-Point Arithmetic.
936b7f4cSbjh21-------------------------------------------------------------------------------
936b7f4cSbjh21*/
936b7f4cSbjh21flag float64_lt_quiet( float64 a, float64 b )
936b7f4cSbjh21{
936b7f4cSbjh21    flag aSign, bSign;
936b7f4cSbjh21
936b7f4cSbjh21    if (    (    ( extractFloat64Exp( a ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( a ) | extractFloat64Frac1( a ) ) )
936b7f4cSbjh21         || (    ( extractFloat64Exp( b ) == 0x7FF )
936b7f4cSbjh21              && ( extractFloat64Frac0( b ) | extractFloat64Frac1( b ) ) )
936b7f4cSbjh21       ) {
936b7f4cSbjh21        if ( float64_is_signaling_nan( a ) || float64_is_signaling_nan( b ) ) {
936b7f4cSbjh21            float_raise( float_flag_invalid );
936b7f4cSbjh21        }
936b7f4cSbjh21        return 0;
936b7f4cSbjh21    }
936b7f4cSbjh21    aSign = extractFloat64Sign( a );
936b7f4cSbjh21    bSign = extractFloat64Sign( b );
936b7f4cSbjh21    if ( aSign != bSign ) return aSign && ( (bits64) ( ( a | b )<<1 ) != 0 );
936b7f4cSbjh21    return ( a != b ) && ( aSign ^ ( a < b ) );
936b7f4cSbjh21
936b7f4cSbjh21}
936b7f4cSbjh21
936b7f4cSbjh21#endif