mirror of
https://github.com/pmret/gcc-papermario.git
synced 2024-11-09 12:22:38 +01:00
839 lines
17 KiB
C
839 lines
17 KiB
C
/*
|
|
** libgcc support for software floating point.
|
|
** Copyright (C) 1991 by Pipeline Associates, Inc. All rights reserved.
|
|
** Permission is granted to do *anything* you want with this file,
|
|
** commercial or otherwise, provided this message remains intact. So there!
|
|
** I would appreciate receiving any updates/patches/changes that anyone
|
|
** makes, and am willing to be the repository for said changes (am I
|
|
** making a big mistake?).
|
|
|
|
Warning! Only single-precision is actually implemented. This file
|
|
won't really be much use until double-precision is supported.
|
|
|
|
However, once that is done, this file might eventually become a
|
|
replacement for libgcc1.c. It might also make possible
|
|
cross-compilation for an IEEE target machine from a non-IEEE
|
|
host such as a VAX.
|
|
|
|
If you'd like to work on completing this, please talk to rms@gnu.ai.mit.edu.
|
|
|
|
|
|
**
|
|
** Pat Wood
|
|
** Pipeline Associates, Inc.
|
|
** pipeline!phw@motown.com or
|
|
** sun!pipeline!phw or
|
|
** uunet!motown!pipeline!phw
|
|
**
|
|
** 05/01/91 -- V1.0 -- first release to gcc mailing lists
|
|
** 05/04/91 -- V1.1 -- added float and double prototypes and return values
|
|
** -- fixed problems with adding and subtracting zero
|
|
** -- fixed rounding in truncdfsf2
|
|
** -- fixed SWAP define and tested on 386
|
|
*/
|
|
|
|
/*
|
|
** The following are routines that replace the libgcc soft floating point
|
|
** routines that are called automatically when -msoft-float is selected.
|
|
** The support single and double precision IEEE format, with provisions
|
|
** for byte-swapped machines (tested on 386). Some of the double-precision
|
|
** routines work at full precision, but most of the hard ones simply punt
|
|
** and call the single precision routines, producing a loss of accuracy.
|
|
** long long support is not assumed or included.
|
|
** Overall accuracy is close to IEEE (actually 68882) for single-precision
|
|
** arithmetic. I think there may still be a 1 in 1000 chance of a bit
|
|
** being rounded the wrong way during a multiply. I'm not fussy enough to
|
|
** bother with it, but if anyone is, knock yourself out.
|
|
**
|
|
** Efficiency has only been addressed where it was obvious that something
|
|
** would make a big difference. Anyone who wants to do this right for
|
|
** best speed should go in and rewrite in assembler.
|
|
**
|
|
** I have tested this only on a 68030 workstation and 386/ix integrated
|
|
** in with -msoft-float.
|
|
*/
|
|
|
|
/* the following deal with IEEE single-precision numbers */
|
|
#define D_PHANTOM_BIT 0x00100000
|
|
#define EXCESS 126
|
|
#define SIGNBIT 0x80000000
|
|
#define HIDDEN (1 << 23)
|
|
#define SIGN(fp) ((fp) & SIGNBIT)
|
|
#define EXP(fp) (((fp) >> 23) & 0xFF)
|
|
#define MANT(fp) (((fp) & 0x7FFFFF) | HIDDEN)
|
|
#define PACK(s,e,m) ((s) | ((e) << 23) | (m))
|
|
|
|
/* the following deal with IEEE double-precision numbers */
|
|
#define EXCESSD 1022
|
|
#define HIDDEND (1 << 20)
|
|
#define EXPD(fp) (((fp.l.upper) >> 20) & 0x7FF)
|
|
#define SIGND(fp) ((fp.l.upper) & SIGNBIT)
|
|
#define MANTD(fp) (((((fp.l.upper) & 0xFFFFF) | HIDDEND) << 10) | \
|
|
(fp.l.lower >> 22))
|
|
|
|
/* define SWAP for 386/960 reverse-byte-order brain-damaged CPUs */
|
|
union double_long
|
|
{
|
|
double d;
|
|
#ifdef SWAP
|
|
struct {
|
|
unsigned long lower;
|
|
long upper;
|
|
} l;
|
|
#else
|
|
struct {
|
|
long upper;
|
|
unsigned long lower;
|
|
} l;
|
|
#endif
|
|
};
|
|
|
|
union float_long
|
|
{
|
|
float f;
|
|
long l;
|
|
};
|
|
|
|
struct _ieee {
|
|
#ifdef SWAP
|
|
unsigned mantissa2 : 32;
|
|
unsigned mantissa1 : 20;
|
|
unsigned exponent : 11;
|
|
unsigned sign : 1;
|
|
#else
|
|
unsigned exponent : 11;
|
|
unsigned sign : 1;
|
|
unsigned mantissa2 : 32;
|
|
unsigned mantissa1 : 20;
|
|
#endif
|
|
};
|
|
|
|
union _doubleu {
|
|
double d;
|
|
struct _ieee ieee;
|
|
#ifdef SWAP
|
|
struct {
|
|
unsigned long lower;
|
|
long upper;
|
|
} l;
|
|
#else
|
|
struct {
|
|
long upper;
|
|
unsigned long lower;
|
|
} l;
|
|
#endif
|
|
};
|
|
|
|
/* add two floats */
|
|
|
|
float
|
|
__addsf3 (float a1, float a2)
|
|
{
|
|
register long mant1, mant2;
|
|
register union float_long fl1, fl2;
|
|
register int exp1, exp2;
|
|
int sign = 0;
|
|
|
|
fl1.f = a1;
|
|
fl2.f = a2;
|
|
|
|
/* check for zero args */
|
|
if (!fl1.l)
|
|
return (fl2.f);
|
|
if (!fl2.l)
|
|
return (fl1.f);
|
|
|
|
exp1 = EXP (fl1.l);
|
|
exp2 = EXP (fl2.l);
|
|
|
|
if (exp1 > exp2 + 25)
|
|
return (fl1.l);
|
|
if (exp2 > exp1 + 25)
|
|
return (fl2.l);
|
|
|
|
/* do everything in excess precision so's we can round later */
|
|
mant1 = MANT (fl1.l) << 6;
|
|
mant2 = MANT (fl2.l) << 6;
|
|
|
|
if (SIGN (fl1.l))
|
|
mant1 = -mant1;
|
|
if (SIGN (fl2.l))
|
|
mant2 = -mant2;
|
|
|
|
if (exp1 > exp2)
|
|
{
|
|
mant2 >>= exp1 - exp2;
|
|
}
|
|
else
|
|
{
|
|
mant1 >>= exp2 - exp1;
|
|
exp1 = exp2;
|
|
}
|
|
mant1 += mant2;
|
|
|
|
if (mant1 < 0)
|
|
{
|
|
mant1 = -mant1;
|
|
sign = SIGNBIT;
|
|
}
|
|
else if (!mant1)
|
|
return (0);
|
|
|
|
/* normalize up */
|
|
while (!(mant1 & 0xE0000000))
|
|
{
|
|
mant1 <<= 1;
|
|
exp1--;
|
|
}
|
|
|
|
/* normalize down? */
|
|
if (mant1 & (1 << 30))
|
|
{
|
|
mant1 >>= 1;
|
|
exp1++;
|
|
}
|
|
|
|
/* round to even */
|
|
mant1 += (mant1 & 0x40) ? 0x20 : 0x1F;
|
|
|
|
/* normalize down? */
|
|
if (mant1 & (1 << 30))
|
|
{
|
|
mant1 >>= 1;
|
|
exp1++;
|
|
}
|
|
|
|
/* lose extra precision */
|
|
mant1 >>= 6;
|
|
|
|
/* turn off hidden bit */
|
|
mant1 &= ~HIDDEN;
|
|
|
|
/* pack up and go home */
|
|
fl1.l = PACK (sign, exp1, mant1);
|
|
return (fl1.f);
|
|
}
|
|
|
|
/* subtract two floats */
|
|
|
|
float
|
|
__subsf3 (float a1, float a2)
|
|
{
|
|
register union float_long fl1, fl2;
|
|
|
|
fl1.f = a1;
|
|
fl2.f = a2;
|
|
|
|
/* check for zero args */
|
|
if (!fl2.l)
|
|
return (fl1.f);
|
|
if (!fl1.l)
|
|
return (-fl2.f);
|
|
|
|
/* twiddle sign bit and add */
|
|
fl2.l ^= SIGNBIT;
|
|
return __addsf3 (a1, fl2.f);
|
|
}
|
|
|
|
/* compare two floats */
|
|
|
|
long
|
|
__cmpsf2 (float a1, float a2)
|
|
{
|
|
register union float_long fl1, fl2;
|
|
|
|
fl1.f = a1;
|
|
fl2.f = a2;
|
|
|
|
if (SIGN (fl1.l) && SIGN (fl2.l))
|
|
{
|
|
fl1.l ^= SIGNBIT;
|
|
fl2.l ^= SIGNBIT;
|
|
}
|
|
if (fl1.l < fl2.l)
|
|
return (-1);
|
|
if (fl1.l > fl2.l)
|
|
return (1);
|
|
return (0);
|
|
}
|
|
|
|
/* multiply two floats */
|
|
|
|
float
|
|
__mulsf3 (float a1, float a2)
|
|
{
|
|
register union float_long fl1, fl2;
|
|
register unsigned long result;
|
|
register int exp;
|
|
int sign;
|
|
|
|
fl1.f = a1;
|
|
fl2.f = a2;
|
|
|
|
if (!fl1.l || !fl2.l)
|
|
return (0);
|
|
|
|
/* compute sign and exponent */
|
|
sign = SIGN (fl1.l) ^ SIGN (fl2.l);
|
|
exp = EXP (fl1.l) - EXCESS;
|
|
exp += EXP (fl2.l);
|
|
|
|
fl1.l = MANT (fl1.l);
|
|
fl2.l = MANT (fl2.l);
|
|
|
|
/* the multiply is done as one 16x16 multiply and two 16x8 multiples */
|
|
result = (fl1.l >> 8) * (fl2.l >> 8);
|
|
result += ((fl1.l & 0xFF) * (fl2.l >> 8)) >> 8;
|
|
result += ((fl2.l & 0xFF) * (fl1.l >> 8)) >> 8;
|
|
|
|
if (result & 0x80000000)
|
|
{
|
|
/* round */
|
|
result += 0x80;
|
|
result >>= 8;
|
|
}
|
|
else
|
|
{
|
|
/* round */
|
|
result += 0x40;
|
|
result >>= 7;
|
|
exp--;
|
|
}
|
|
|
|
result &= ~HIDDEN;
|
|
|
|
/* pack up and go home */
|
|
fl1.l = PACK (sign, exp, result);
|
|
return (fl1.f);
|
|
}
|
|
|
|
/* divide two floats */
|
|
|
|
float
|
|
__divsf3 (float a1, float a2)
|
|
{
|
|
register union float_long fl1, fl2;
|
|
register int result;
|
|
register int mask;
|
|
register int exp, sign;
|
|
|
|
fl1.f = a1;
|
|
fl2.f = a2;
|
|
|
|
/* subtract exponents */
|
|
exp = EXP (fl1.l) - EXP (fl2.l) + EXCESS;
|
|
|
|
/* compute sign */
|
|
sign = SIGN (fl1.l) ^ SIGN (fl2.l);
|
|
|
|
/* divide by zero??? */
|
|
if (!fl2.l)
|
|
/* return NaN or -NaN */
|
|
return (sign ? 0xFFFFFFFF : 0x7FFFFFFF);
|
|
|
|
/* numerator zero??? */
|
|
if (!fl1.l)
|
|
return (0);
|
|
|
|
/* now get mantissas */
|
|
fl1.l = MANT (fl1.l);
|
|
fl2.l = MANT (fl2.l);
|
|
|
|
/* this assures we have 25 bits of precision in the end */
|
|
if (fl1.l < fl2.l)
|
|
{
|
|
fl1.l <<= 1;
|
|
exp--;
|
|
}
|
|
|
|
/* now we perform repeated subtraction of fl2.l from fl1.l */
|
|
mask = 0x1000000;
|
|
result = 0;
|
|
while (mask)
|
|
{
|
|
if (fl1.l >= fl2.l)
|
|
{
|
|
result |= mask;
|
|
fl1.l -= fl2.l;
|
|
}
|
|
fl1.l <<= 1;
|
|
mask >>= 1;
|
|
}
|
|
|
|
/* round */
|
|
result += 1;
|
|
|
|
/* normalize down */
|
|
exp++;
|
|
result >>= 1;
|
|
|
|
result &= ~HIDDEN;
|
|
|
|
/* pack up and go home */
|
|
fl1.l = PACK (sign, exp, result);
|
|
return (fl1.f);
|
|
}
|
|
|
|
/* convert int to double */
|
|
|
|
double
|
|
__floatsidf (register long a1)
|
|
{
|
|
register int sign = 0, exp = 31 + EXCESSD;
|
|
union double_long dl;
|
|
|
|
if (!a1)
|
|
{
|
|
dl.l.upper = dl.l.lower = 0;
|
|
return (dl.d);
|
|
}
|
|
|
|
if (a1 < 0)
|
|
{
|
|
sign = SIGNBIT;
|
|
a1 = -a1;
|
|
}
|
|
|
|
while (a1 < 0x1000000)
|
|
{
|
|
a1 <<= 4;
|
|
exp -= 4;
|
|
}
|
|
|
|
while (a1 < 0x40000000)
|
|
{
|
|
a1 <<= 1;
|
|
exp--;
|
|
}
|
|
|
|
/* pack up and go home */
|
|
dl.l.upper = sign;
|
|
dl.l.upper |= exp << 20;
|
|
dl.l.upper |= (a1 >> 10) & ~HIDDEND;
|
|
dl.l.lower = a1 << 22;
|
|
|
|
return (dl.d);
|
|
}
|
|
|
|
/* negate a float */
|
|
|
|
float
|
|
__negsf2 (float a1)
|
|
{
|
|
register union float_long fl1;
|
|
|
|
fl1.f = a1;
|
|
if (!fl1.l)
|
|
return (0);
|
|
|
|
fl1.l ^= SIGNBIT;
|
|
return (fl1.f);
|
|
}
|
|
|
|
/* negate a double */
|
|
|
|
double
|
|
__negdf2 (double a1)
|
|
{
|
|
register union double_long dl1;
|
|
|
|
dl1.d = a1;
|
|
|
|
if (!dl1.l.upper && !dl1.l.lower)
|
|
return (dl1.d);
|
|
|
|
dl1.l.upper ^= SIGNBIT;
|
|
return (dl1.d);
|
|
}
|
|
|
|
/* convert float to double */
|
|
|
|
double
|
|
__extendsfdf2 (float a1)
|
|
{
|
|
register union float_long fl1;
|
|
register union double_long dl;
|
|
register int exp;
|
|
|
|
fl1.f = a1;
|
|
|
|
if (!fl1.l)
|
|
{
|
|
dl.l.upper = dl.l.lower = 0;
|
|
return (dl.d);
|
|
}
|
|
|
|
dl.l.upper = SIGN (fl1.l);
|
|
exp = EXP (fl1.l) - EXCESS + EXCESSD;
|
|
dl.l.upper |= exp << 20;
|
|
dl.l.upper |= (MANT (fl1.l) & ~HIDDEN) >> 3;
|
|
dl.l.lower = MANT (fl1.l) << 29;
|
|
|
|
return (dl.d);
|
|
}
|
|
|
|
/* convert double to float */
|
|
|
|
float
|
|
__truncdfsf2 (double a1)
|
|
{
|
|
register int exp;
|
|
register long mant;
|
|
register union float_long fl;
|
|
register union double_long dl1;
|
|
|
|
dl1.d = a1;
|
|
|
|
if (!dl1.l.upper && !dl1.l.lower)
|
|
return (0);
|
|
|
|
exp = EXPD (dl1) - EXCESSD + EXCESS;
|
|
|
|
/* shift double mantissa 6 bits so we can round */
|
|
mant = MANTD (dl1) >> 6;
|
|
|
|
/* now round and shift down */
|
|
mant += 1;
|
|
mant >>= 1;
|
|
|
|
/* did the round overflow? */
|
|
if (mant & 0xFF000000)
|
|
{
|
|
mant >>= 1;
|
|
exp++;
|
|
}
|
|
|
|
mant &= ~HIDDEN;
|
|
|
|
/* pack up and go home */
|
|
fl.l = PACK (SIGND (dl1), exp, mant);
|
|
return (fl.f);
|
|
}
|
|
|
|
/* compare two doubles */
|
|
|
|
long
|
|
__cmpdf2 (double a1, double a2)
|
|
{
|
|
register union double_long dl1, dl2;
|
|
|
|
dl1.d = a1;
|
|
dl2.d = a2;
|
|
|
|
if (SIGND (dl1) && SIGND (dl2))
|
|
{
|
|
dl1.l.upper ^= SIGNBIT;
|
|
dl2.l.upper ^= SIGNBIT;
|
|
}
|
|
if (dl1.l.upper < dl2.l.upper)
|
|
return (-1);
|
|
if (dl1.l.upper > dl2.l.upper)
|
|
return (1);
|
|
if (dl1.l.lower < dl2.l.lower)
|
|
return (-1);
|
|
if (dl1.l.lower > dl2.l.lower)
|
|
return (1);
|
|
return (0);
|
|
}
|
|
|
|
/* convert double to int */
|
|
|
|
long
|
|
__fixdfsi (double a1)
|
|
{
|
|
register union double_long dl1;
|
|
register int exp;
|
|
register long l;
|
|
|
|
dl1.d = a1;
|
|
|
|
if (!dl1.l.upper && !dl1.l.lower)
|
|
return (0);
|
|
|
|
exp = EXPD (dl1) - EXCESSD - 31;
|
|
l = MANTD (dl1);
|
|
|
|
if (exp > 0)
|
|
return (0x7FFFFFFF | SIGND (dl1)); /* largest integer */
|
|
|
|
/* shift down until exp = 0 or l = 0 */
|
|
if (exp < 0 && exp > -32 && l)
|
|
l >>= -exp;
|
|
else
|
|
return (0);
|
|
|
|
return (SIGND (dl1) ? -l : l);
|
|
}
|
|
|
|
/* convert double to unsigned int */
|
|
|
|
unsigned
|
|
long __fixunsdfsi (double a1)
|
|
{
|
|
register union double_long dl1;
|
|
register int exp;
|
|
register unsigned long l;
|
|
|
|
dl1.d = a1;
|
|
|
|
if (!dl1.l.upper && !dl1.l.lower)
|
|
return (0);
|
|
|
|
exp = EXPD (dl1) - EXCESSD - 32;
|
|
l = (((((dl1.l.upper) & 0xFFFFF) | HIDDEND) << 11) | (dl1.l.lower >> 21));
|
|
|
|
if (exp > 0)
|
|
return (0xFFFFFFFF); /* largest integer */
|
|
|
|
/* shift down until exp = 0 or l = 0 */
|
|
if (exp < 0 && exp > -32 && l)
|
|
l >>= -exp;
|
|
else
|
|
return (0);
|
|
|
|
return (l);
|
|
}
|
|
|
|
/* For now, the hard double-precision routines simply
|
|
punt and do it in single */
|
|
/* addtwo doubles */
|
|
|
|
double
|
|
__adddf3 (double a1, double a2)
|
|
{
|
|
return ((float) a1 + (float) a2);
|
|
}
|
|
|
|
/* subtract two doubles */
|
|
|
|
double
|
|
__subdf3 (double a1, double a2)
|
|
{
|
|
return ((float) a1 - (float) a2);
|
|
}
|
|
|
|
/* multiply two doubles */
|
|
|
|
double
|
|
__muldf3 (double a1, double a2)
|
|
{
|
|
return ((float) a1 * (float) a2);
|
|
}
|
|
|
|
/*
|
|
*
|
|
* Name: Barrett Richardson
|
|
* E-mail: barrett@iglou.com
|
|
* When: Thu Dec 15 10:31:11 EST 1994
|
|
*
|
|
* callable function:
|
|
*
|
|
* double __divdf3(double a1, double a2);
|
|
*
|
|
* Does software divide of a1 / a2.
|
|
*
|
|
* Based largely on __divsf3() in floatlib.c in the gcc
|
|
* distribution.
|
|
*
|
|
* Purpose: To be used in conjunction with the -msoft-float
|
|
* option of gcc. You should be able to tack it to the
|
|
* end of floatlib.c included in the gcc distribution,
|
|
* and delete the __divdf3() already there which just
|
|
* calls the single precision function (or may just
|
|
* use the floating point processor with some configurations).
|
|
*
|
|
* You may use this code for whatever your heart desires.
|
|
*/
|
|
|
|
|
|
|
|
|
|
/*
|
|
* Compare the the mantissas of two doubles.
|
|
* Each mantissa is in two longs.
|
|
*
|
|
* return 1 if x1's mantissa is greater than x2's
|
|
* -1 if x1's mantissa is less than x2's
|
|
* 0 if the two mantissa's are equal.
|
|
*
|
|
* The Mantissas won't fit into a 4 byte word, so they are
|
|
* broken up into two parts.
|
|
*
|
|
* This function is used internally by __divdf3()
|
|
*/
|
|
|
|
int
|
|
__dcmp (long x1m1, long x1m2, long x2m1, long x2m2)
|
|
{
|
|
if (x1m1 > x2m1)
|
|
return 1;
|
|
|
|
if (x1m1 < x2m1)
|
|
return -1;
|
|
|
|
/* If the first word in the two mantissas were equal check the second word */
|
|
|
|
if (x1m2 > x2m2)
|
|
return 1;
|
|
|
|
if (x1m2 < x2m2)
|
|
return -1;
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
/* divide two doubles */
|
|
|
|
double
|
|
__divdf3 (double a1, double a2)
|
|
{
|
|
|
|
int sign,
|
|
exponent,
|
|
bit_bucket;
|
|
|
|
register unsigned long mantissa1,
|
|
mantissa2,
|
|
x1m1,
|
|
x1m2,
|
|
x2m1,
|
|
x2m2,
|
|
mask;
|
|
|
|
union _doubleu x1,
|
|
x2,
|
|
result;
|
|
|
|
|
|
x1.d = a1;
|
|
x2.d = a2;
|
|
|
|
exponent = x1.ieee.exponent - x2.ieee.exponent + EXCESSD;
|
|
|
|
sign = x1.ieee.sign ^ x2.ieee.sign;
|
|
|
|
x2.ieee.sign = 0; /* don't want the sign bit to affect any zero */
|
|
/* comparisons when checking for zero divide */
|
|
|
|
if (!x2.l.lower && !x2.l.upper) { /* check for zero divide */
|
|
result.l.lower = 0x0;
|
|
if (sign)
|
|
result.l.upper = 0xFFF00000; /* negative infinity */
|
|
else
|
|
result.l.upper = 0x7FF00000; /* positive infinity */
|
|
return result.d;
|
|
}
|
|
|
|
if (!x1.l.upper && !x1.l.lower) /* check for 0.0 numerator */
|
|
return (0.0);
|
|
|
|
x1m1 = x1.ieee.mantissa1 | D_PHANTOM_BIT; /* turn on phantom bit */
|
|
x1m2 = x1.ieee.mantissa2;
|
|
|
|
x2m1 = x2.ieee.mantissa1 | D_PHANTOM_BIT; /* turn on phantom bit */
|
|
x2m2 = x2.ieee.mantissa2;
|
|
|
|
if (__dcmp(x1m1,x1m2,x2m1,x2m2) < 0) {
|
|
|
|
/* if x1's mantissa is less than x2's shift it left one and decrement */
|
|
/* the exponent to accommodate the change in the mantissa */
|
|
|
|
x1m1 <<= 1; /* */
|
|
bit_bucket = x1m2 >> 31; /* Shift mantissa left one */
|
|
x1m1 |= bit_bucket; /* */
|
|
x1m2 <<= 1; /* */
|
|
|
|
exponent--;
|
|
}
|
|
|
|
|
|
mantissa1 = 0;
|
|
mantissa2 = 0;
|
|
|
|
|
|
/* Get the first part of the results mantissa using successive */
|
|
/* subtraction. */
|
|
|
|
mask = 0x00200000;
|
|
while (mask) {
|
|
|
|
if (__dcmp(x1m1,x1m2,x2m1,x2m2) >= 0) {
|
|
|
|
/* subtract x2's mantissa from x1's */
|
|
|
|
mantissa1 |= mask; /* turn on a bit in the result */
|
|
|
|
if (x2m2 > x1m2)
|
|
x1m1--;
|
|
x1m2 -= x2m2;
|
|
x1m1 -= x2m1;
|
|
}
|
|
|
|
x1m1 <<= 1; /* */
|
|
bit_bucket = x1m2 >> 31; /* Shift mantissa left one */
|
|
x1m1 |= bit_bucket; /* */
|
|
x1m2 <<= 1; /* */
|
|
|
|
mask >>= 1;
|
|
}
|
|
|
|
/* Get the second part of the results mantissa using successive */
|
|
/* subtraction. */
|
|
|
|
mask = 0x80000000;
|
|
while (mask) {
|
|
|
|
if (__dcmp(x1m1,x1m2,x2m1,x2m2) >= 0) {
|
|
|
|
/* subtract x2's mantissa from x1's */
|
|
|
|
mantissa2 |= mask; /* turn on a bit in the result */
|
|
|
|
if (x2m2 > x1m2)
|
|
x1m1--;
|
|
x1m2 -= x2m2;
|
|
x1m1 -= x2m1;
|
|
}
|
|
x1m1 <<= 1; /* */
|
|
bit_bucket = x1m2 >> 31; /* Shift mantissa left one */
|
|
x1m1 |= bit_bucket; /* */
|
|
x1m2 <<= 1; /* */
|
|
|
|
mask >>= 1;
|
|
}
|
|
|
|
/* round up by adding 1 to mantissa */
|
|
|
|
if (mantissa2 == 0xFFFFFFFF) { /* check for over flow */
|
|
|
|
/* spill if overflow */
|
|
|
|
mantissa2 = 0;
|
|
mantissa1++;
|
|
}
|
|
else
|
|
mantissa2++;
|
|
|
|
exponent++; /* increment exponent (mantissa must be shifted right */
|
|
/* also) */
|
|
|
|
/* shift mantissa right one and assume a phantom bit (which really gives */
|
|
/* 53 bits of precision in the mantissa) */
|
|
|
|
mantissa2 >>= 1;
|
|
bit_bucket = mantissa1 & 1;
|
|
mantissa2 |= (bit_bucket << 31);
|
|
mantissa1 >>= 1;
|
|
|
|
/* put all the info into the result */
|
|
|
|
result.ieee.exponent = exponent;
|
|
result.ieee.sign = sign;
|
|
result.ieee.mantissa1 = mantissa1;
|
|
result.ieee.mantissa2 = mantissa2;
|
|
|
|
|
|
return result.d;
|
|
}
|