|
|
ce426f |
# commit 4cf69995e26e16005d4e3843ad4d18c75cf21a04
|
|
|
ce426f |
# Author: Alan Modra <amodra@gmail.com>
|
|
|
ce426f |
# Date: Sat Aug 17 18:19:44 2013 +0930
|
|
|
ce426f |
#
|
|
|
ce426f |
# Fix for [BZ #15680] IBM long double inaccuracy
|
|
|
ce426f |
# http://sourceware.org/ml/libc-alpha/2013-06/msg00919.html
|
|
|
ce426f |
#
|
|
|
ce426f |
# I discovered a number of places where denormals and other corner cases
|
|
|
ce426f |
# were being handled wrongly.
|
|
|
ce426f |
#
|
|
|
ce426f |
# - printf_fphex.c: Testing for the low double exponent being zero is
|
|
|
ce426f |
# unnecessary. If the difference in exponents is less than 53 then the
|
|
|
ce426f |
# high double exponent must be nearing the low end of its range, and the
|
|
|
ce426f |
# low double exponent hit rock bottom.
|
|
|
ce426f |
#
|
|
|
ce426f |
# - ldbl2mpn.c: A denormal (ie. exponent of zero) value is treated as
|
|
|
ce426f |
# if the exponent was one, so shift mantissa left by one. Code handling
|
|
|
ce426f |
# normalisation of the low double mantissa lacked a test for shift count
|
|
|
ce426f |
# greater than bits in type being shifted, and lacked anything to handle
|
|
|
ce426f |
# the case where the difference in exponents is less than 53 as in
|
|
|
ce426f |
# printf_fphex.c.
|
|
|
ce426f |
#
|
|
|
ce426f |
# - math_ldbl.h (ldbl_extract_mantissa): Same as above, but worse, with
|
|
|
ce426f |
# code testing for exponent > 1 for some reason, probably a typo for >= 1.
|
|
|
ce426f |
#
|
|
|
ce426f |
# - math_ldbl.h (ldbl_insert_mantissa): Round the high double as per
|
|
|
ce426f |
# mpn2ldbl.c (hi is odd or explicit mantissas non-zero) so that the
|
|
|
ce426f |
# number we return won't change when applying ldbl_canonicalize().
|
|
|
ce426f |
# Add missing overflow checks and normalisation of high mantissa.
|
|
|
ce426f |
# Correct misleading comment: "The hidden bit of the lo mantissa is
|
|
|
ce426f |
# zero" is not always true as can be seen from the code rounding the hi
|
|
|
ce426f |
# mantissa. Also by inspection, lzcount can never be less than zero so
|
|
|
ce426f |
# remove that test. Lastly, masking bitfields to their widths can be
|
|
|
ce426f |
# left to the compiler.
|
|
|
ce426f |
#
|
|
|
ce426f |
# - mpn2ldbl.c: The overflow checks here on rounding of high double were
|
|
|
ce426f |
# just plain wrong. Incrementing the exponent must be accompanied by a
|
|
|
ce426f |
# shift right of the mantissa to keep the value unchanged. Above notes
|
|
|
ce426f |
# for ldbl_insert_mantissa are also relevant.
|
|
|
ce426f |
#
|
|
|
ce426f |
# [BZ #15680]
|
|
|
ce426f |
# * sysdeps/ieee754/ldbl-128ibm/e_rem_pio2l.c: Comment fix.
|
|
|
ce426f |
# * sysdeps/ieee754/ldbl-128ibm/printf_fphex.c
|
|
|
ce426f |
# (PRINT_FPHEX_LONG_DOUBLE): Tidy code by moving -53 into ediff
|
|
|
ce426f |
# calculation. Remove unnecessary test for denormal exponent.
|
|
|
ce426f |
# * sysdeps/ieee754/ldbl-128ibm/ldbl2mpn.c (__mpn_extract_long_double):
|
|
|
ce426f |
# Correct handling of denormals. Avoid undefined shift behaviour.
|
|
|
ce426f |
# Correct normalisation of low mantissa when low double is denormal.
|
|
|
ce426f |
# * sysdeps/ieee754/ldbl-128ibm/math_ldbl.h
|
|
|
ce426f |
# (ldbl_extract_mantissa): Likewise. Comment. Use uint64_t* for hi64.
|
|
|
ce426f |
# (ldbl_insert_mantissa): Make both hi64 and lo64 parms uint64_t.
|
|
|
ce426f |
# Correct normalisation of low mantissa. Test for overflow of high
|
|
|
ce426f |
# mantissa and normalise.
|
|
|
ce426f |
# (ldbl_nearbyint): Use more readable constant for two52.
|
|
|
ce426f |
# * sysdeps/ieee754/ldbl-128ibm/mpn2ldbl.c
|
|
|
ce426f |
# (__mpn_construct_long_double): Fix test for overflow of high
|
|
|
ce426f |
# mantissa and correct normalisation. Avoid undefined shift.
|
|
|
ce426f |
#
|
|
|
ce426f |
diff -urN glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/e_rem_pio2l.c glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/e_rem_pio2l.c
|
|
|
ce426f |
--- glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/e_rem_pio2l.c 2014-05-27 19:13:56.000000000 -0500
|
|
|
ce426f |
+++ glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/e_rem_pio2l.c 2014-05-27 19:14:45.000000000 -0500
|
|
|
ce426f |
@@ -243,7 +243,7 @@
|
|
|
ce426f |
We split the 113 bits of the mantissa into 5 24bit integers
|
|
|
ce426f |
stored in a double array. */
|
|
|
ce426f |
/* Make the IBM extended format 105 bit mantissa look like the ieee854 112
|
|
|
ce426f |
- bit mantissa so the next operatation will give the correct result. */
|
|
|
ce426f |
+ bit mantissa so the next operation will give the correct result. */
|
|
|
ce426f |
ldbl_extract_mantissa (&ixd, &lxd, &exp, x);
|
|
|
ce426f |
exp = exp - 23;
|
|
|
ce426f |
/* This is faster than doing this in floating point, because we
|
|
|
ce426f |
diff -urN glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/ldbl2mpn.c glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/ldbl2mpn.c
|
|
|
ce426f |
--- glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/ldbl2mpn.c 2014-05-27 19:13:56.000000000 -0500
|
|
|
ce426f |
+++ glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/ldbl2mpn.c 2014-05-27 19:14:45.000000000 -0500
|
|
|
ce426f |
@@ -36,6 +36,7 @@
|
|
|
ce426f |
union ibm_extended_long_double u;
|
|
|
ce426f |
unsigned long long hi, lo;
|
|
|
ce426f |
int ediff;
|
|
|
ce426f |
+
|
|
|
ce426f |
u.ld = value;
|
|
|
ce426f |
|
|
|
ce426f |
*is_neg = u.d[0].ieee.negative;
|
|
|
ce426f |
@@ -43,27 +44,36 @@
|
|
|
ce426f |
|
|
|
ce426f |
lo = ((long long) u.d[1].ieee.mantissa0 << 32) | u.d[1].ieee.mantissa1;
|
|
|
ce426f |
hi = ((long long) u.d[0].ieee.mantissa0 << 32) | u.d[0].ieee.mantissa1;
|
|
|
ce426f |
- /* If the lower double is not a denomal or zero then set the hidden
|
|
|
ce426f |
+
|
|
|
ce426f |
+ /* If the lower double is not a denormal or zero then set the hidden
|
|
|
ce426f |
53rd bit. */
|
|
|
ce426f |
- if (u.d[1].ieee.exponent > 0)
|
|
|
ce426f |
- {
|
|
|
ce426f |
- lo |= 1LL << 52;
|
|
|
ce426f |
+ if (u.d[1].ieee.exponent != 0)
|
|
|
ce426f |
+ lo |= 1ULL << 52;
|
|
|
ce426f |
+ else
|
|
|
ce426f |
+ lo = lo << 1;
|
|
|
ce426f |
|
|
|
ce426f |
- /* The lower double is normalized separately from the upper. We may
|
|
|
ce426f |
- need to adjust the lower manitissa to reflect this. */
|
|
|
ce426f |
- ediff = u.d[0].ieee.exponent - u.d[1].ieee.exponent;
|
|
|
ce426f |
- if (ediff > 53)
|
|
|
ce426f |
- lo = lo >> (ediff-53);
|
|
|
ce426f |
+ /* The lower double is normalized separately from the upper. We may
|
|
|
ce426f |
+ need to adjust the lower manitissa to reflect this. */
|
|
|
ce426f |
+ ediff = u.d[0].ieee.exponent - u.d[1].ieee.exponent - 53;
|
|
|
ce426f |
+ if (ediff > 0)
|
|
|
ce426f |
+ {
|
|
|
ce426f |
+ if (ediff < 64)
|
|
|
ce426f |
+ lo = lo >> ediff;
|
|
|
ce426f |
+ else
|
|
|
ce426f |
+ lo = 0;
|
|
|
ce426f |
}
|
|
|
ce426f |
+ else if (ediff < 0)
|
|
|
ce426f |
+ lo = lo << -ediff;
|
|
|
ce426f |
+
|
|
|
ce426f |
/* The high double may be rounded and the low double reflects the
|
|
|
ce426f |
difference between the long double and the rounded high double
|
|
|
ce426f |
value. This is indicated by a differnce between the signs of the
|
|
|
ce426f |
high and low doubles. */
|
|
|
ce426f |
- if ((u.d[0].ieee.negative != u.d[1].ieee.negative)
|
|
|
ce426f |
- && ((u.d[1].ieee.exponent != 0) && (lo != 0L)))
|
|
|
ce426f |
+ if (u.d[0].ieee.negative != u.d[1].ieee.negative
|
|
|
ce426f |
+ && lo != 0)
|
|
|
ce426f |
{
|
|
|
ce426f |
lo = (1ULL << 53) - lo;
|
|
|
ce426f |
- if (hi == 0LL)
|
|
|
ce426f |
+ if (hi == 0)
|
|
|
ce426f |
{
|
|
|
ce426f |
/* we have a borrow from the hidden bit, so shift left 1. */
|
|
|
ce426f |
hi = 0x0ffffffffffffeLL | (lo >> 51);
|
|
|
ce426f |
diff -urN glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/math_ldbl.h glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/math_ldbl.h
|
|
|
ce426f |
--- glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/math_ldbl.h 2014-05-27 19:13:56.000000000 -0500
|
|
|
ce426f |
+++ glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/math_ldbl.h 2014-05-27 19:51:13.000000000 -0500
|
|
|
ce426f |
@@ -13,77 +13,118 @@
|
|
|
ce426f |
the number before the decimal point and the second implicit bit
|
|
|
ce426f |
as bit 53 of the mantissa. */
|
|
|
ce426f |
uint64_t hi, lo;
|
|
|
ce426f |
- int ediff;
|
|
|
ce426f |
union ibm_extended_long_double u;
|
|
|
ce426f |
+
|
|
|
ce426f |
u.ld = x;
|
|
|
ce426f |
*exp = u.d[0].ieee.exponent - IEEE754_DOUBLE_BIAS;
|
|
|
ce426f |
|
|
|
ce426f |
lo = ((uint64_t)u.d[1].ieee.mantissa0 << 32) | u.d[1].ieee.mantissa1;
|
|
|
ce426f |
hi = ((uint64_t)u.d[0].ieee.mantissa0 << 32) | u.d[0].ieee.mantissa1;
|
|
|
ce426f |
- /* If the lower double is not a denomal or zero then set the hidden
|
|
|
ce426f |
- 53rd bit. */
|
|
|
ce426f |
- if (u.d[1].ieee.exponent > 0x001)
|
|
|
ce426f |
- {
|
|
|
ce426f |
- lo |= (1ULL << 52);
|
|
|
ce426f |
- lo = lo << 7; /* pre-shift lo to match ieee854. */
|
|
|
ce426f |
- /* The lower double is normalized separately from the upper. We
|
|
|
ce426f |
- may need to adjust the lower manitissa to reflect this. */
|
|
|
ce426f |
- ediff = u.d[0].ieee.exponent - u.d[1].ieee.exponent;
|
|
|
ce426f |
- if (ediff > 53)
|
|
|
ce426f |
- lo = lo >> (ediff-53);
|
|
|
ce426f |
- hi |= (1ULL << 52);
|
|
|
ce426f |
- }
|
|
|
ce426f |
|
|
|
ce426f |
- if ((u.d[0].ieee.negative != u.d[1].ieee.negative)
|
|
|
ce426f |
- && ((u.d[1].ieee.exponent != 0) && (lo != 0LL)))
|
|
|
ce426f |
+ if (u.d[0].ieee.exponent != 0)
|
|
|
ce426f |
{
|
|
|
ce426f |
- hi--;
|
|
|
ce426f |
- lo = (1ULL << 60) - lo;
|
|
|
ce426f |
- if (hi < (1ULL << 52))
|
|
|
ce426f |
+ int ediff;
|
|
|
ce426f |
+
|
|
|
ce426f |
+ /* If not a denormal or zero then we have an implicit 53rd bit. */
|
|
|
ce426f |
+ hi |= (uint64_t) 1 << 52;
|
|
|
ce426f |
+
|
|
|
ce426f |
+ if (u.d[1].ieee.exponent != 0)
|
|
|
ce426f |
+ lo |= (uint64_t) 1 << 52;
|
|
|
ce426f |
+ else
|
|
|
ce426f |
+ /* A denormal is to be interpreted as having a biased exponent
|
|
|
ce426f |
+ of 1. */
|
|
|
ce426f |
+ lo = lo << 1;
|
|
|
ce426f |
+
|
|
|
ce426f |
+ /* We are going to shift 4 bits out of hi later, because we only
|
|
|
ce426f |
+ want 48 bits in *hi64. That means we want 60 bits in lo, but
|
|
|
ce426f |
+ we currently only have 53. Shift the value up. */
|
|
|
ce426f |
+ lo = lo << 7;
|
|
|
ce426f |
+
|
|
|
ce426f |
+ /* The lower double is normalized separately from the upper.
|
|
|
ce426f |
+ We may need to adjust the lower mantissa to reflect this.
|
|
|
ce426f |
+ The difference between the exponents can be larger than 53
|
|
|
ce426f |
+ when the low double is much less than 1ULP of the upper
|
|
|
ce426f |
+ (in which case there are significant bits, all 0's or all
|
|
|
ce426f |
+ 1's, between the two significands). The difference between
|
|
|
ce426f |
+ the exponents can be less than 53 when the upper double
|
|
|
ce426f |
+ exponent is nearing its minimum value (in which case the low
|
|
|
ce426f |
+ double is denormal ie. has an exponent of zero). */
|
|
|
ce426f |
+ ediff = u.d[0].ieee.exponent - u.d[1].ieee.exponent - 53;
|
|
|
ce426f |
+ if (ediff > 0)
|
|
|
ce426f |
{
|
|
|
ce426f |
- /* we have a borrow from the hidden bit, so shift left 1. */
|
|
|
ce426f |
- hi = (hi << 1) | (lo >> 59);
|
|
|
ce426f |
- lo = 0xfffffffffffffffLL & (lo << 1);
|
|
|
ce426f |
- *exp = *exp - 1;
|
|
|
ce426f |
+ if (ediff < 64)
|
|
|
ce426f |
+ lo = lo >> ediff;
|
|
|
ce426f |
+ else
|
|
|
ce426f |
+ lo = 0;
|
|
|
ce426f |
+ }
|
|
|
ce426f |
+ else if (ediff < 0)
|
|
|
ce426f |
+ lo = lo << -ediff;
|
|
|
ce426f |
+
|
|
|
ce426f |
+ if (u.d[0].ieee.negative != u.d[1].ieee.negative
|
|
|
ce426f |
+ && lo != 0)
|
|
|
ce426f |
+ {
|
|
|
ce426f |
+ hi--;
|
|
|
ce426f |
+ lo = ((uint64_t) 1 << 60) - lo;
|
|
|
ce426f |
+ if (hi < (uint64_t) 1 << 52)
|
|
|
ce426f |
+ {
|
|
|
ce426f |
+ /* We have a borrow from the hidden bit, so shift left 1. */
|
|
|
ce426f |
+ hi = (hi << 1) | (lo >> 59);
|
|
|
ce426f |
+ lo = (((uint64_t) 1 << 60) - 1) & (lo << 1);
|
|
|
ce426f |
+ *exp = *exp - 1;
|
|
|
ce426f |
+ }
|
|
|
ce426f |
}
|
|
|
ce426f |
}
|
|
|
ce426f |
+ else
|
|
|
ce426f |
+ /* If the larger magnitude double is denormal then the smaller
|
|
|
ce426f |
+ one must be zero. */
|
|
|
ce426f |
+ hi = hi << 1;
|
|
|
ce426f |
+
|
|
|
ce426f |
*lo64 = (hi << 60) | lo;
|
|
|
ce426f |
*hi64 = hi >> 4;
|
|
|
ce426f |
}
|
|
|
ce426f |
|
|
|
ce426f |
static inline long double
|
|
|
ce426f |
-ldbl_insert_mantissa (int sign, int exp, int64_t hi64, u_int64_t lo64)
|
|
|
ce426f |
+ldbl_insert_mantissa (int sign, int exp, int64_t hi64, uint64_t lo64)
|
|
|
ce426f |
{
|
|
|
ce426f |
union ibm_extended_long_double u;
|
|
|
ce426f |
- unsigned long hidden2, lzcount;
|
|
|
ce426f |
- unsigned long long hi, lo;
|
|
|
ce426f |
+ int expnt2;
|
|
|
ce426f |
+ uint64_t hi, lo;
|
|
|
ce426f |
|
|
|
ce426f |
u.d[0].ieee.negative = sign;
|
|
|
ce426f |
u.d[1].ieee.negative = sign;
|
|
|
ce426f |
u.d[0].ieee.exponent = exp + IEEE754_DOUBLE_BIAS;
|
|
|
ce426f |
- u.d[1].ieee.exponent = exp-53 + IEEE754_DOUBLE_BIAS;
|
|
|
ce426f |
+ u.d[1].ieee.exponent = 0;
|
|
|
ce426f |
+ expnt2 = exp - 53 + IEEE754_DOUBLE_BIAS;
|
|
|
ce426f |
+
|
|
|
ce426f |
/* Expect 113 bits (112 bits + hidden) right justified in two longs.
|
|
|
ce426f |
The low order 53 bits (52 + hidden) go into the lower double */
|
|
|
ce426f |
- lo = (lo64 >> 7)& ((1ULL << 53) - 1);
|
|
|
ce426f |
- hidden2 = (lo64 >> 59) & 1ULL;
|
|
|
ce426f |
+ lo = (lo64 >> 7) & (((uint64_t) 1 << 53) - 1);
|
|
|
ce426f |
/* The high order 53 bits (52 + hidden) go into the upper double */
|
|
|
ce426f |
- hi = (lo64 >> 60) & ((1ULL << 11) - 1);
|
|
|
ce426f |
- hi |= (hi64 << 4);
|
|
|
ce426f |
+ hi = lo64 >> 60;
|
|
|
ce426f |
+ hi |= hi64 << 4;
|
|
|
ce426f |
|
|
|
ce426f |
- if (lo != 0LL)
|
|
|
ce426f |
+ if (lo != 0)
|
|
|
ce426f |
{
|
|
|
ce426f |
- /* hidden2 bit of low double controls rounding of the high double.
|
|
|
ce426f |
- If hidden2 is '1' then round up hi and adjust lo (2nd mantissa)
|
|
|
ce426f |
+ int lzcount;
|
|
|
ce426f |
+
|
|
|
ce426f |
+ /* hidden bit of low double controls rounding of the high double.
|
|
|
ce426f |
+ If hidden is '1' and either the explicit mantissa is non-zero
|
|
|
ce426f |
+ or hi is odd, then round up hi and adjust lo (2nd mantissa)
|
|
|
ce426f |
plus change the sign of the low double to compensate. */
|
|
|
ce426f |
- if (hidden2)
|
|
|
ce426f |
+ if ((lo & ((uint64_t) 1 << 52)) != 0
|
|
|
ce426f |
+ && ((hi & 1) != 0 || (lo & (((uint64_t) 1 << 52) - 1)) != 0))
|
|
|
ce426f |
{
|
|
|
ce426f |
hi++;
|
|
|
ce426f |
+ if ((hi & ((uint64_t) 1 << 53)) != 0)
|
|
|
ce426f |
+ {
|
|
|
ce426f |
+ hi = hi >> 1;
|
|
|
ce426f |
+ u.d[0].ieee.exponent++;
|
|
|
ce426f |
+ }
|
|
|
ce426f |
u.d[1].ieee.negative = !sign;
|
|
|
ce426f |
- lo = (1ULL << 53) - lo;
|
|
|
ce426f |
+ lo = ((uint64_t) 1 << 53) - lo;
|
|
|
ce426f |
}
|
|
|
ce426f |
- /* The hidden bit of the lo mantissa is zero so we need to
|
|
|
ce426f |
- normalize the it for the low double. Shift it left until the
|
|
|
ce426f |
- hidden bit is '1' then adjust the 2nd exponent accordingly. */
|
|
|
ce426f |
+ /* Normalize the low double. Shift the mantissa left until
|
|
|
ce426f |
+ the hidden bit is '1' and adjust the exponent accordingly. */
|
|
|
ce426f |
|
|
|
ce426f |
if (sizeof (lo) == sizeof (long))
|
|
|
ce426f |
lzcount = __builtin_clzl (lo);
|
|
|
ce426f |
@@ -91,34 +132,30 @@
|
|
|
ce426f |
lzcount = __builtin_clzl ((long) (lo >> 32));
|
|
|
ce426f |
else
|
|
|
ce426f |
lzcount = __builtin_clzl ((long) lo) + 32;
|
|
|
ce426f |
- lzcount = lzcount - 11;
|
|
|
ce426f |
- if (lzcount > 0)
|
|
|
ce426f |
+ lzcount = lzcount - (64 - 53);
|
|
|
ce426f |
+ lo <<= lzcount;
|
|
|
ce426f |
+ expnt2 -= lzcount;
|
|
|
ce426f |
+
|
|
|
ce426f |
+ if (expnt2 >= 1)
|
|
|
ce426f |
+ /* Not denormal. */
|
|
|
ce426f |
+ u.d[1].ieee.exponent = expnt2;
|
|
|
ce426f |
+ else
|
|
|
ce426f |
{
|
|
|
ce426f |
- int expnt2 = u.d[1].ieee.exponent - lzcount;
|
|
|
ce426f |
- if (expnt2 >= 1)
|
|
|
ce426f |
- {
|
|
|
ce426f |
- /* Not denormal. Normalize and set low exponent. */
|
|
|
ce426f |
- lo = lo << lzcount;
|
|
|
ce426f |
- u.d[1].ieee.exponent = expnt2;
|
|
|
ce426f |
- }
|
|
|
ce426f |
+ /* Is denormal. Note that biased exponent of 0 is treated
|
|
|
ce426f |
+ as if it was 1, hence the extra shift. */
|
|
|
ce426f |
+ if (expnt2 > -53)
|
|
|
ce426f |
+ lo >>= 1 - expnt2;
|
|
|
ce426f |
else
|
|
|
ce426f |
- {
|
|
|
ce426f |
- /* Is denormal. */
|
|
|
ce426f |
- lo = lo << (lzcount + expnt2);
|
|
|
ce426f |
- u.d[1].ieee.exponent = 0;
|
|
|
ce426f |
- }
|
|
|
ce426f |
+ lo = 0;
|
|
|
ce426f |
}
|
|
|
ce426f |
}
|
|
|
ce426f |
else
|
|
|
ce426f |
- {
|
|
|
ce426f |
- u.d[1].ieee.negative = 0;
|
|
|
ce426f |
- u.d[1].ieee.exponent = 0;
|
|
|
ce426f |
- }
|
|
|
ce426f |
+ u.d[1].ieee.negative = 0;
|
|
|
ce426f |
|
|
|
ce426f |
- u.d[1].ieee.mantissa1 = lo & ((1ULL << 32) - 1);
|
|
|
ce426f |
- u.d[1].ieee.mantissa0 = (lo >> 32) & ((1ULL << 20) - 1);
|
|
|
ce426f |
- u.d[0].ieee.mantissa1 = hi & ((1ULL << 32) - 1);
|
|
|
ce426f |
- u.d[0].ieee.mantissa0 = (hi >> 32) & ((1ULL << 20) - 1);
|
|
|
ce426f |
+ u.d[1].ieee.mantissa1 = lo;
|
|
|
ce426f |
+ u.d[1].ieee.mantissa0 = lo >> 32;
|
|
|
ce426f |
+ u.d[0].ieee.mantissa1 = hi;
|
|
|
ce426f |
+ u.d[0].ieee.mantissa0 = hi >> 32;
|
|
|
ce426f |
return u.ld;
|
|
|
ce426f |
}
|
|
|
ce426f |
|
|
|
ce426f |
@@ -133,6 +170,10 @@
|
|
|
ce426f |
return u.ld;
|
|
|
ce426f |
}
|
|
|
ce426f |
|
|
|
ce426f |
+/* To suit our callers we return *hi64 and *lo64 as if they came from
|
|
|
ce426f |
+ an ieee854 112 bit mantissa, that is, 48 bits in *hi64 (plus one
|
|
|
ce426f |
+ implicit bit) and 64 bits in *lo64. */
|
|
|
ce426f |
+
|
|
|
ce426f |
static inline void
|
|
|
ce426f |
default_ldbl_unpack (long double l, double *a, double *aa)
|
|
|
ce426f |
{
|
|
|
ce426f |
@@ -162,13 +203,13 @@
|
|
|
ce426f |
*aa = xl;
|
|
|
ce426f |
}
|
|
|
ce426f |
|
|
|
ce426f |
-/* Simple inline nearbyint (double) function .
|
|
|
ce426f |
+/* Simple inline nearbyint (double) function.
|
|
|
ce426f |
Only works in the default rounding mode
|
|
|
ce426f |
but is useful in long double rounding functions. */
|
|
|
ce426f |
static inline double
|
|
|
ce426f |
ldbl_nearbyint (double a)
|
|
|
ce426f |
{
|
|
|
ce426f |
- double two52 = 0x10000000000000LL;
|
|
|
ce426f |
+ double two52 = 0x1p52;
|
|
|
ce426f |
|
|
|
ce426f |
if (__builtin_expect ((__builtin_fabs (a) < two52), 1))
|
|
|
ce426f |
{
|
|
|
ce426f |
diff -urN glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/mpn2ldbl.c glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/mpn2ldbl.c
|
|
|
ce426f |
--- glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/mpn2ldbl.c 2014-05-27 19:13:56.000000000 -0500
|
|
|
ce426f |
+++ glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/mpn2ldbl.c 2014-05-27 19:14:45.000000000 -0500
|
|
|
ce426f |
@@ -70,9 +70,9 @@
|
|
|
ce426f |
else
|
|
|
ce426f |
lzcount = __builtin_clzl ((long) val) + 32;
|
|
|
ce426f |
if (hi)
|
|
|
ce426f |
- lzcount = lzcount - 11;
|
|
|
ce426f |
+ lzcount = lzcount - (64 - 53);
|
|
|
ce426f |
else
|
|
|
ce426f |
- lzcount = lzcount + 42;
|
|
|
ce426f |
+ lzcount = lzcount + 53 - (64 - 53);
|
|
|
ce426f |
|
|
|
ce426f |
if (lzcount > u.d[0].ieee.exponent)
|
|
|
ce426f |
{
|
|
|
ce426f |
@@ -98,29 +98,27 @@
|
|
|
ce426f |
}
|
|
|
ce426f |
}
|
|
|
ce426f |
|
|
|
ce426f |
- if (lo != 0L)
|
|
|
ce426f |
+ if (lo != 0)
|
|
|
ce426f |
{
|
|
|
ce426f |
- /* hidden2 bit of low double controls rounding of the high double.
|
|
|
ce426f |
- If hidden2 is '1' and either the explicit mantissa is non-zero
|
|
|
ce426f |
+ /* hidden bit of low double controls rounding of the high double.
|
|
|
ce426f |
+ If hidden is '1' and either the explicit mantissa is non-zero
|
|
|
ce426f |
or hi is odd, then round up hi and adjust lo (2nd mantissa)
|
|
|
ce426f |
plus change the sign of the low double to compensate. */
|
|
|
ce426f |
if ((lo & (1LL << 52)) != 0
|
|
|
ce426f |
- && ((hi & 1) != 0 || (lo & ((1LL << 52) - 1))))
|
|
|
ce426f |
+ && ((hi & 1) != 0 || (lo & ((1LL << 52) - 1)) != 0))
|
|
|
ce426f |
{
|
|
|
ce426f |
hi++;
|
|
|
ce426f |
- if ((hi & ((1LL << 52) - 1)) == 0)
|
|
|
ce426f |
+ if ((hi & (1LL << 53)) != 0)
|
|
|
ce426f |
{
|
|
|
ce426f |
- if ((hi & (1LL << 53)) != 0)
|
|
|
ce426f |
- hi -= 1LL << 52;
|
|
|
ce426f |
+ hi >>= 1;
|
|
|
ce426f |
u.d[0].ieee.exponent++;
|
|
|
ce426f |
}
|
|
|
ce426f |
u.d[1].ieee.negative = !sign;
|
|
|
ce426f |
lo = (1LL << 53) - lo;
|
|
|
ce426f |
}
|
|
|
ce426f |
|
|
|
ce426f |
- /* The hidden bit of the lo mantissa is zero so we need to normalize
|
|
|
ce426f |
- it for the low double. Shift it left until the hidden bit is '1'
|
|
|
ce426f |
- then adjust the 2nd exponent accordingly. */
|
|
|
ce426f |
+ /* Normalize the low double. Shift the mantissa left until
|
|
|
ce426f |
+ the hidden bit is '1' and adjust the exponent accordingly. */
|
|
|
ce426f |
|
|
|
ce426f |
if (sizeof (lo) == sizeof (long))
|
|
|
ce426f |
lzcount = __builtin_clzl (lo);
|
|
|
ce426f |
@@ -128,24 +126,24 @@
|
|
|
ce426f |
lzcount = __builtin_clzl ((long) (lo >> 32));
|
|
|
ce426f |
else
|
|
|
ce426f |
lzcount = __builtin_clzl ((long) lo) + 32;
|
|
|
ce426f |
- lzcount = lzcount - 11;
|
|
|
ce426f |
- if (lzcount > 0)
|
|
|
ce426f |
- {
|
|
|
ce426f |
- lo = lo << lzcount;
|
|
|
ce426f |
- exponent2 = exponent2 - lzcount;
|
|
|
ce426f |
- }
|
|
|
ce426f |
+ lzcount = lzcount - (64 - 53);
|
|
|
ce426f |
+ lo <<= lzcount;
|
|
|
ce426f |
+ exponent2 -= lzcount;
|
|
|
ce426f |
+
|
|
|
ce426f |
if (exponent2 > 0)
|
|
|
ce426f |
u.d[1].ieee.exponent = exponent2;
|
|
|
ce426f |
- else
|
|
|
ce426f |
+ else if (exponent2 > -53)
|
|
|
ce426f |
lo >>= 1 - exponent2;
|
|
|
ce426f |
+ else
|
|
|
ce426f |
+ lo = 0;
|
|
|
ce426f |
}
|
|
|
ce426f |
else
|
|
|
ce426f |
u.d[1].ieee.negative = 0;
|
|
|
ce426f |
|
|
|
ce426f |
- u.d[1].ieee.mantissa1 = lo & 0xffffffffLL;
|
|
|
ce426f |
- u.d[1].ieee.mantissa0 = (lo >> 32) & 0xfffff;
|
|
|
ce426f |
- u.d[0].ieee.mantissa1 = hi & 0xffffffffLL;
|
|
|
ce426f |
- u.d[0].ieee.mantissa0 = (hi >> 32) & ((1LL << (LDBL_MANT_DIG - 86)) - 1);
|
|
|
ce426f |
+ u.d[1].ieee.mantissa1 = lo;
|
|
|
ce426f |
+ u.d[1].ieee.mantissa0 = lo >> 32;
|
|
|
ce426f |
+ u.d[0].ieee.mantissa1 = hi;
|
|
|
ce426f |
+ u.d[0].ieee.mantissa0 = hi >> 32;
|
|
|
ce426f |
|
|
|
ce426f |
return u.ld;
|
|
|
ce426f |
}
|
|
|
ce426f |
diff -urN glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/printf_fphex.c glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/printf_fphex.c
|
|
|
ce426f |
--- glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/printf_fphex.c 2014-05-27 19:13:56.000000000 -0500
|
|
|
ce426f |
+++ glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/printf_fphex.c 2014-05-27 19:14:45.000000000 -0500
|
|
|
ce426f |
@@ -43,15 +43,15 @@
|
|
|
ce426f |
lo <<= 1; \
|
|
|
ce426f |
/* The lower double is normalized separately from the upper. We \
|
|
|
ce426f |
may need to adjust the lower manitissa to reflect this. */ \
|
|
|
ce426f |
- ediff = u.d[0].ieee.exponent - u.d[1].ieee.exponent; \
|
|
|
ce426f |
- if (ediff > 53 + 63) \
|
|
|
ce426f |
+ ediff = u.d[0].ieee.exponent - u.d[1].ieee.exponent - 53; \
|
|
|
ce426f |
+ if (ediff > 63) \
|
|
|
ce426f |
lo = 0; \
|
|
|
ce426f |
- else if (ediff > 53) \
|
|
|
ce426f |
- lo = lo >> (ediff - 53); \
|
|
|
ce426f |
- else if (u.d[1].ieee.exponent == 0 && ediff < 53) \
|
|
|
ce426f |
- lo = lo << (53 - ediff); \
|
|
|
ce426f |
+ else if (ediff > 0) \
|
|
|
ce426f |
+ lo = lo >> ediff; \
|
|
|
ce426f |
+ else if (ediff < 0) \
|
|
|
ce426f |
+ lo = lo << -ediff; \
|
|
|
ce426f |
if (u.d[0].ieee.negative != u.d[1].ieee.negative \
|
|
|
ce426f |
- && (u.d[1].ieee.exponent != 0 || lo != 0L)) \
|
|
|
ce426f |
+ && lo != 0) \
|
|
|
ce426f |
{ \
|
|
|
ce426f |
lo = (1ULL << 60) - lo; \
|
|
|
ce426f |
if (hi == 0L) \
|