5de29b
# commit 62a728aeff93507ce5975f245a5f1d2046fb4503
5de29b
# Author: Alan Modra <amodra@gmail.com>
5de29b
# Date:   Sat Aug 17 18:27:19 2013 +0930
5de29b
# 
5de29b
#     PowerPC floating point little-endian [6 of 15]
5de29b
#     http://sourceware.org/ml/libc-alpha/2013-07/msg00197.html
5de29b
#     
5de29b
#     A rewrite to make this code correct for little-endian.
5de29b
#     
5de29b
#         * sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c (mynumber): Replace
5de29b
#         union 32-bit int array member with 64-bit int array.
5de29b
#         (t515, tm256): Double rather than long double.
5de29b
#         (__ieee754_sqrtl): Rewrite using 64-bit arithmetic.
5de29b
#
5de29b
diff -urN glibc-2.17-c758a686.orig/sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c glibc-2.17-c758a686.diff/sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c
5de29b
--- glibc-2.17-c758a686.orig/sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c	2014-05-27 22:20:12.000000000 -0500
5de29b
+++ glibc-2.17-c758a686.diff/sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c	2014-05-27 22:21:39.000000000 -0500
5de29b
@@ -34,15 +34,13 @@
5de29b
 
5de29b
 #include <math_private.h>
5de29b
 
5de29b
-typedef unsigned int int4;
5de29b
-typedef union {int4 i[4]; long double x; double d[2]; } mynumber;
5de29b
+typedef union {int64_t i[2]; long double x; double d[2]; } mynumber;
5de29b
 
5de29b
-static const  mynumber
5de29b
-  t512 = {{0x5ff00000, 0x00000000, 0x00000000, 0x00000000 }},  /* 2^512  */
5de29b
-  tm256 = {{0x2ff00000, 0x00000000, 0x00000000, 0x00000000 }};  /* 2^-256 */
5de29b
 static const double
5de29b
-two54 = 1.80143985094819840000e+16, /* 0x4350000000000000 */
5de29b
-twom54 = 5.55111512312578270212e-17; /* 0x3C90000000000000 */
5de29b
+  t512 = 0x1p512,
5de29b
+  tm256 = 0x1p-256,
5de29b
+  two54 = 0x1p54,	/* 0x4350000000000000 */
5de29b
+  twom54 = 0x1p-54;	/* 0x3C90000000000000 */
5de29b
 
5de29b
 /*********************************************************************/
5de29b
 /* An ultimate sqrt routine. Given an IEEE double machine number x   */
5de29b
@@ -54,56 +52,53 @@
5de29b
   static const long double big = 134217728.0, big1 = 134217729.0;
5de29b
   long double t,s,i;
5de29b
   mynumber a,c;
5de29b
-  int4 k, l, m;
5de29b
-  int n;
5de29b
+  uint64_t k, l;
5de29b
+  int64_t m, n;
5de29b
   double d;
5de29b
 
5de29b
   a.x=x;
5de29b
-  k=a.i[0] & 0x7fffffff;
5de29b
+  k=a.i[0] & INT64_C(0x7fffffffffffffff);
5de29b
   /*----------------- 2^-1022  <= | x |< 2^1024  -----------------*/
5de29b
-  if (k>0x000fffff && k<0x7ff00000) {
5de29b
+  if (k>INT64_C(0x000fffff00000000) && k
5de29b
     if (x < 0) return (big1-big1)/(big-big);
5de29b
-    l = (k&0x001fffff)|0x3fe00000;
5de29b
-    if (((a.i[2] & 0x7fffffff) | a.i[3]) != 0) {
5de29b
-      n = (int) ((l - k) * 2) >> 21;
5de29b
-      m = (a.i[2] >> 20) & 0x7ff;
5de29b
+    l = (k&INT64_C(0x001fffffffffffff))|INT64_C(0x3fe0000000000000);
5de29b
+    if ((a.i[1] & INT64_C(0x7fffffffffffffff)) != 0) {
5de29b
+      n = (int64_t) ((l - k) * 2) >> 53;
5de29b
+      m = (a.i[1] >> 52) & 0x7ff;
5de29b
       if (m == 0) {
5de29b
 	a.d[1] *= two54;
5de29b
-	m = ((a.i[2] >> 20) & 0x7ff) - 54;
5de29b
+	m = ((a.i[1] >> 52) & 0x7ff) - 54;
5de29b
       }
5de29b
       m += n;
5de29b
-      if ((int) m > 0)
5de29b
-	a.i[2] = (a.i[2] & 0x800fffff) | (m << 20);
5de29b
-      else if ((int) m <= -54) {
5de29b
-	a.i[2] &= 0x80000000;
5de29b
-	a.i[3] = 0;
5de29b
+      if (m > 0)
5de29b
+	a.i[1] = (a.i[1] & INT64_C(0x800fffffffffffff)) | (m << 52);
5de29b
+      else if (m <= -54) {
5de29b
+	a.i[1] &= INT64_C(0x8000000000000000);
5de29b
       } else {
5de29b
 	m += 54;
5de29b
-	a.i[2] = (a.i[2] & 0x800fffff) | (m << 20);
5de29b
+	a.i[1] = (a.i[1] & INT64_C(0x800fffffffffffff)) | (m << 52);
5de29b
 	a.d[1] *= twom54;
5de29b
       }
5de29b
     }
5de29b
     a.i[0] = l;
5de29b
     s = a.x;
5de29b
     d = __ieee754_sqrt (a.d[0]);
5de29b
-    c.i[0] = 0x20000000+((k&0x7fe00000)>>1);
5de29b
+    c.i[0] = INT64_C(0x2000000000000000)+((k&INT64_C(0x7fe0000000000000))>>1);
5de29b
     c.i[1] = 0;
5de29b
-    c.i[2] = 0;
5de29b
-    c.i[3] = 0;
5de29b
     i = d;
5de29b
     t = 0.5L * (i + s / i);
5de29b
     i = 0.5L * (t + s / t);
5de29b
     return c.x * i;
5de29b
   }
5de29b
   else {
5de29b
-    if (k>=0x7ff00000) {
5de29b
-      if (a.i[0] == 0xfff00000 && a.i[1] == 0)
5de29b
+    if (k>=INT64_C(0x7ff0000000000000)) {
5de29b
+      if (a.i[0] == INT64_C(0xfff0000000000000))
5de29b
 	return (big1-big1)/(big-big); /* sqrt (-Inf) = NaN.  */
5de29b
       return x; /* sqrt (NaN) = NaN, sqrt (+Inf) = +Inf.  */
5de29b
     }
5de29b
     if (x == 0) return x;
5de29b
     if (x < 0) return (big1-big1)/(big-big);
5de29b
-    return tm256.x*__ieee754_sqrtl(x*t512.x);
5de29b
+    return tm256*__ieee754_sqrtl(x*t512);
5de29b
   }
5de29b
 }
5de29b
 strong_alias (__ieee754_sqrtl, __sqrtl_finite)