# commit 62a728aeff93507ce5975f245a5f1d2046fb4503
# Author: Alan Modra <amodra@gmail.com>
# Date:   Sat Aug 17 18:27:19 2013 +0930
# 
#     PowerPC floating point little-endian [6 of 15]
#     http://sourceware.org/ml/libc-alpha/2013-07/msg00197.html
#     
#     A rewrite to make this code correct for little-endian.
#     
#         * sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c (mynumber): Replace
#         union 32-bit int array member with 64-bit int array.
#         (t512, tm256): Double rather than long double.
#         (__ieee754_sqrtl): Rewrite using 64-bit arithmetic.
#
diff -urN glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c
--- glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c	2014-05-27 22:20:12.000000000 -0500
+++ glibc-2.17-c758a686/sysdeps/ieee754/ldbl-128ibm/e_sqrtl.c	2014-05-27 22:21:39.000000000 -0500
@@ -34,15 +34,13 @@
 
 #include <math_private.h>
 
-typedef unsigned int int4;
-typedef union {int4 i[4]; long double x; double d[2]; } mynumber;
+typedef union {int64_t i[2]; long double x; double d[2]; } mynumber;
 
-static const  mynumber
-  t512 = {{0x5ff00000, 0x00000000, 0x00000000, 0x00000000 }},  /* 2^512  */
-  tm256 = {{0x2ff00000, 0x00000000, 0x00000000, 0x00000000 }};  /* 2^-256 */
 static const double
-two54 = 1.80143985094819840000e+16, /* 0x4350000000000000 */
-twom54 = 5.55111512312578270212e-17; /* 0x3C90000000000000 */
+  t512 = 0x1p512,
+  tm256 = 0x1p-256,
+  two54 = 0x1p54,	/* 0x4350000000000000 */
+  twom54 = 0x1p-54;	/* 0x3C90000000000000 */
 
 /*********************************************************************/
 /* An ultimate sqrt routine. Given an IEEE double machine number x   */
@@ -54,56 +52,53 @@
   static const long double big = 134217728.0, big1 = 134217729.0;
   long double t,s,i;
   mynumber a,c;
-  int4 k, l, m;
-  int n;
+  uint64_t k, l;
+  int64_t m, n;
   double d;
 
   a.x=x;
-  k=a.i[0] & 0x7fffffff;
+  k=a.i[0] & INT64_C(0x7fffffffffffffff);
   /*----------------- 2^-1022  <= | x |< 2^1024  -----------------*/
-  if (k>0x000fffff && k<0x7ff00000) {
+  if (k>INT64_C(0x000fffff00000000) && k<INT64_C(0x7ff0000000000000)) {
     if (x < 0) return (big1-big1)/(big-big);
-    l = (k&0x001fffff)|0x3fe00000;
-    if (((a.i[2] & 0x7fffffff) | a.i[3]) != 0) {
-      n = (int) ((l - k) * 2) >> 21;
-      m = (a.i[2] >> 20) & 0x7ff;
+    l = (k&INT64_C(0x001fffffffffffff))|INT64_C(0x3fe0000000000000);
+    if ((a.i[1] & INT64_C(0x7fffffffffffffff)) != 0) {
+      n = (int64_t) ((l - k) * 2) >> 53;
+      m = (a.i[1] >> 52) & 0x7ff;
       if (m == 0) {
 	a.d[1] *= two54;
-	m = ((a.i[2] >> 20) & 0x7ff) - 54;
+	m = ((a.i[1] >> 52) & 0x7ff) - 54;
       }
       m += n;
-      if ((int) m > 0)
-	a.i[2] = (a.i[2] & 0x800fffff) | (m << 20);
-      else if ((int) m <= -54) {
-	a.i[2] &= 0x80000000;
-	a.i[3] = 0;
+      if (m > 0)
+	a.i[1] = (a.i[1] & INT64_C(0x800fffffffffffff)) | (m << 52);
+      else if (m <= -54) {
+	a.i[1] &= INT64_C(0x8000000000000000);
       } else {
 	m += 54;
-	a.i[2] = (a.i[2] & 0x800fffff) | (m << 20);
+	a.i[1] = (a.i[1] & INT64_C(0x800fffffffffffff)) | (m << 52);
 	a.d[1] *= twom54;
       }
     }
     a.i[0] = l;
     s = a.x;
     d = __ieee754_sqrt (a.d[0]);
-    c.i[0] = 0x20000000+((k&0x7fe00000)>>1);
+    c.i[0] = INT64_C(0x2000000000000000)+((k&INT64_C(0x7fe0000000000000))>>1);
     c.i[1] = 0;
-    c.i[2] = 0;
-    c.i[3] = 0;
     i = d;
     t = 0.5L * (i + s / i);
     i = 0.5L * (t + s / t);
     return c.x * i;
   }
   else {
-    if (k>=0x7ff00000) {
-      if (a.i[0] == 0xfff00000 && a.i[1] == 0)
+    if (k>=INT64_C(0x7ff0000000000000)) {
+      if (a.i[0] == INT64_C(0xfff0000000000000))
 	return (big1-big1)/(big-big); /* sqrt (-Inf) = NaN.  */
       return x; /* sqrt (NaN) = NaN, sqrt (+Inf) = +Inf.  */
     }
     if (x == 0) return x;
     if (x < 0) return (big1-big1)/(big-big);
-    return tm256.x*__ieee754_sqrtl(x*t512.x);
+    return tm256*__ieee754_sqrtl(x*t512);
   }
 }
 strong_alias (__ieee754_sqrtl, __sqrtl_finite)