2000-10-26 23:41:17 +00:00
|
|
|
/* e_hypotl.c -- long double version of e_hypot.c.
|
|
|
|
* Conversion to long double by Jakub Jelinek, jakub@redhat.com.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/*
|
|
|
|
* ====================================================
|
|
|
|
* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
|
|
|
|
*
|
|
|
|
* Developed at SunPro, a Sun Microsystems, Inc. business.
|
|
|
|
* Permission to use, copy, modify, and distribute this
|
|
|
|
* software is freely granted, provided that this notice
|
|
|
|
* is preserved.
|
|
|
|
* ====================================================
|
|
|
|
*/
|
|
|
|
|
|
|
|
/* __ieee754_hypotl(x,y)
|
|
|
|
*
|
|
|
|
* Method :
|
|
|
|
* If (assume round-to-nearest) z=x*x+y*y
|
|
|
|
* has error less than sqrtl(2)/2 ulp, then
|
|
|
|
* sqrtl(z) has error less than 1 ulp (exercise).
|
|
|
|
*
|
|
|
|
* So, compute sqrtl(x*x+y*y) with some care as
|
|
|
|
* follows to get the error below 1 ulp:
|
|
|
|
*
|
|
|
|
* Assume x>y>0;
|
|
|
|
* (if possible, set rounding to round-to-nearest)
|
|
|
|
* 1. if x > 2y use
|
|
|
|
* x1*x1+(y*y+(x2*(x+x1))) for x*x+y*y
|
|
|
|
* where x1 = x with lower 64 bits cleared, x2 = x-x1; else
|
|
|
|
* 2. if x <= 2y use
|
|
|
|
* t1*y1+((x-y)*(x-y)+(t1*y2+t2*y))
|
|
|
|
* where t1 = 2x with lower 64 bits cleared, t2 = 2x-t1,
|
|
|
|
* y1= y with lower 64 bits chopped, y2 = y-y1.
|
|
|
|
*
|
|
|
|
* NOTE: scaling may be necessary if some argument is too
|
|
|
|
* large or too tiny
|
|
|
|
*
|
|
|
|
* Special cases:
|
|
|
|
* hypotl(x,y) is INF if x or y is +INF or -INF; else
|
|
|
|
* hypotl(x,y) is NAN if x or y is NAN.
|
|
|
|
*
|
|
|
|
* Accuracy:
|
2011-10-12 15:27:51 +00:00
|
|
|
* hypotl(x,y) returns sqrtl(x^2+y^2) with error less
|
|
|
|
* than 1 ulp (unit in the last place)
|
2000-10-26 23:41:17 +00:00
|
|
|
*/
|
|
|
|
|
2012-03-09 19:29:16 +00:00
|
|
|
#include <math.h>
|
|
|
|
#include <math_private.h>
|
2000-10-26 23:41:17 +00:00
|
|
|
|
2011-10-12 15:27:51 +00:00
|
|
|
/* Compute sqrtl(x*x + y*y) for long double arguments.

   The arguments are ordered by magnitude (a >= b), pre-scaled by a power
   of two when either is very large or very small so that the squares
   neither overflow nor underflow, combined with a split-word formula
   that keeps the error of x*x + y*y small, and finally scaled back.

   Returns a + b when the magnitudes differ by more than 2**120, the
   larger operand when the smaller one is zero, and an infinity if either
   operand is infinite (even when the other one is a NaN).

   GET_LDOUBLE_MSW64 / GET_LDOUBLE_LSW64 / SET_LDOUBLE_MSW64 are taken
   from math_private.h; they are used here to read and write the most and
   least significant 64-bit words of a long double.  */
long double
__ieee754_hypotl(long double x, long double y)
{
    long double a,b,t1,t2,y1,y2,w;
    int64_t j,k,ha,hb;

    /* ha, hb: high words of x and y with the sign bit masked off.  */
    GET_LDOUBLE_MSW64(ha,x);
    ha &= 0x7fffffffffffffffLL;
    GET_LDOUBLE_MSW64(hb,y);
    hb &= 0x7fffffffffffffffLL;

    /* Order the operands so that a carries the larger high word.  */
    if(hb > ha) {a=y;b=x;j=ha; ha=hb;hb=j;} else {a=x;b=y;}
    SET_LDOUBLE_MSW64(a,ha);    /* a <- |a| */
    SET_LDOUBLE_MSW64(b,hb);    /* b <- |b| */

    /* b is too small to influence the result beyond rounding.  */
    if((ha-hb)>0x78000000000000LL) {return a+b;}    /* x/y > 2**120 */

    /* k accumulates the power of two that must be re-applied at the end.  */
    k=0;
    if(ha > 0x5f3f000000000000LL) {    /* a>2**8000 */
        if(ha >= 0x7fff000000000000LL) {    /* Inf or NaN */
            u_int64_t low;
            w = a+b;            /* for sNaN */
            /* An infinite operand wins over a NaN in the other one.  */
            GET_LDOUBLE_LSW64(low,a);
            if(((ha&0xffffffffffffLL)|low)==0) w = a;
            GET_LDOUBLE_LSW64(low,b);
            if(((hb^0x7fff000000000000LL)|low)==0) w = b;
            return w;
        }
        /* scale a and b by 2**-9600 */
        ha -= 0x2580000000000000LL;
        hb -= 0x2580000000000000LL; k += 9600;
        SET_LDOUBLE_MSW64(a,ha);
        SET_LDOUBLE_MSW64(b,hb);
    }
    if(hb < 0x20bf000000000000LL) {    /* b < 2**-8000 */
        if(hb <= 0x0000ffffffffffffLL) {    /* subnormal b or 0 */
            u_int64_t low;
            GET_LDOUBLE_LSW64(low,b);
            if((hb|low)==0) return a;    /* b == 0: result is |a| */
            /* The exponent field cannot be adjusted directly for a
               subnormal, so scale with a real multiplication.  */
            t1=0;
            SET_LDOUBLE_MSW64(t1,0x7ffd000000000000LL);    /* t1=2^16382 */
            b *= t1;
            a *= t1;
            k -= 16382;
            /* Re-read the high words after the multiplication and
               restore the a >= b ordering if it no longer holds.  */
            GET_LDOUBLE_MSW64 (ha, a);
            GET_LDOUBLE_MSW64 (hb, b);
            if (hb > ha)
              {
                t1 = a;
                a = b;
                b = t1;
                j = ha;
                ha = hb;
                hb = j;
              }
        } else {    /* scale a and b by 2^9600 */
            ha += 0x2580000000000000LL;    /* a *= 2^9600 */
            hb += 0x2580000000000000LL;    /* b *= 2^9600 */
            k -= 9600;
            SET_LDOUBLE_MSW64(a,ha);
            SET_LDOUBLE_MSW64(b,hb);
        }
    }

    /* medium size a and b */
    w = a-b;
    if (w>b) {
        /* a > 2b: split a into t1 (low 64 bits cleared) and t2 = a - t1,
           then evaluate t1*t1 + (b*b + t2*(a+t1)).  */
        t1 = 0;
        SET_LDOUBLE_MSW64(t1,ha);
        t2 = a-t1;
        w  = __ieee754_sqrtl(t1*t1-(b*(-b)-t2*(a+t1)));
    } else {
        /* a <= 2b: with a doubled, t1/t2 split 2a and y1/y2 split b;
           evaluate t1*y1 + ((a-b)^2 + (t1*y2 + t2*b)).  */
        a  = a+a;
        y1 = 0;
        SET_LDOUBLE_MSW64(y1,hb);
        y2 = b - y1;
        t1 = 0;
        /* Adding 1 to the exponent field gives the high word of 2a.  */
        SET_LDOUBLE_MSW64(t1,ha+0x0001000000000000LL);
        t2 = a - t1;
        w  = __ieee754_sqrtl(t1*y1-(w*(-w)-(t1*y2+t2*b)));
    }

    if(k!=0) {
        u_int64_t high;
        /* Build t1 = 2**k by adding k to the exponent field of 1.0.
           k is negative on the scale-up paths, so the shift is done in
           an unsigned type: left-shifting a negative signed value is
           undefined behaviour in ISO C.  */
        t1 = 1.0L;
        GET_LDOUBLE_MSW64(high,t1);
        SET_LDOUBLE_MSW64(t1,high+((u_int64_t)k<<48));
        w *= t1;
        /* Force the underflow exception when the rescaled result is
           tiny and inexact (BZ #18803).  */
        math_check_force_underflow_nonneg (w);
        return w;
    } else return w;
}
|
2011-10-12 15:27:51 +00:00
|
|
|
/* Make __hypotl_finite available as a second name for __ieee754_hypotl.
   NOTE(review): strong_alias is not defined in this file; presumably it
   is supplied by a project header -- confirm.  */
strong_alias (__ieee754_hypotl, __hypotl_finite)
|