mirror of
https://sourceware.org/git/glibc.git
synced 2024-12-03 02:11:08 +00:00
f67a8147b0
Use sqrt(f/l) to enable inlining by GCC - if inlining doesn't happen, the asm redirect ensures we will still call __ieee754_sqrt(f/l). * sysdeps/ieee754/dbl-64/e_acosh.c (__ieee754_acosh): Use sqrt. * sysdeps/ieee754/dbl-64/e_gamma_r.c (gamma_positive): Likewise. * sysdeps/ieee754/dbl-64/e_hypot.c (__ieee754_hypot): Likewise. * sysdeps/ieee754/dbl-64/e_j0.c (__ieee754_j0): Likewise. * sysdeps/ieee754/dbl-64/e_j1.c (__ieee754_j1): Likewise. * sysdeps/ieee754/dbl-64/e_jn.c (__ieee754_jn): Likewise. * sysdeps/ieee754/dbl-64/s_asinh.c (__asinh): Likewise. * sysdeps/ieee754/dbl-64/wordsize-64/e_acosh.c (__ieee754_acosh): Likewise. * sysdeps/ieee754/flt-32/e_acosf.c (__ieee754_acosf): Likewise. * sysdeps/ieee754/flt-32/e_acoshf.c (__ieee754_acoshf): Likewise. * sysdeps/ieee754/flt-32/e_asinf.c (__ieee754_asinf): Likewise. * sysdeps/ieee754/flt-32/e_gammaf_r.c (gammaf_positive): Likewise. * sysdeps/ieee754/flt-32/e_hypotf.c (__ieee754_hypotf): Likewise. * sysdeps/ieee754/flt-32/e_j0f.c (__ieee754_j0f): Likewise. * sysdeps/ieee754/flt-32/e_j1f.c (__ieee754_j1f): Likewise. * sysdeps/ieee754/flt-32/e_powf.c (__ieee754_powf): Likewise. * sysdeps/ieee754/flt-32/s_asinhf.c (__asinhf): Likewise. * sysdeps/ieee754/ldbl-128/e_acoshl.c (__ieee754_acoshl): Use sqrtl. * sysdeps/ieee754/ldbl-128/e_acosl.c (__ieee754_acosl): Likewise. * sysdeps/ieee754/ldbl-128/e_asinl.c (__ieee754_asinl): Likewise. * sysdeps/ieee754/ldbl-128/e_gammal_r.c (gammal_positive): Likewise. * sysdeps/ieee754/ldbl-128/e_hypotl.c (__ieee754_hypotl): Likewise. * sysdeps/ieee754/ldbl-128/e_j0l.c (__ieee754_j0l): Likewise. * sysdeps/ieee754/ldbl-128/e_j1l.c (__ieee754_j1l): Likewise. * sysdeps/ieee754/ldbl-128/e_jnl.c (__ieee754_jnl): Likewise. * sysdeps/ieee754/ldbl-128/e_powl.c (__ieee754_powl): Likewise. * sysdeps/ieee754/ldbl-128/s_asinhl.c (__ieee754_asinhl): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_acoshl.c (__ieee754_acoshl): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_acosl.c (__ieee754_acosl): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_asinl.c (__ieee754_asinl): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_gammal_r.c (gammal_positive): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_hypotl.c (__ieee754_hypotl): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_j0l.c (__ieee754_j0l): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_j1l.c (__ieee754_j1l): Likewise * sysdeps/ieee754/ldbl-128ibm/e_jnl.c (__ieee754_jnl): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_powl.c (__ieee754_powl): Likewise. * sysdeps/ieee754/ldbl-128ibm/s_asinhl.c (__ieee754_asinhl): Likewise. * sysdeps/ieee754/ldbl-96/e_acoshl.c (__ieee754_acoshl): Use sqrtl. * sysdeps/ieee754/ldbl-96/e_asinl.c (__ieee754_asinl): Likewise. * sysdeps/ieee754/ldbl-96/e_gammal_r.c (gammal_positive): Likewise. * sysdeps/ieee754/ldbl-96/e_hypotl.c (__ieee754_hypotl): Likewise. * sysdeps/ieee754/ldbl-96/e_j0l.c (__ieee754_j0l): Likewise. * sysdeps/ieee754/ldbl-96/e_j1l.c (__ieee754_j1l): Likewise. * sysdeps/ieee754/ldbl-96/e_jnl.c (__ieee754_jnl): Likewise. * sysdeps/ieee754/ldbl-96/s_asinhl.c (__ieee754_asinhl): Likewise. * sysdeps/m68k/m680x0/fpu/e_pow.c (__ieee754_pow): Likewise. * sysdeps/powerpc/fpu/e_hypot.c (__ieee754_hypot): Likewise. * sysdeps/powerpc/fpu/e_hypotf.c (__ieee754_hypotf): Likewise.
135 lines
4.4 KiB
C
135 lines
4.4 KiB
C
/* Pythagorean addition using doubles
|
|
Copyright (C) 2011-2018 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library
|
|
Contributed by Adhemerval Zanella <azanella@br.ibm.com>, 2011
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Library General Public License as
|
|
published by the Free Software Foundation; either version 2 of the
|
|
License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Library General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Library General Public
|
|
License along with the GNU C Library; see the file COPYING.LIB. If
|
|
not, see <http://www.gnu.org/licenses/>. */
|
|
|
|
#include <math.h>
|
|
#include <math_private.h>
|
|
#include <stdint.h>
|
|
|
|
static const double two60 = 1.152921504606847e+18;
|
|
static const double two500 = 3.2733906078961419e+150;
|
|
static const double two600 = 4.149515568880993e+180;
|
|
static const double two1022 = 4.49423283715579e+307;
|
|
static const double twoM500 = 3.054936363499605e-151;
|
|
static const double twoM600 = 2.4099198651028841e-181;
|
|
static const double two60factor = 1.5592502418239997e+290;
|
|
static const double pdnum = 2.225073858507201e-308;
|
|
|
|
/* __ieee754_hypot(x,y)
|
|
*
|
|
* This a FP only version without any FP->INT conversion.
|
|
* It is similar to default C version, making appropriates
|
|
* overflow and underflows checks as well scaling when it
|
|
* is needed.
|
|
*/
|
|
|
|
#ifdef _ARCH_PWR7
|
|
/* POWER7 isinf and isnan optimization are fast. */
|
|
# define TEST_INF_NAN(x, y) \
|
|
if ((isinf(x) || isinf(y)) \
|
|
&& !issignaling (x) && !issignaling (y)) \
|
|
return INFINITY; \
|
|
if (isnan(x) || isnan(y)) \
|
|
return x + y;
|
|
# else
|
|
/* For POWER6 and below isinf/isnan triggers LHS and PLT calls are
|
|
* costly (especially for POWER6). */
|
|
# define GET_TW0_HIGH_WORD(d1,d2,i1,i2) \
|
|
do { \
|
|
ieee_double_shape_type gh_u1; \
|
|
ieee_double_shape_type gh_u2; \
|
|
gh_u1.value = (d1); \
|
|
gh_u2.value = (d2); \
|
|
(i1) = gh_u1.parts.msw & 0x7fffffff; \
|
|
(i2) = gh_u2.parts.msw & 0x7fffffff; \
|
|
} while (0)
|
|
|
|
# define TEST_INF_NAN(x, y) \
|
|
do { \
|
|
uint32_t hx, hy; \
|
|
GET_TW0_HIGH_WORD(x, y, hx, hy); \
|
|
if (hy > hx) { \
|
|
uint32_t ht = hx; hx = hy; hy = ht; \
|
|
} \
|
|
if (hx >= 0x7ff00000) { \
|
|
if ((hx == 0x7ff00000 || hy == 0x7ff00000) \
|
|
&& !issignaling (x) && !issignaling (y)) \
|
|
return INFINITY; \
|
|
return x + y; \
|
|
} \
|
|
} while (0)
|
|
|
|
#endif
|
|
|
|
|
|
double
|
|
__ieee754_hypot (double x, double y)
|
|
{
|
|
x = fabs (x);
|
|
y = fabs (y);
|
|
|
|
TEST_INF_NAN (x, y);
|
|
|
|
if (y > x)
|
|
{
|
|
double t = x;
|
|
x = y;
|
|
y = t;
|
|
}
|
|
if (y == 0.0)
|
|
return x;
|
|
/* if y is higher enough, y * 2^60 might overflow. The tests if
|
|
y >= 1.7976931348623157e+308/2^60 (two60factor) and uses the
|
|
appropriate check to avoid the overflow exception generation. */
|
|
if (y > two60factor)
|
|
{
|
|
if ((x / y) > two60)
|
|
return x + y;
|
|
}
|
|
else
|
|
{
|
|
if (x > (y * two60))
|
|
return x + y;
|
|
}
|
|
if (x > two500)
|
|
{
|
|
x *= twoM600;
|
|
y *= twoM600;
|
|
return sqrt (x * x + y * y) / twoM600;
|
|
}
|
|
if (y < twoM500)
|
|
{
|
|
if (y <= pdnum)
|
|
{
|
|
x *= two1022;
|
|
y *= two1022;
|
|
double ret = sqrt (x * x + y * y) / two1022;
|
|
math_check_force_underflow_nonneg (ret);
|
|
return ret;
|
|
}
|
|
else
|
|
{
|
|
x *= two600;
|
|
y *= two600;
|
|
return sqrt (x * x + y * y) / two600;
|
|
}
|
|
}
|
|
return sqrt (x * x + y * y);
|
|
}
|
|
strong_alias (__ieee754_hypot, __hypot_finite)
|