mirror of
https://sourceware.org/git/glibc.git
synced 2024-12-27 05:00:15 +00:00
43576de04a
With this patch, the maximal known error for tgamma is now reduced to 9 ulps for dbl-64, for all rounding modes. Since exhaustive testing is not possible for dbl-64, it might be that there are still cases with an error larger than 9 ulps, but all known cases are fixed (intensive tests were done to find cases with large errors). Tested on x86_64 and powerpc (and by Adhemerval Zanella on aarch64, arm, s390x, sparc, and i686). Reviewed-by: Adhemerval Zanella <adhemerval.zanella@linaro.org>
116 lines
3.5 KiB
C
116 lines
3.5 KiB
C
/* Compute full X * Y for double type.
|
|
Copyright (C) 2013-2021 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<https://www.gnu.org/licenses/>. */
|
|
|
|
#ifndef _MUL_SPLIT_H
|
|
#define _MUL_SPLIT_H
|
|
|
|
#include <float.h>
|
|
|
|
/* Calculate X * Y exactly and store the result in *HI + *LO. It is
|
|
given that the values are small enough that no overflow occurs and
|
|
large enough (or zero) that no underflow occurs. */
|
|
|
|
static void
|
|
mul_split (double *hi, double *lo, double x, double y)
|
|
{
|
|
#ifdef __FP_FAST_FMA
|
|
/* Fast built-in fused multiply-add. */
|
|
*hi = x * y;
|
|
*lo = __builtin_fma (x, y, -*hi);
|
|
#else
|
|
/* Apply Dekker's algorithm. */
|
|
*hi = x * y;
|
|
# define C ((1 << (DBL_MANT_DIG + 1) / 2) + 1)
|
|
double x1 = x * C;
|
|
double y1 = y * C;
|
|
# undef C
|
|
x1 = (x - x1) + x1;
|
|
y1 = (y - y1) + y1;
|
|
double x2 = x - x1;
|
|
double y2 = y - y1;
|
|
*lo = (((x1 * y1 - *hi) + x1 * y2) + x2 * y1) + x2 * y2;
|
|
#endif
|
|
}
|
|
|
|
/* Add a + b exactly, such that *hi + *lo = a + b.
|
|
Assumes |a| >= |b| and rounding to nearest. */
|
|
static inline void
|
|
fast_two_sum (double *hi, double *lo, double a, double b)
|
|
{
|
|
double e;
|
|
|
|
*hi = a + b;
|
|
e = *hi - a; /* exact */
|
|
*lo = b - e; /* exact */
|
|
/* Now *hi + *lo = a + b exactly. */
|
|
}
|
|
|
|
/* Multiplication of two floating-point expansions: *hi + *lo is an
|
|
approximation of (h1+l1)*(h2+l2), assuming |l1| <= 1/2*ulp(h1)
|
|
and |l2| <= 1/2*ulp(h2) and rounding to nearest. */
|
|
static inline void
|
|
mul_expansion (double *hi, double *lo, double h1, double l1,
|
|
double h2, double l2)
|
|
{
|
|
double r, e;
|
|
|
|
mul_split (hi, lo, h1, h2);
|
|
r = h1 * l2 + h2 * l1;
|
|
/* Now add r to (hi,lo) using fast two-sum, where we know |r| < |hi|. */
|
|
fast_two_sum (hi, &e, *hi, r);
|
|
*lo -= e;
|
|
}
|
|
|
|
/* Calculate X / Y and store the approximate result in *HI + *LO. It is
|
|
assumed that Y is not zero, that no overflow nor underflow occurs, and
|
|
rounding is to nearest. */
|
|
static inline void
|
|
div_split (double *hi, double *lo, double x, double y)
|
|
{
|
|
double a, b;
|
|
|
|
*hi = x / y;
|
|
mul_split (&a, &b, *hi, y);
|
|
/* a + b = hi*y, which should be near x. */
|
|
a = x - a; /* huge cancellation */
|
|
a = a - b;
|
|
/* Now x ~ hi*y + a thus x/y ~ hi + a/y. */
|
|
*lo = a / y;
|
|
}
|
|
|
|
/* Division of two floating-point expansions: *hi + *lo is an
|
|
approximation of (h1+l1)/(h2+l2), assuming |l1| <= 1/2*ulp(h1)
|
|
and |l2| <= 1/2*ulp(h2), h2+l2 is not zero, and rounding to nearest. */
|
|
static inline void
|
|
div_expansion (double *hi, double *lo, double h1, double l1,
|
|
double h2, double l2)
|
|
{
|
|
double r, e;
|
|
|
|
div_split (hi, lo, h1, h2);
|
|
/* (h1+l1)/(h2+l2) ~ h1/h2 + (l1*h2 - l2*h1)/h2^2 */
|
|
r = (l1 * h2 - l2 * h1) / (h2 * h2);
|
|
/* Now add r to (hi,lo) using fast two-sum, where we know |r| < |hi|. */
|
|
fast_two_sum (hi, &e, *hi, r);
|
|
*lo += e;
|
|
/* Renormalize since |lo| might be larger than 0.5 ulp(hi). */
|
|
fast_two_sum (hi, lo, *hi, *lo);
|
|
}
|
|
|
|
#endif /* _MUL_SPLIT_H */
|