glibc/sysdeps/i386/fpu/s_asinhl.S
Joseph Myers 8db3cdefef Fix asinh missing underflows (bug 16350).
Similar to various other bugs in this area, some asinh implementations
do not raise the underflow exception for subnormal arguments, when the
result is tiny and inexact.  This patch forces the exception in a
similar way to previous fixes.

Tested for x86_64, x86 and mips64.

	[BZ #16350]
	* sysdeps/i386/fpu/s_asinh.S (__asinh): Force underflow exception
	for arguments with small absolute value.
	* sysdeps/i386/fpu/s_asinhf.S (__asinhf): Likewise.
	* sysdeps/i386/fpu/s_asinhl.S (__asinhl): Likewise.
	* sysdeps/ieee754/dbl-64/s_asinh.c: Include <float.h>.
	(__asinh): Force underflow exception for arguments with small
	absolute value.
	* sysdeps/ieee754/flt-32/s_asinhf.c: Include <float.h>.
	(__asinhf): Force underflow exception for arguments with small
	absolute value.
	* sysdeps/ieee754/ldbl-128/s_asinhl.c: Include <float.h>.
	(__asinhl): Force underflow exception for arguments with small
	absolute value.
	* sysdeps/ieee754/ldbl-128ibm/s_asinhl.c: Include <float.h>.
	(__asinhl): Force underflow exception for arguments with small
	absolute value.
	* sysdeps/ieee754/ldbl-96/s_asinhl.c: Include <float.h>.
	(__asinhl): Force underflow exception for arguments with small
	absolute value.
	* math/auto-libm-test-in: Do not mark underflow exceptions as
	possibly missing for bug 16350.
	* math/auto-libm-test-out: Regenerated.
2015-06-18 23:27:41 +00:00

144 lines
3.7 KiB
ArmAsm

/* ix87 specific implementation of arcsinh.
Copyright (C) 1996-2015 Free Software Foundation, Inc.
This file is part of the GNU C Library.
Contributed by Ulrich Drepper <drepper@cygnus.com>, 1996.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library; if not, see
<http://www.gnu.org/licenses/>. */
#include <machine/asm.h>
.section .rodata
.align ALIGNARG(4)
.type huge,@object
huge: .tfloat 1e+4930
ASM_SIZE_DIRECTIVE(huge)
.align ALIGNARG(4)
/* Please note that we use double value for 1.0. This number
has an exact representation and so we don't get accuracy
problems. The advantage is that the code is simpler. */
.type one,@object
one: .double 1.0
ASM_SIZE_DIRECTIVE(one)
/* It is not important that this constant is precise. It is only
a value which is known to be on the safe side for using the
fyl2xp1 instruction. */
.type limit,@object
limit: .double 0.29
ASM_SIZE_DIRECTIVE(limit)
#ifdef PIC
#define MO(op) op##@GOTOFF(%edx)
#else
#define MO(op) op
#endif
.text
ENTRY(__asinhl)
movl 12(%esp), %ecx
movl $0x7fff, %eax
andl %ecx, %eax
andl $0x8000, %ecx
movl %eax, %edx
orl $0xffff8000, %edx
incl %edx
jz 7f // x in ±Inf or NaN
xorl %ecx, 12(%esp)
fldt 4(%esp) // |x|
cmpl $0x3fde, %eax
jb 2f // |x| < 2^-34
fldln2 // log(2) : |x|
cmpl $0x4020, %eax
fxch // |x| : log(2)
ja 3f // |x| > 2^34
#ifdef PIC
LOAD_PIC_REG (dx)
#endif
cmpl $0x4000, %eax
ja 5f // |x| > 2
// 2^-34 <= |x| <= 2 => y = sign(x)*log1p(|x|+|x|^2/(1+sqrt(1+|x|^2)))
fld %st // |x| : |x| : log(2)
fmul %st(1) // |x|^2 : |x| : log(2)
fld %st // |x|^2 : |x|^2 : |x| : log(2)
faddl MO(one) // 1+|x|^2 : |x|^2 : |x| : log(2)
fsqrt // sqrt(1+|x|^2) : |x|^2 : |x| : log(2)
faddl MO(one) // 1+sqrt(1+|x|^2) : |x|^2 : |x| : log(2)
fdivrp // |x|^2/(1+sqrt(1+|x|^2)) : |x| : log(2)
faddp // |x|+|x|^2/(1+sqrt(1+|x|^2)) : log(2)
fcoml MO(limit)
fnstsw
sahf
ja 6f
fyl2xp1
jecxz 4f
fchs
4: ret
7: fldt 4(%esp)
ret
6: faddl MO(one)
fyl2x
jecxz 4f
fchs
4: ret
// |x| < 2^-34 => y = x (inexact iff |x| != 0.0)
.align ALIGNARG(4)
2:
#ifdef PIC
LOAD_PIC_REG (dx)
#endif
jecxz 4f
fchs // x
4: fld %st // x : x
fldt MO(huge) // huge : x : x
faddp // huge+x : x
fstp %st(0) // x
cmpl $0x0001, %eax
jae 8f
fld %st(0)
fmul %st(0)
fstp %st(0)
8: ret
// |x| > 2^34 => y = sign(x) * (log(|x|) + log(2))
.align ALIGNARG(4)
3: fyl2x // log(|x|)
fldln2 // log(2) : log(|x|)
faddp // log(|x|)+log(2)
jecxz 4f
fchs
4: ret
// |x| > 2 => y = sign(x) * log(2*|x| + 1/(|x|+sqrt(x*x+1)))
.align ALIGNARG(4)
5: fld %st // |x| : |x| : log(2)
fadd %st, %st(1) // |x| : 2*|x| : log(2)
fld %st // |x| : |x| : 2*|x| : log(2)
fmul %st(1) // |x|^2 : |x| : 2*|x| : log(2)
faddl MO(one) // 1+|x|^2 : |x| : 2*|x| : log(2)
fsqrt // sqrt(1+|x|^2) : |x| : 2*|x| : log(2)
faddp // |x|+sqrt(1+|x|^2) : 2*|x| : log(2)
fdivrl MO(one) // 1/(|x|+sqrt(1+|x|^2)) : 2*|x| : log(2)
faddp // 2*|x|+1/(|x|+sqrt(1+|x|^2)) : log(2)
fyl2x // log(2*|x|+1/(|x|+sqrt(1+|x|^2)))
jecxz 4f
fchs
4: ret
END(__asinhl)
weak_alias (__asinhl, asinhl)