glibc/sysdeps/powerpc/bits/fenvinline.h
Paul A. Clarke 3db85a9814 powerpc: Use faster means to access FPSCR when possible in some cases
Using 'mffs' instruction to read the Floating Point Status Control Register
(FPSCR) can force a processor flush in some cases, with undesirable
performance impact.  If the values of the bits in the FPSCR which force the
flush are not needed, an instruction that is new to POWER9 (ISA version 3.0),
'mffsl' can be used instead.

Cases included:  get_rounding_mode, fegetround, fegetmode, fegetexcept.

	* sysdeps/powerpc/bits/fenvinline.h (__fegetround): Use
	__fegetround_ISA300() or __fegetround_ISA2() as appropriate.
	(__fegetround_ISA300): New.
	(__fegetround_ISA2): New.
	* sysdeps/powerpc/fpu_control.h (IS_ISA300): New.
	(_FPU_MFFS): Move implementation...
	(_FPU_GETCW): Here.
	(_FPU_MFFSL): Move implementation...
	(_FPU_GET_RC_ISA300): Here. New.
	(_FPU_GET_RC): Use _FPU_GET_RC_ISA300() or _FPU_GETCW() as appropriate.
	* sysdeps/powerpc/fpu/fenv_libc.h (fegetenv_status_ISA300): New.
	(fegetenv_status): New.
	* sysdeps/powerpc/fpu/fegetmode.c (fegetmode): Use fegetenv_status()
	instead of fegetenv_register().
	* sysdeps/powerpc/fpu/fegetexcept.c (__fegetexcept): Likewise.

Reviewed-by: Tulio Magno Quites Machado Filho <tuliom@linux.ibm.com>
2019-06-30 08:40:44 -03:00

103 lines
3.4 KiB
C

/* Inline floating-point environment handling functions for powerpc.
Copyright (C) 1995-2019 Free Software Foundation, Inc.
This file is part of the GNU C Library.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library; if not, see
<http://www.gnu.org/licenses/>. */
#if defined __GNUC__ && !defined _SOFT_FLOAT && !defined __NO_FPRS__
/* Inline definitions for fegetround. */
/* Read the current rounding mode with the 'mffsl' instruction.

   The instruction's result is placed in a floating-point register,
   reinterpreted as a 64-bit integer through a union, and masked down to
   its two low-order bits.

   The masked value is converted to int so that this expression has the
   same type as __fegetround_ISA2() and as the fegetround function it
   stands in for.  Without the conversion the expression is unsigned long
   long, which changes the type of any conditional expression mixing the
   two variants and is wrong when the value is passed through a variadic
   argument list (for example printf ("%d", fegetround ())).  */
# define __fegetround_ISA300() \
  (__extension__ ({ \
    union { double __d; unsigned long long __ll; } __u; \
    /* Switch the assembler to power9 only around this one instruction.  */ \
    __asm__ __volatile__ ( \
      ".machine push; .machine \"power9\"; mffsl %0; .machine pop" \
      : "=f" (__u.__d)); \
    (int) (__u.__ll & 0x0000000000000003ULL); \
  }))
/* Read the current rounding mode without 'mffsl'.

   'mcrfs 7,7' copies a field of the FPSCR into condition-register field
   7 (declared as clobbered), and 'mfcr' then copies the condition
   register into a general-purpose register.  The two low-order bits of
   that value are the result, as an int.  */
# define __fegetround_ISA2() \
  (__extension__ ({ \
    int __cr_image; \
    __asm__ __volatile__ ("mcrfs 7,7 ; mfcr %0" \
                          : "=r" (__cr_image) \
                          : /* no inputs */ \
                          : "cr7"); \
    (__cr_image & 3); \
  }))
/* Select the implementation behind __fegetround():
   - built for POWER9 (_ARCH_PWR9): always use the 'mffsl' variant;
   - otherwise, if the compiler provides __builtin_cpu_supports: ask it
     for "arch_3_00" and use the 'mffsl' variant when available (the
     expected case), else the ISA 2 variant;
   - otherwise: always use the ISA 2 variant.  */
# if defined _ARCH_PWR9
#  define __fegetround() __fegetround_ISA300()
# elif defined __BUILTIN_CPU_SUPPORTS__
#  define __fegetround() \
  (__glibc_likely (__builtin_cpu_supports ("arch_3_00")) \
   ? __fegetround_ISA300() : __fegetround_ISA2())
# else
#  define __fegetround() __fegetround_ISA2()
# endif
/* Inline replacement for the fegetround function.  */
# define fegetround() __fegetround ()
# ifndef __NO_MATH_INLINES
/* The weird 'i#*X' constraints on the following suppress a gcc
warning when __excepts is not a constant. Otherwise, they mean the
same as just plain 'i'. */
# if __GNUC_PREREQ(3, 4)
/* Inline definition for feraiseexcept.

   Fast path: when __excepts is a compile-time constant that is either 0
   or exactly one exception flag from FE_ALL_EXCEPT other than
   FE_INVALID, the flag is raised with a single 'mtfsb1' on the FPSCR bit
   whose index is __builtin_clz of the flag (nothing is executed for 0),
   and the expression evaluates to 0.

   Slow path: every other argument is handed to the out-of-line
   feraiseexcept function, whose return value becomes the result.  The
   name is not re-expanded inside its own macro, so that call reaches the
   real function.

   The FE_ALL_EXCEPT guard matters: without it any single-bit constant
   (for instance 1) would take the fast path and set an unrelated FPSCR
   bit, such as one of the two low-order rounding-mode bits.  Testing it
   first also avoids evaluating __e - 1 for INT_MIN.

   NOTE(review): FE_INVALID is kept off the fast path, presumably because
   raising it needs more than one FPSCR bit write -- confirm against the
   out-of-line implementation.  */
# define feraiseexcept(__excepts) \
  (__extension__ ({ \
    int __e = (__excepts); \
    int __ret; \
    if (__builtin_constant_p (__e) \
        && (__e & ~FE_ALL_EXCEPT) == 0 /* only real exception flags */ \
        && (__e & (__e - 1)) == 0      /* zero or a single bit */ \
        && __e != FE_INVALID) \
      { \
        if (__e != 0) \
          __asm__ __volatile__ ("mtfsb1 %0" \
                                : : "i#*X" (__builtin_clz (__e))); \
        __ret = 0; \
      } \
    else \
      __ret = feraiseexcept (__e); \
    __ret; \
  }))
/* Inline definition for feclearexcept.

   Fast path: when __excepts is a compile-time constant that is either 0
   or exactly one exception flag from FE_ALL_EXCEPT other than
   FE_INVALID, the flag is cleared with a single 'mtfsb0' on the FPSCR
   bit whose index is __builtin_clz of the flag (nothing is executed for
   0), and the expression evaluates to 0.

   Slow path: every other argument is handed to the out-of-line
   feclearexcept function, whose return value becomes the result.  The
   name is not re-expanded inside its own macro, so that call reaches the
   real function.

   The FE_ALL_EXCEPT guard matters: without it any single-bit constant
   (for instance 1) would take the fast path and clear an unrelated FPSCR
   bit, such as one of the two low-order rounding-mode bits.  Testing it
   first also avoids evaluating __e - 1 for INT_MIN.

   NOTE(review): FE_INVALID is kept off the fast path, presumably because
   clearing it needs more than one FPSCR bit write -- confirm against the
   out-of-line implementation.  */
# define feclearexcept(__excepts) \
  (__extension__ ({ \
    int __e = (__excepts); \
    int __ret; \
    if (__builtin_constant_p (__e) \
        && (__e & ~FE_ALL_EXCEPT) == 0 /* only real exception flags */ \
        && (__e & (__e - 1)) == 0      /* zero or a single bit */ \
        && __e != FE_INVALID) \
      { \
        if (__e != 0) \
          __asm__ __volatile__ ("mtfsb0 %0" \
                                : : "i#*X" (__builtin_clz (__e))); \
        __ret = 0; \
      } \
    else \
      __ret = feclearexcept (__e); \
    __ret; \
  }))
# endif /* __GNUC_PREREQ(3, 4). */
# endif /* !__NO_MATH_INLINES. */
#endif /* __GNUC__ && !_SOFT_FLOAT && !__NO_FPRS__ */