PowerPC: Optimized finite/finitef for POWER8

This patch adds an optimized finite/finitef implementation for POWER8
using the new Move From VSR Doubleword instruction to gain some
cycles on the FP to GPR register move.
This commit is contained in:
Adhemerval Zanella 2014-02-27 09:46:46 -06:00
parent 4393fc119c
commit cac626d60a
7 changed files with 116 additions and 6 deletions

View File

@ -1,3 +1,17 @@
2014-02-27 Adhemerval Zanella <azanella@linux.vnet.ibm.com>
* sysdeps/powerpc/powerpc64/fpu/multiarch/Makefile: Add finite power8
implementation.
* sysdeps/powerpc/powerpc64/fpu/multiarch/s_finite-power8.S: New file:
POWER8 finite ifunc implementation.
* sysdeps/powerpc/powerpc64/fpu/multiarch/s_finite.c (__finite): Add
POWER8 implementation.
* sysdeps/powerpc/powerpc64/fpu/multiarch/s_finitef.c (__finitef):
Likewise.
* sysdeps/powerpc/powerpc64/power8/fpu/s_finite.S: New file:
POWER8 finite implementation.
* sysdeps/powerpc/powerpc64/power8/fpu/s_finitef.S: New file.
2014-02-27 Adhemerval Zanella <azanella@linux.vnet.ibm.com>
* sysdeps/powerpc/powerpc64/fpu/multiarch/Makefile: Add isinf power8

View File

@ -5,7 +5,7 @@ sysdep_routines += s_isnan-power7 s_isnan-power6x s_isnan-power6 \
s_finitef-ppc64 s_isinff-ppc64 s_isinf-power7 \
s_isinf-ppc64 s_modf-power5+ s_modf-ppc64 \
s_modff-power5+ s_modff-ppc64 s_isnan-power8 \
s_isinf-power8
s_isinf-power8 s_finite-power8
libm-sysdep_routines += s_isnan-power7 s_isnan-power6x s_isnan-power6 \
s_isnan-power5 s_isnan-ppc64 s_llround-power6x \
@ -23,7 +23,7 @@ libm-sysdep_routines += s_isnan-power7 s_isnan-power6x s_isnan-power6 \
s_logbl-ppc64 s_modf-power5+ s_modf-ppc64 \
s_modff-power5+ s_modff-ppc64 e_hypot-ppc64 \
e_hypot-power7 e_hypotf-ppc64 e_hypotf-power7 \
s_isnan-power8 s_isinf-power8
s_isnan-power8 s_isinf-power8 s_finite-power8
CFLAGS-s_logbf-power7.c = -mcpu=power7
CFLAGS-s_logbl-power7.c = -mcpu=power7

View File

@ -0,0 +1,33 @@
/* finite(). PowerPC64/POWER8 version.
Copyright (C) 2014 Free Software Foundation, Inc.
This file is part of the GNU C Library.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library; if not, see
<http://www.gnu.org/licenses/>. */
#include <sysdep.h>
#include <math_ldbl_opt.h>
/* Redefine the symbol-aliasing macros as empty so that the implementation
   included below contributes only its entry point; every hidden_def,
   weak_alias, strong_alias and compat_symbol use in it expands to nothing.  */
#undef hidden_def
#define hidden_def(name)
#undef weak_alias
#define weak_alias(name, alias)
#undef strong_alias
#define strong_alias(name, alias)
#undef compat_symbol
#define compat_symbol(lib, name, symbol, ver)
/* Rename the entry point: the included code is assembled under the name
   __finite_power8 instead of __finite.  */
#define __finite __finite_power8
#include <sysdeps/powerpc/powerpc64/power8/fpu/s_finite.S>

View File

@ -23,10 +23,13 @@
extern __typeof (__finite) __finite_ppc64 attribute_hidden;
extern __typeof (__finite) __finite_power7 attribute_hidden;
extern __typeof (__finite) __finite_power8 attribute_hidden;
libc_ifunc (__finite,
(hwcap & PPC_FEATURE_ARCH_2_06)
? __finite_power7
(hwcap2 & PPC_FEATURE2_ARCH_2_07)
? __finite_power8 :
(hwcap & PPC_FEATURE_ARCH_2_06)
? __finite_power7
: __finite_ppc64);
weak_alias (__finite, finite)

View File

@ -23,10 +23,13 @@
extern __typeof (__finitef) __finitef_ppc64 attribute_hidden;
/* The double-precision version also works for single-precision. */
extern __typeof (__finitef) __finite_power7 attribute_hidden;
extern __typeof (__finitef) __finite_power8 attribute_hidden;
libc_ifunc (__finitef,
(hwcap & PPC_FEATURE_ARCH_2_06)
? __finite_power7
(hwcap2 & PPC_FEATURE2_ARCH_2_07)
? __finite_power8 :
(hwcap & PPC_FEATURE_ARCH_2_06)
? __finite_power7
: __finitef_ppc64);
weak_alias (__finitef, finitef)

View File

@ -0,0 +1,56 @@
/* isfinite(). PowerPC64/POWER8 version.
Copyright (C) 2014 Free Software Foundation, Inc.
This file is part of the GNU C Library.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library; if not, see
<http://www.gnu.org/licenses/>. */
#include <sysdep.h>
#include <math_ldbl_opt.h>
/* Hand-encoded "mfvsrd r3,vs1" for assemblers that do not know the
   mnemonic.  It is emitted as one 32-bit word so the assembler stores it in
   the target's byte order; a fixed .byte sequence would come out
   byte-reversed on a little-endian target.  */
#define MFVSRD_R3_V1 .long 0x7c230066 /* mfvsrd r3,vs1 */
/* int [r3] __finite ([fp1] x)
   Returns 1 in r3 when x is finite and 0 when x is +-Inf or NaN.  */
EALIGN (__finite, 4, 0)
CALL_MCOUNT 0
MFVSRD_R3_V1 /* r3 = raw 64-bit image of x */
lis r9,0x8010 /* r9 = 0xffffffff80100000 (lis sign-extends) */
clrldi r3,r3,1 /* r3 = r3 & 0x7fffffffffffffff (drop the sign bit) */
rldicr r9,r9,32,31 /* r9 = (r9 << 32) & 0xffffffff00000000 = 0x8010000000000000 */
add r3,r3,r9 /* wraps past 2^64 only when the exponent field is all ones */
rldicl r3,r3,1,63 /* r3 = top bit of the sum: 1 = finite, 0 = Inf/NaN */
blr
END (__finite)
hidden_def (__finite)
weak_alias (__finite, finite)
/* It turns out that the 'double' version will also always work for
single-precision. */
strong_alias (__finite, __finitef)
hidden_def (__finitef)
weak_alias (__finitef, finitef)
#ifdef IS_IN_libm
# if LONG_DOUBLE_COMPAT (libm, GLIBC_2_0)
compat_symbol (libm, __finite, __finitel, GLIBC_2_0)
compat_symbol (libm, finite, finitel, GLIBC_2_0)
# endif
#else
# if LONG_DOUBLE_COMPAT (libc, GLIBC_2_0)
compat_symbol (libc, __finite, __finitel, GLIBC_2_0);
compat_symbol (libc, finite, finitel, GLIBC_2_0);
# endif
#endif

View File

@ -0,0 +1 @@
/* This function uses the same code as s_finite.S. */