mirror of
https://sourceware.org/git/glibc.git
synced 2024-12-11 05:40:06 +00:00
71ae86478e
This patch adds an optimized memset implementation for POWER8. For sizes from 0 to 255 bytes, a word/doubleword algorithm similar to POWER7 optimized one is used. For size higher than 255 two strategies are used: 1. If the constant is different than 0, the memory is written with altivec vector instruction; 2. If constant is 0, dbcz instructions are used. The loop is unrolled to clear 512 byte at time. Using vector instructions increases throughput considerable, with a double performance for sizes larger than 1024. The dcbz loops unrolls also shows performance improvement, by doubling throughput for sizes larger than 8192 bytes.
333 lines
12 KiB
C
333 lines
12 KiB
C
/* Enumerate available IFUNC implementations of a function. PowerPC64 version.
|
|
Copyright (C) 2013-2014 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#include <assert.h>
|
|
#include <string.h>
|
|
#include <wchar.h>
|
|
#include <ldsodefs.h>
|
|
#include <ifunc-impl-list.h>
|
|
|
|
/* Maximum number of IFUNC implementations. */
|
|
#define MAX_IFUNC 6
|
|
|
|
size_t
|
|
__libc_ifunc_impl_list (const char *name, struct libc_ifunc_impl *array,
|
|
size_t max)
|
|
{
|
|
assert (max >= MAX_IFUNC);
|
|
|
|
size_t i = 0;
|
|
|
|
unsigned long int hwcap = GLRO(dl_hwcap);
|
|
unsigned long int hwcap2 = GLRO(dl_hwcap2);
|
|
|
|
/* hwcap contains only the latest supported ISA, the code checks which is
|
|
and fills the previous supported ones. */
|
|
if (hwcap & PPC_FEATURE_ARCH_2_06)
|
|
hwcap |= PPC_FEATURE_ARCH_2_05 | PPC_FEATURE_POWER5_PLUS |
|
|
PPC_FEATURE_POWER5 | PPC_FEATURE_POWER4;
|
|
else if (hwcap & PPC_FEATURE_ARCH_2_05)
|
|
hwcap |= PPC_FEATURE_POWER5_PLUS | PPC_FEATURE_POWER5 | PPC_FEATURE_POWER4;
|
|
else if (hwcap & PPC_FEATURE_POWER5_PLUS)
|
|
hwcap |= PPC_FEATURE_POWER5 | PPC_FEATURE_POWER4;
|
|
else if (hwcap & PPC_FEATURE_POWER5)
|
|
hwcap |= PPC_FEATURE_POWER4;
|
|
|
|
#ifdef SHARED
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memcpy.c. */
|
|
IFUNC_IMPL (i, name, memcpy,
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__memcpy_power7)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_ARCH_2_06,
|
|
__memcpy_a2)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_ARCH_2_05,
|
|
__memcpy_power6)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_CELL_BE,
|
|
__memcpy_cell)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_POWER4,
|
|
__memcpy_power4)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1, __memcpy_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memmove.c. */
|
|
IFUNC_IMPL (i, name, memmove,
|
|
IFUNC_IMPL_ADD (array, i, memmove, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__memmove_power7)
|
|
IFUNC_IMPL_ADD (array, i, memmove, 1, __memmove_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memset.c. */
|
|
IFUNC_IMPL (i, name, memset,
|
|
IFUNC_IMPL_ADD (array, i, memset, hwcap2 & PPC_FEATURE2_ARCH_2_07,
|
|
__memset_power8)
|
|
IFUNC_IMPL_ADD (array, i, memset, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__memset_power7)
|
|
IFUNC_IMPL_ADD (array, i, memset, hwcap & PPC_FEATURE_ARCH_2_05,
|
|
__memset_power6)
|
|
IFUNC_IMPL_ADD (array, i, memset, hwcap & PPC_FEATURE_POWER4,
|
|
__memset_power4)
|
|
IFUNC_IMPL_ADD (array, i, memset, 1, __memset_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcpy.c. */
|
|
IFUNC_IMPL (i, name, strcpy,
|
|
IFUNC_IMPL_ADD (array, i, strcpy, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strcpy_power7)
|
|
IFUNC_IMPL_ADD (array, i, strcpy, 1,
|
|
__strcpy_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/stpcpy.c. */
|
|
IFUNC_IMPL (i, name, stpcpy,
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__stpcpy_power7)
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, 1,
|
|
__stpcpy_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strlen.c. */
|
|
IFUNC_IMPL (i, name, strlen,
|
|
IFUNC_IMPL_ADD (array, i, strlen, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strlen_power7)
|
|
IFUNC_IMPL_ADD (array, i, strlen, 1,
|
|
__strlen_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncmp.c. */
|
|
IFUNC_IMPL (i, name, strncmp,
|
|
IFUNC_IMPL_ADD (array, i, strncmp, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strncmp_power7)
|
|
IFUNC_IMPL_ADD (array, i, strncmp, hwcap & PPC_FEATURE_POWER4,
|
|
__strncmp_power4)
|
|
IFUNC_IMPL_ADD (array, i, strncmp, 1,
|
|
__strncmp_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strchr.c. */
|
|
IFUNC_IMPL (i, name, strchr,
|
|
IFUNC_IMPL_ADD (array, i, strchr,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strchr_power7)
|
|
IFUNC_IMPL_ADD (array, i, strchr, 1,
|
|
__strchr_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strchrnul.c. */
|
|
IFUNC_IMPL (i, name, strchrnul,
|
|
IFUNC_IMPL_ADD (array, i, strchrnul,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strchrnul_power7)
|
|
IFUNC_IMPL_ADD (array, i, strchrnul, 1,
|
|
__strchrnul_ppc))
|
|
#endif
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memcmp.c. */
|
|
IFUNC_IMPL (i, name, memcmp,
|
|
IFUNC_IMPL_ADD (array, i, memcmp, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__memcmp_power7)
|
|
IFUNC_IMPL_ADD (array, i, memcmp, hwcap & PPC_FEATURE_POWER4,
|
|
__memcmp_power4)
|
|
IFUNC_IMPL_ADD (array, i, memcmp, 1, __memcmp_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/bzero.c. */
|
|
IFUNC_IMPL (i, name, bzero,
|
|
IFUNC_IMPL_ADD (array, i, bzero, hwcap2 & PPC_FEATURE2_ARCH_2_07,
|
|
__bzero_power8)
|
|
IFUNC_IMPL_ADD (array, i, bzero, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__bzero_power7)
|
|
IFUNC_IMPL_ADD (array, i, bzero, hwcap & PPC_FEATURE_ARCH_2_05,
|
|
__bzero_power6)
|
|
IFUNC_IMPL_ADD (array, i, bzero, hwcap & PPC_FEATURE_POWER4,
|
|
__bzero_power4)
|
|
IFUNC_IMPL_ADD (array, i, bzero, 1, __bzero_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/bcopy.c. */
|
|
IFUNC_IMPL (i, name, bcopy,
|
|
IFUNC_IMPL_ADD (array, i, bcopy, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__bcopy_power7)
|
|
IFUNC_IMPL_ADD (array, i, bcopy, 1, __bcopy_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/mempcpy.c. */
|
|
IFUNC_IMPL (i, name, mempcpy,
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__mempcpy_power7)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, 1,
|
|
__mempcpy_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memchr.c. */
|
|
IFUNC_IMPL (i, name, memchr,
|
|
IFUNC_IMPL_ADD (array, i, memchr,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__memchr_power7)
|
|
IFUNC_IMPL_ADD (array, i, memchr, 1,
|
|
__memchr_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memrchr.c. */
|
|
IFUNC_IMPL (i, name, memrchr,
|
|
IFUNC_IMPL_ADD (array, i, memrchr,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__memrchr_power7)
|
|
IFUNC_IMPL_ADD (array, i, memrchr, 1,
|
|
__memrchr_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/rawmemchr.c. */
|
|
IFUNC_IMPL (i, name, rawmemchr,
|
|
IFUNC_IMPL_ADD (array, i, rawmemchr,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__rawmemchr_power7)
|
|
IFUNC_IMPL_ADD (array, i, rawmemchr, 1,
|
|
__rawmemchr_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strnlen.c. */
|
|
IFUNC_IMPL (i, name, strnlen,
|
|
IFUNC_IMPL_ADD (array, i, strnlen, hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strnlen_power7)
|
|
IFUNC_IMPL_ADD (array, i, strnlen, 1,
|
|
__strnlen_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcasecmp.c. */
|
|
IFUNC_IMPL (i, name, strcasecmp,
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strcasecmp_power7)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp, 1, __strcasecmp_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcasecmp_l.c. */
|
|
IFUNC_IMPL (i, name, strcasecmp_l,
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strcasecmp_l_power7)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l, 1,
|
|
__strcasecmp_l_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncase.c. */
|
|
IFUNC_IMPL (i, name, strncasecmp,
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strncasecmp_power7)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp, 1, __strncasecmp_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncase_l.c. */
|
|
IFUNC_IMPL (i, name, strncasecmp_l,
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strncasecmp_l_power7)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l, 1,
|
|
__strncasecmp_l_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/wcschr.c. */
|
|
IFUNC_IMPL (i, name, wcschr,
|
|
IFUNC_IMPL_ADD (array, i, wcschr,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__wcschr_power7)
|
|
IFUNC_IMPL_ADD (array, i, wcschr,
|
|
hwcap & PPC_FEATURE_ARCH_2_05,
|
|
__wcschr_power6)
|
|
IFUNC_IMPL_ADD (array, i, wcschr, 1,
|
|
__wcschr_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/wcschr.c. */
|
|
IFUNC_IMPL (i, name, wcsrchr,
|
|
IFUNC_IMPL_ADD (array, i, wcsrchr,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__wcsrchr_power7)
|
|
IFUNC_IMPL_ADD (array, i, wcsrchr,
|
|
hwcap & PPC_FEATURE_ARCH_2_05,
|
|
__wcsrchr_power6)
|
|
IFUNC_IMPL_ADD (array, i, wcsrchr, 1,
|
|
__wcsrchr_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/wcscpy.c. */
|
|
IFUNC_IMPL (i, name, wcscpy,
|
|
IFUNC_IMPL_ADD (array, i, wcscpy,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__wcscpy_power7)
|
|
IFUNC_IMPL_ADD (array, i, wcscpy,
|
|
hwcap & PPC_FEATURE_ARCH_2_05,
|
|
__wcscpy_power6)
|
|
IFUNC_IMPL_ADD (array, i, wcscpy, 1,
|
|
__wcscpy_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strrchr.c. */
|
|
IFUNC_IMPL (i, name, strrchr,
|
|
IFUNC_IMPL_ADD (array, i, strrchr,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strrchr_power7)
|
|
IFUNC_IMPL_ADD (array, i, strrchr, 1,
|
|
__strrchr_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncat.c. */
|
|
IFUNC_IMPL (i, name, strncat,
|
|
IFUNC_IMPL_ADD (array, i, strncat,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strncat_power7)
|
|
IFUNC_IMPL_ADD (array, i, strncat, 1,
|
|
__strncat_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strspn.c. */
|
|
IFUNC_IMPL (i, name, strspn,
|
|
IFUNC_IMPL_ADD (array, i, strspn,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strspn_power7)
|
|
IFUNC_IMPL_ADD (array, i, strspn, 1,
|
|
__strspn_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcspn.c. */
|
|
IFUNC_IMPL (i, name, strcspn,
|
|
IFUNC_IMPL_ADD (array, i, strcspn,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strcspn_power7)
|
|
IFUNC_IMPL_ADD (array, i, strcspn, 1,
|
|
__strcspn_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strpbrk.c. */
|
|
IFUNC_IMPL (i, name, strpbrk,
|
|
IFUNC_IMPL_ADD (array, i, strpbrk,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strpbrk_power7)
|
|
IFUNC_IMPL_ADD (array, i, strpbrk, 1,
|
|
__strpbrk_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncpy.c. */
|
|
IFUNC_IMPL (i, name, strncpy,
|
|
IFUNC_IMPL_ADD (array, i, strncpy,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strncpy_power7)
|
|
IFUNC_IMPL_ADD (array, i, strncpy, 1,
|
|
__strncpy_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/stpncpy.c. */
|
|
IFUNC_IMPL (i, name, stpncpy,
|
|
IFUNC_IMPL_ADD (array, i, stpncpy,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__stpncpy_power7)
|
|
IFUNC_IMPL_ADD (array, i, stpncpy, 1,
|
|
__stpncpy_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcmp.c. */
|
|
IFUNC_IMPL (i, name, strcmp,
|
|
IFUNC_IMPL_ADD (array, i, strcmp,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strcmp_power7)
|
|
IFUNC_IMPL_ADD (array, i, strcmp, 1,
|
|
__strcmp_ppc))
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcat.c. */
|
|
IFUNC_IMPL (i, name, strcat,
|
|
IFUNC_IMPL_ADD (array, i, strcat,
|
|
hwcap & PPC_FEATURE_HAS_VSX,
|
|
__strcat_power7)
|
|
IFUNC_IMPL_ADD (array, i, strcat, 1,
|
|
__strcat_ppc))
|
|
|
|
return i;
|
|
}
|