mirror of
https://sourceware.org/git/glibc.git
synced 2024-12-27 05:00:15 +00:00
830566307f
Implement x86-64 memset with unaligned store and rep stosb. Support 16-byte, 32-byte and 64-byte vector register sizes. A single file provides 2 implementations of memset, one with rep stosb and the other without rep stosb. They share the same code when size is between 2 times the vector register size and REP_STOSB_THRESHOLD, which defaults to 2KB. Key features: 1. Use overlapping stores to avoid branches. 2. For size <= 4 times the vector register size, fully unroll the loop. 3. For size > 4 times the vector register size, store 4 times the vector register size at a time. [BZ #19881] * sysdeps/x86_64/multiarch/Makefile (sysdep_routines): Add memset-sse2-unaligned-erms, memset-avx2-unaligned-erms and memset-avx512-unaligned-erms. * sysdeps/x86_64/multiarch/ifunc-impl-list.c (__libc_ifunc_impl_list): Test __memset_chk_sse2_unaligned, __memset_chk_sse2_unaligned_erms, __memset_chk_avx2_unaligned, __memset_chk_avx2_unaligned_erms, __memset_chk_avx512_unaligned, __memset_chk_avx512_unaligned_erms, __memset_sse2_unaligned, __memset_sse2_unaligned_erms, __memset_erms, __memset_avx2_unaligned, __memset_avx2_unaligned_erms, __memset_avx512_unaligned_erms and __memset_avx512_unaligned. * sysdeps/x86_64/multiarch/memset-avx2-unaligned-erms.S: New file. * sysdeps/x86_64/multiarch/memset-avx512-unaligned-erms.S: Likewise. * sysdeps/x86_64/multiarch/memset-sse2-unaligned-erms.S: Likewise. * sysdeps/x86_64/multiarch/memset-vec-unaligned-erms.S: Likewise.
478 lines
18 KiB
C
478 lines
18 KiB
C
/* Enumerate available IFUNC implementations of a function. x86-64 version.
|
|
Copyright (C) 2012-2016 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#include <assert.h>
|
|
#include <string.h>
|
|
#include <wchar.h>
|
|
#include <ifunc-impl-list.h>
|
|
#include <sysdep.h>
|
|
#include "init-arch.h"
|
|
|
|
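/* Lower bound on the size of the caller-supplied array; it is only
   used by the assertion at the top of __libc_ifunc_impl_list.
   NOTE(review): historically described as the maximum number of IFUNC
   implementations, but several lists in this file register more than
   5 entries (memcpy registers up to 13) -- confirm that callers pass
   an array large enough for the longest list.  */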
|
|
#define MAX_IFUNC 5
|
|
|
|
/* Fill ARRAY of MAX elements with IFUNC implementations for function
|
|
NAME supported on target machine and return the number of valid
|
|
entries. */
|
|
|
|
size_t
|
|
__libc_ifunc_impl_list (const char *name, struct libc_ifunc_impl *array,
|
|
size_t max)
|
|
{
|
|
assert (max >= MAX_IFUNC);
|
|
|
|
size_t i = 0;
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memcmp.S. */
|
|
IFUNC_IMPL (i, name, memcmp,
|
|
IFUNC_IMPL_ADD (array, i, memcmp, HAS_CPU_FEATURE (SSE4_1),
|
|
__memcmp_sse4_1)
|
|
IFUNC_IMPL_ADD (array, i, memcmp, HAS_CPU_FEATURE (SSSE3),
|
|
__memcmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, memcmp, 1, __memcmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memmove_chk.c. */
|
|
IFUNC_IMPL (i, name, __memmove_chk,
|
|
#ifdef HAVE_AVX512_ASM_SUPPORT
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_chk_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_chk_avx512_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_chk_avx512_unaligned_erms)
|
|
#endif
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_chk_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_chk_avx_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_chk_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__memmove_chk_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__memmove_chk_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk, 1,
|
|
__memmove_chk_sse2_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk, 1,
|
|
__memmove_chk_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk, 1,
|
|
__memmove_chk_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memmove.S. */
|
|
IFUNC_IMPL (i, name, memmove,
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_avx_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_avx_unaligned_erms)
|
|
#ifdef HAVE_AVX512_ASM_SUPPORT
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_avx512_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_avx512_unaligned_erms)
|
|
#endif
|
|
IFUNC_IMPL_ADD (array, i, memmove, HAS_CPU_FEATURE (SSSE3),
|
|
__memmove_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, memmove, HAS_CPU_FEATURE (SSSE3),
|
|
__memmove_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, memmove, 1, __memmove_erms)
|
|
IFUNC_IMPL_ADD (array, i, memmove, 1,
|
|
__memmove_sse2_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, memmove, 1,
|
|
__memmove_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memmove, 1, __memmove_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memset_chk.S. */
|
|
IFUNC_IMPL (i, name, __memset_chk,
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk, 1,
|
|
__memset_chk_sse2)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk, 1,
|
|
__memset_chk_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk, 1,
|
|
__memset_chk_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_chk_avx2)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_chk_avx2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_chk_avx2_unaligned_erms)
|
|
#ifdef HAVE_AVX512_ASM_SUPPORT
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_chk_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_chk_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_chk_avx512_no_vzeroupper)
|
|
#endif
|
|
)
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memset.S. */
|
|
IFUNC_IMPL (i, name, memset,
|
|
IFUNC_IMPL_ADD (array, i, memset, 1, __memset_sse2)
|
|
IFUNC_IMPL_ADD (array, i, memset, 1,
|
|
__memset_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memset, 1,
|
|
__memset_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memset, 1, __memset_erms)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_avx2)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_avx2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_avx2_unaligned_erms)
|
|
#ifdef HAVE_AVX512_ASM_SUPPORT
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_avx512_no_vzeroupper)
|
|
#endif
|
|
)
|
|
|
|
/* Support sysdeps/x86_64/multiarch/stpncpy.S. */
|
|
IFUNC_IMPL (i, name, stpncpy,
|
|
IFUNC_IMPL_ADD (array, i, stpncpy, HAS_CPU_FEATURE (SSSE3),
|
|
__stpncpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, stpncpy, 1,
|
|
__stpncpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, stpncpy, 1, __stpncpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/stpcpy.S. */
|
|
IFUNC_IMPL (i, name, stpcpy,
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__stpcpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, 1, __stpcpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, 1, __stpcpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcasecmp_l.S. */
|
|
IFUNC_IMPL (i, name, strcasecmp,
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__strcasecmp_avx)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp,
|
|
HAS_CPU_FEATURE (SSE4_2),
|
|
__strcasecmp_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__strcasecmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp, 1, __strcasecmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcasecmp_l.S. */
|
|
IFUNC_IMPL (i, name, strcasecmp_l,
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__strcasecmp_l_avx)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l,
|
|
HAS_CPU_FEATURE (SSE4_2),
|
|
__strcasecmp_l_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__strcasecmp_l_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l, 1,
|
|
__strcasecmp_l_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcat.S. */
|
|
IFUNC_IMPL (i, name, strcat,
|
|
IFUNC_IMPL_ADD (array, i, strcat, HAS_CPU_FEATURE (SSSE3),
|
|
__strcat_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcat, 1, __strcat_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strcat, 1, __strcat_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strchr.S. */
|
|
IFUNC_IMPL (i, name, strchr,
|
|
IFUNC_IMPL_ADD (array, i, strchr, 1, __strchr_sse2_no_bsf)
|
|
IFUNC_IMPL_ADD (array, i, strchr, 1, __strchr_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcmp.S. */
|
|
IFUNC_IMPL (i, name, strcmp,
|
|
IFUNC_IMPL_ADD (array, i, strcmp, HAS_CPU_FEATURE (SSE4_2),
|
|
__strcmp_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strcmp, HAS_CPU_FEATURE (SSSE3),
|
|
__strcmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcmp, 1, __strcmp_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strcmp, 1, __strcmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcpy.S. */
|
|
IFUNC_IMPL (i, name, strcpy,
|
|
IFUNC_IMPL_ADD (array, i, strcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__strcpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcpy, 1, __strcpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strcpy, 1, __strcpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcspn.S. */
|
|
IFUNC_IMPL (i, name, strcspn,
|
|
IFUNC_IMPL_ADD (array, i, strcspn, HAS_CPU_FEATURE (SSE4_2),
|
|
__strcspn_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strcspn, 1, __strcspn_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncase_l.S. */
|
|
IFUNC_IMPL (i, name, strncasecmp,
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__strncasecmp_avx)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp,
|
|
HAS_CPU_FEATURE (SSE4_2),
|
|
__strncasecmp_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__strncasecmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp, 1,
|
|
__strncasecmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncase_l.S. */
|
|
IFUNC_IMPL (i, name, strncasecmp_l,
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__strncasecmp_l_avx)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l,
|
|
HAS_CPU_FEATURE (SSE4_2),
|
|
__strncasecmp_l_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__strncasecmp_l_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l, 1,
|
|
__strncasecmp_l_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncat.S. */
|
|
IFUNC_IMPL (i, name, strncat,
|
|
IFUNC_IMPL_ADD (array, i, strncat, HAS_CPU_FEATURE (SSSE3),
|
|
__strncat_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncat, 1,
|
|
__strncat_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strncat, 1, __strncat_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncpy.S. */
|
|
IFUNC_IMPL (i, name, strncpy,
|
|
IFUNC_IMPL_ADD (array, i, strncpy, HAS_CPU_FEATURE (SSSE3),
|
|
__strncpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncpy, 1,
|
|
__strncpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strncpy, 1, __strncpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strpbrk.S. */
|
|
IFUNC_IMPL (i, name, strpbrk,
|
|
IFUNC_IMPL_ADD (array, i, strpbrk, HAS_CPU_FEATURE (SSE4_2),
|
|
__strpbrk_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strpbrk, 1, __strpbrk_sse2))
|
|
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strspn.S. */
|
|
IFUNC_IMPL (i, name, strspn,
|
|
IFUNC_IMPL_ADD (array, i, strspn, HAS_CPU_FEATURE (SSE4_2),
|
|
__strspn_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strspn, 1, __strspn_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strstr.c. */
|
|
IFUNC_IMPL (i, name, strstr,
|
|
IFUNC_IMPL_ADD (array, i, strstr, 1, __strstr_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strstr, 1, __strstr_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/wcscpy.S. */
|
|
IFUNC_IMPL (i, name, wcscpy,
|
|
IFUNC_IMPL_ADD (array, i, wcscpy, HAS_CPU_FEATURE (SSSE3),
|
|
__wcscpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, wcscpy, 1, __wcscpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/wmemcmp.S. */
|
|
IFUNC_IMPL (i, name, wmemcmp,
|
|
IFUNC_IMPL_ADD (array, i, wmemcmp, HAS_CPU_FEATURE (SSE4_1),
|
|
__wmemcmp_sse4_1)
|
|
IFUNC_IMPL_ADD (array, i, wmemcmp, HAS_CPU_FEATURE (SSSE3),
|
|
__wmemcmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, wmemcmp, 1, __wmemcmp_sse2))
|
|
|
|
#ifdef SHARED
|
|
/* Support sysdeps/x86_64/multiarch/memcpy_chk.S. */
|
|
IFUNC_IMPL (i, name, __memcpy_chk,
|
|
#ifdef HAVE_AVX512_ASM_SUPPORT
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_chk_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_chk_avx512_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_chk_avx512_unaligned_erms)
|
|
#endif
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_chk_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_chk_avx_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_chk_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__memcpy_chk_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__memcpy_chk_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk, 1,
|
|
__memcpy_chk_sse2_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk, 1,
|
|
__memcpy_chk_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk, 1,
|
|
__memcpy_chk_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memcpy.S. */
|
|
IFUNC_IMPL (i, name, memcpy,
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_avx_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__memcpy_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__memcpy_ssse3)
|
|
#ifdef HAVE_AVX512_ASM_SUPPORT
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_avx512_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_avx512_unaligned_erms)
|
|
#endif
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1, __memcpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1,
|
|
__memcpy_sse2_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1,
|
|
__memcpy_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1, __memcpy_erms)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1, __memcpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/mempcpy_chk.S. */
|
|
IFUNC_IMPL (i, name, __mempcpy_chk,
|
|
#ifdef HAVE_AVX512_ASM_SUPPORT
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_chk_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_chk_avx512_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_chk_avx512_unaligned_erms)
|
|
#endif
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_chk_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_chk_avx_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_chk_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__mempcpy_chk_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__mempcpy_chk_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk, 1,
|
|
__mempcpy_chk_sse2_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk, 1,
|
|
__mempcpy_chk_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk, 1,
|
|
__mempcpy_chk_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/mempcpy.S. */
|
|
IFUNC_IMPL (i, name, mempcpy,
|
|
#ifdef HAVE_AVX512_ASM_SUPPORT
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_avx512_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_avx512_unaligned_erms)
|
|
#endif
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_avx_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__mempcpy_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__mempcpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, 1,
|
|
__mempcpy_sse2_unaligned_2)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, 1,
|
|
__mempcpy_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, 1, __mempcpy_erms)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, 1, __mempcpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncmp.S. */
|
|
IFUNC_IMPL (i, name, strncmp,
|
|
IFUNC_IMPL_ADD (array, i, strncmp, HAS_CPU_FEATURE (SSE4_2),
|
|
__strncmp_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strncmp, HAS_CPU_FEATURE (SSSE3),
|
|
__strncmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncmp, 1, __strncmp_sse2))
|
|
#endif
|
|
|
|
return i;
|
|
}
|