mirror of
https://sourceware.org/git/glibc.git
synced 2024-11-30 00:31:08 +00:00
dc485ceb2a
Optimize strlen/strnlen/wcslen/wcsnlen with AVX2 to check 32 bytes with a single vector compare instruction. It is as fast as SSE2 versions for size <= 16 bytes and up to 1X faster for or size > 16 bytes on Haswell. Select AVX2 version on AVX2 machines where vzeroupper is preferred and AVX unaligned load is fast. NB: It uses TZCNT instead of BSF since TZCNT produces the same result as BSF for non-zero input. TZCNT is faster than BSF and is executed as BSF if machine doesn't support TZCNT. * sysdeps/x86_64/multiarch/Makefile (sysdep_routines): Add strlen-sse2, strnlen-sse2, strlen-avx2, strnlen-avx2, wcslen-sse2, wcslen-avx2 and wcsnlen-avx2. * sysdeps/x86_64/multiarch/ifunc-impl-list.c (__libc_ifunc_impl_list): Add tests for __strlen_avx2, __strlen_sse2, __strnlen_avx2, __strnlen_sse2, __wcslen_avx2, __wcslen_sse2 and __wcsnlen_avx2. * sysdeps/x86_64/multiarch/strlen-avx2.S: New file. * sysdeps/x86_64/multiarch/strlen-sse2.S: Likewise. * sysdeps/x86_64/multiarch/strlen.c: Likewise. * sysdeps/x86_64/multiarch/strnlen-avx2.S: Likewise. * sysdeps/x86_64/multiarch/strnlen-sse2.S: Likewise. * sysdeps/x86_64/multiarch/strnlen.c: Likewise. * sysdeps/x86_64/multiarch/wcslen-avx2.S: Likewise. * sysdeps/x86_64/multiarch/wcslen-sse2.S: Likewise. * sysdeps/x86_64/multiarch/wcslen.c: Likewise. * sysdeps/x86_64/multiarch/wcsnlen-avx2.S: Likewise. * sysdeps/x86_64/multiarch/wcsnlen.c (OPTIMIZE (avx2)): New. (IFUNC_SELECTOR): Return OPTIMIZE (avx2) on AVX2 machines where vzeroupper is preferred and AVX unaligned load is fast.
506 lines
19 KiB
C
506 lines
19 KiB
C
/* Enumerate available IFUNC implementations of a function. x86-64 version.
|
|
Copyright (C) 2012-2017 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#include <assert.h>
|
|
#include <string.h>
|
|
#include <wchar.h>
|
|
#include <ifunc-impl-list.h>
|
|
#include <sysdep.h>
|
|
#include "init-arch.h"
|
|
|
|
/* Maximum number of IFUNC implementations. */
|
|
#define MAX_IFUNC 5
|
|
|
|
/* Fill ARRAY of MAX elements with IFUNC implementations for function
|
|
NAME supported on target machine and return the number of valid
|
|
entries. */
|
|
|
|
size_t
|
|
__libc_ifunc_impl_list (const char *name, struct libc_ifunc_impl *array,
|
|
size_t max)
|
|
{
|
|
assert (max >= MAX_IFUNC);
|
|
|
|
size_t i = 0;
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memchr.S. */
|
|
IFUNC_IMPL (i, name, memchr,
|
|
IFUNC_IMPL_ADD (array, i, memchr,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memchr_avx2)
|
|
IFUNC_IMPL_ADD (array, i, memchr, 1, __memchr_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memcmp.S. */
|
|
IFUNC_IMPL (i, name, memcmp,
|
|
IFUNC_IMPL_ADD (array, i, memcmp,
|
|
(HAS_ARCH_FEATURE (AVX2_Usable)
|
|
&& HAS_CPU_FEATURE (MOVBE)),
|
|
__memcmp_avx2_movbe)
|
|
IFUNC_IMPL_ADD (array, i, memcmp, HAS_CPU_FEATURE (SSE4_1),
|
|
__memcmp_sse4_1)
|
|
IFUNC_IMPL_ADD (array, i, memcmp, HAS_CPU_FEATURE (SSSE3),
|
|
__memcmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, memcmp, 1, __memcmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memmove_chk.c. */
|
|
IFUNC_IMPL (i, name, __memmove_chk,
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_chk_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_chk_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_chk_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_chk_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_chk_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__memmove_chk_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__memmove_chk_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk, 1,
|
|
__memmove_chk_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memmove_chk, 1,
|
|
__memmove_chk_sse2_unaligned_erms))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memmove.S. */
|
|
IFUNC_IMPL (i, name, memmove,
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memmove_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memmove_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memmove, HAS_CPU_FEATURE (SSSE3),
|
|
__memmove_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, memmove, HAS_CPU_FEATURE (SSSE3),
|
|
__memmove_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, memmove, 1, __memmove_erms)
|
|
IFUNC_IMPL_ADD (array, i, memmove, 1,
|
|
__memmove_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memmove, 1,
|
|
__memmove_sse2_unaligned_erms))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memset_chk.S. */
|
|
IFUNC_IMPL (i, name, __memset_chk,
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk, 1,
|
|
__memset_chk_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk, 1,
|
|
__memset_chk_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_chk_avx2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_chk_avx2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_chk_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_chk_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memset_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_chk_avx512_no_vzeroupper)
|
|
)
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memset.S. */
|
|
IFUNC_IMPL (i, name, memset,
|
|
IFUNC_IMPL_ADD (array, i, memset, 1,
|
|
__memset_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memset, 1,
|
|
__memset_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memset, 1, __memset_erms)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_avx2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__memset_avx2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memset_avx512_no_vzeroupper)
|
|
)
|
|
|
|
/* Support sysdeps/x86_64/multiarch/rawmemchr.S. */
|
|
IFUNC_IMPL (i, name, rawmemchr,
|
|
IFUNC_IMPL_ADD (array, i, rawmemchr,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__rawmemchr_avx2)
|
|
IFUNC_IMPL_ADD (array, i, rawmemchr, 1, __rawmemchr_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strlen.S. */
|
|
IFUNC_IMPL (i, name, strlen,
|
|
IFUNC_IMPL_ADD (array, i, strlen,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__strlen_avx2)
|
|
IFUNC_IMPL_ADD (array, i, strlen, 1, __strlen_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strnlen.S. */
|
|
IFUNC_IMPL (i, name, strnlen,
|
|
IFUNC_IMPL_ADD (array, i, strnlen,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__strnlen_avx2)
|
|
IFUNC_IMPL_ADD (array, i, strnlen, 1, __strnlen_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/stpncpy.S. */
|
|
IFUNC_IMPL (i, name, stpncpy,
|
|
IFUNC_IMPL_ADD (array, i, stpncpy, HAS_CPU_FEATURE (SSSE3),
|
|
__stpncpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, stpncpy, 1,
|
|
__stpncpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, stpncpy, 1, __stpncpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/stpcpy.S. */
|
|
IFUNC_IMPL (i, name, stpcpy,
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__stpcpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, 1, __stpcpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, 1, __stpcpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcasecmp_l.S. */
|
|
IFUNC_IMPL (i, name, strcasecmp,
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__strcasecmp_avx)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp,
|
|
HAS_CPU_FEATURE (SSE4_2),
|
|
__strcasecmp_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__strcasecmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp, 1, __strcasecmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcasecmp_l.S. */
|
|
IFUNC_IMPL (i, name, strcasecmp_l,
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__strcasecmp_l_avx)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l,
|
|
HAS_CPU_FEATURE (SSE4_2),
|
|
__strcasecmp_l_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__strcasecmp_l_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l, 1,
|
|
__strcasecmp_l_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcat.S. */
|
|
IFUNC_IMPL (i, name, strcat,
|
|
IFUNC_IMPL_ADD (array, i, strcat, HAS_CPU_FEATURE (SSSE3),
|
|
__strcat_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcat, 1, __strcat_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strcat, 1, __strcat_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strchr.S. */
|
|
IFUNC_IMPL (i, name, strchr,
|
|
IFUNC_IMPL_ADD (array, i, strchr, 1, __strchr_sse2_no_bsf)
|
|
IFUNC_IMPL_ADD (array, i, strchr, 1, __strchr_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcmp.S. */
|
|
IFUNC_IMPL (i, name, strcmp,
|
|
IFUNC_IMPL_ADD (array, i, strcmp, HAS_CPU_FEATURE (SSE4_2),
|
|
__strcmp_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strcmp, HAS_CPU_FEATURE (SSSE3),
|
|
__strcmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcmp, 1, __strcmp_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strcmp, 1, __strcmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcpy.S. */
|
|
IFUNC_IMPL (i, name, strcpy,
|
|
IFUNC_IMPL_ADD (array, i, strcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__strcpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strcpy, 1, __strcpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strcpy, 1, __strcpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strcspn.S. */
|
|
IFUNC_IMPL (i, name, strcspn,
|
|
IFUNC_IMPL_ADD (array, i, strcspn, HAS_CPU_FEATURE (SSE4_2),
|
|
__strcspn_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strcspn, 1, __strcspn_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncase_l.S. */
|
|
IFUNC_IMPL (i, name, strncasecmp,
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__strncasecmp_avx)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp,
|
|
HAS_CPU_FEATURE (SSE4_2),
|
|
__strncasecmp_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__strncasecmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp, 1,
|
|
__strncasecmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncase_l.S. */
|
|
IFUNC_IMPL (i, name, strncasecmp_l,
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__strncasecmp_l_avx)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l,
|
|
HAS_CPU_FEATURE (SSE4_2),
|
|
__strncasecmp_l_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__strncasecmp_l_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l, 1,
|
|
__strncasecmp_l_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncat.S. */
|
|
IFUNC_IMPL (i, name, strncat,
|
|
IFUNC_IMPL_ADD (array, i, strncat, HAS_CPU_FEATURE (SSSE3),
|
|
__strncat_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncat, 1,
|
|
__strncat_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strncat, 1, __strncat_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncpy.S. */
|
|
IFUNC_IMPL (i, name, strncpy,
|
|
IFUNC_IMPL_ADD (array, i, strncpy, HAS_CPU_FEATURE (SSSE3),
|
|
__strncpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncpy, 1,
|
|
__strncpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strncpy, 1, __strncpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strpbrk.S. */
|
|
IFUNC_IMPL (i, name, strpbrk,
|
|
IFUNC_IMPL_ADD (array, i, strpbrk, HAS_CPU_FEATURE (SSE4_2),
|
|
__strpbrk_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strpbrk, 1, __strpbrk_sse2))
|
|
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strspn.S. */
|
|
IFUNC_IMPL (i, name, strspn,
|
|
IFUNC_IMPL_ADD (array, i, strspn, HAS_CPU_FEATURE (SSE4_2),
|
|
__strspn_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strspn, 1, __strspn_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strstr.c. */
|
|
IFUNC_IMPL (i, name, strstr,
|
|
IFUNC_IMPL_ADD (array, i, strstr, 1, __strstr_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, strstr, 1, __strstr_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/wcscpy.S. */
|
|
IFUNC_IMPL (i, name, wcscpy,
|
|
IFUNC_IMPL_ADD (array, i, wcscpy, HAS_CPU_FEATURE (SSSE3),
|
|
__wcscpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, wcscpy, 1, __wcscpy_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/wcslen.c. */
|
|
IFUNC_IMPL (i, name, wcslen,
|
|
IFUNC_IMPL_ADD (array, i, wcslen,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__wcslen_avx2)
|
|
IFUNC_IMPL_ADD (array, i, wcslen, 1, __wcslen_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/wcsnlen.c. */
|
|
IFUNC_IMPL (i, name, wcsnlen,
|
|
IFUNC_IMPL_ADD (array, i, wcsnlen,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__wcsnlen_avx2)
|
|
IFUNC_IMPL_ADD (array, i, wcsnlen,
|
|
HAS_CPU_FEATURE (SSE4_1),
|
|
__wcsnlen_sse4_1)
|
|
IFUNC_IMPL_ADD (array, i, wcsnlen, 1, __wcsnlen_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/wmemchr.c. */
|
|
IFUNC_IMPL (i, name, wmemchr,
|
|
IFUNC_IMPL_ADD (array, i, wmemchr,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__wmemchr_avx2)
|
|
IFUNC_IMPL_ADD (array, i, wmemchr, 1, __wmemchr_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/wmemcmp.S. */
|
|
IFUNC_IMPL (i, name, wmemcmp,
|
|
IFUNC_IMPL_ADD (array, i, wmemcmp,
|
|
(HAS_ARCH_FEATURE (AVX2_Usable)
|
|
&& HAS_CPU_FEATURE (MOVBE)),
|
|
__wmemcmp_avx2_movbe)
|
|
IFUNC_IMPL_ADD (array, i, wmemcmp, HAS_CPU_FEATURE (SSE4_1),
|
|
__wmemcmp_sse4_1)
|
|
IFUNC_IMPL_ADD (array, i, wmemcmp, HAS_CPU_FEATURE (SSSE3),
|
|
__wmemcmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, wmemcmp, 1, __wmemcmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/wmemset.c. */
|
|
IFUNC_IMPL (i, name, wmemset,
|
|
IFUNC_IMPL_ADD (array, i, wmemset, 1,
|
|
__wmemset_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, wmemset,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__wmemset_avx2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, wmemset,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__wmemset_avx512_unaligned))
|
|
|
|
#ifdef SHARED
|
|
/* Support sysdeps/x86_64/multiarch/memcpy_chk.S. */
|
|
IFUNC_IMPL (i, name, __memcpy_chk,
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_chk_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_chk_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_chk_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_chk_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_chk_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__memcpy_chk_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__memcpy_chk_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk, 1,
|
|
__memcpy_chk_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __memcpy_chk, 1,
|
|
__memcpy_chk_sse2_unaligned_erms))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/memcpy.S. */
|
|
IFUNC_IMPL (i, name, memcpy,
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__memcpy_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__memcpy_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__memcpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__memcpy_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1, __memcpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1,
|
|
__memcpy_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1, __memcpy_erms))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/mempcpy_chk.S. */
|
|
IFUNC_IMPL (i, name, __mempcpy_chk,
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_chk_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_chk_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_chk_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_chk_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_chk_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__mempcpy_chk_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk,
|
|
HAS_CPU_FEATURE (SSSE3),
|
|
__mempcpy_chk_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk, 1,
|
|
__mempcpy_chk_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __mempcpy_chk, 1,
|
|
__mempcpy_chk_sse2_unaligned_erms))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/mempcpy.S. */
|
|
IFUNC_IMPL (i, name, mempcpy,
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_avx512_no_vzeroupper)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_avx512_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__mempcpy_avx512_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_avx_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
|
HAS_ARCH_FEATURE (AVX_Usable),
|
|
__mempcpy_avx_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__mempcpy_ssse3_back)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, HAS_CPU_FEATURE (SSSE3),
|
|
__mempcpy_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, 1,
|
|
__mempcpy_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, 1,
|
|
__mempcpy_sse2_unaligned_erms)
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, 1, __mempcpy_erms))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/strncmp.S. */
|
|
IFUNC_IMPL (i, name, strncmp,
|
|
IFUNC_IMPL_ADD (array, i, strncmp, HAS_CPU_FEATURE (SSE4_2),
|
|
__strncmp_sse42)
|
|
IFUNC_IMPL_ADD (array, i, strncmp, HAS_CPU_FEATURE (SSSE3),
|
|
__strncmp_ssse3)
|
|
IFUNC_IMPL_ADD (array, i, strncmp, 1, __strncmp_sse2))
|
|
|
|
/* Support sysdeps/x86_64/multiarch/wmemset_chk.c. */
|
|
IFUNC_IMPL (i, name, __wmemset_chk,
|
|
IFUNC_IMPL_ADD (array, i, __wmemset_chk, 1,
|
|
__wmemset_chk_sse2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __wmemset_chk,
|
|
HAS_ARCH_FEATURE (AVX2_Usable),
|
|
__wmemset_chk_avx2_unaligned)
|
|
IFUNC_IMPL_ADD (array, i, __wmemset_chk,
|
|
HAS_ARCH_FEATURE (AVX512F_Usable),
|
|
__wmemset_chk_avx512_unaligned))
|
|
#endif
|
|
|
|
return i;
|
|
}
|