2009-07-31 18:53:35 +00:00
|
|
|
ifeq ($(subdir),csu)
|
2012-05-17 03:14:24 +00:00
|
|
|
tests += test-multiarch
|
2009-07-31 18:53:35 +00:00
|
|
|
gen-as-const-headers += ifunc-defines.sym
|
|
|
|
endif
|
2009-08-04 19:13:43 +00:00
|
|
|
|
|
|
|
ifeq ($(subdir),string)
|
2011-11-13 14:50:13 +00:00
|
|
|
gen-as-const-headers += locale-defines.sym
|
2010-01-12 19:22:03 +00:00
|
|
|
sysdep_routines += bzero-sse2 memset-sse2 memcpy-ssse3 mempcpy-ssse3 \
|
|
|
|
memmove-ssse3 memcpy-ssse3-rep mempcpy-ssse3-rep \
|
|
|
|
memmove-ssse3-rep bcopy-ssse3 bcopy-ssse3-rep \
|
2010-02-15 19:17:50 +00:00
|
|
|
memset-sse2-rep bzero-sse2-rep strcmp-ssse3 \
|
|
|
|
strcmp-sse4 strncmp-c strncmp-ssse3 strncmp-sse4 \
|
2013-12-18 01:53:27 +00:00
|
|
|
memcmp-ssse3 memcmp-sse4 varshift \
|
2011-06-24 18:15:32 +00:00
|
|
|
strlen-sse2 strlen-sse2-bsf strncpy-c strcpy-ssse3 \
|
|
|
|
strncpy-ssse3 stpcpy-ssse3 stpncpy-ssse3 strcpy-sse2 \
|
2011-08-04 19:33:38 +00:00
|
|
|
strncpy-sse2 stpcpy-sse2 stpncpy-sse2 strcat-ssse3 \
|
2011-09-05 17:53:27 +00:00
|
|
|
strcat-sse2 strncat-ssse3 strncat-sse2 strncat-c \
|
2011-09-05 21:11:11 +00:00
|
|
|
strchr-sse2 strrchr-sse2 strchr-sse2-bsf strrchr-sse2-bsf \
|
2011-10-28 09:39:07 +00:00
|
|
|
memchr-sse2 memchr-sse2-bsf \
|
2011-10-12 15:42:04 +00:00
|
|
|
memrchr-sse2 memrchr-sse2-bsf memrchr-c \
|
2011-10-15 15:10:08 +00:00
|
|
|
rawmemchr-sse2 rawmemchr-sse2-bsf \
|
2011-11-13 14:50:13 +00:00
|
|
|
strnlen-sse2 strnlen-c \
|
|
|
|
strcasecmp_l-c strcasecmp-c strcasecmp_l-ssse3 \
|
2011-11-14 23:24:35 +00:00
|
|
|
strncase_l-c strncase-c strncase_l-ssse3 \
|
i386: memcpy functions with SSE2 unaligned load/store
These new memcpy functions are the 32-bit version of x86_64 SSE2 unaligned
memcpy. Memcpy average performace benefit is 18% on Silvermont, other
platforms also improved about 35%, benchmarked on Silvermont, Haswell, Ivy
Bridge, Sandy Bridge and Westmere, performance results attached in
https://sourceware.org/ml/libc-alpha/2014-07/msg00157.html
* sysdeps/i386/i686/multiarch/bcopy-sse2-unaligned.S: New file.
* sysdeps/i386/i686/multiarch/memcpy-sse2-unaligned.S: Likewise.
* sysdeps/i386/i686/multiarch/memmove-sse2-unaligned.S: Likewise.
* sysdeps/i386/i686/multiarch/mempcpy-sse2-unaligned.S: Likewise.
* sysdeps/i386/i686/multiarch/bcopy.S: Select the sse2_unaligned
version if bit_Fast_Unaligned_Load is set.
* sysdeps/i386/i686/multiarch/memcpy.S: Likewise.
* sysdeps/i386/i686/multiarch/memcpy_chk.S: Likewise.
* sysdeps/i386/i686/multiarch/memmove.S: Likewise.
* sysdeps/i386/i686/multiarch/memmove_chk.S: Likewise.
* sysdeps/i386/i686/multiarch/mempcpy.S: Likewise.
* sysdeps/i386/i686/multiarch/mempcpy_chk.S: Likewise.
* sysdeps/i386/i686/multiarch/Makefile (sysdep_routines): Add
bcopy-sse2-unaligned, memcpy-sse2-unaligned,
memmove-sse2-unaligned and mempcpy-sse2-unaligned.
* sysdeps/i386/i686/multiarch/ifunc-impl-list.c (MAX_IFUNC): Set
to 4.
(__libc_ifunc_impl_list): Test __bcopy_sse2_unaligned,
__memmove_chk_sse2_unaligned, __memmove_sse2_unaligned,
__memcpy_chk_sse2_unaligned, __memcpy_sse2_unaligned,
__mempcpy_chk_sse2_unaligned, and __mempcpy_sse2_unaligned.
2014-12-29 11:39:46 +00:00
|
|
|
strcasecmp_l-sse4 strncase_l-sse4 \
|
|
|
|
bcopy-sse2-unaligned memcpy-sse2-unaligned \
|
2015-10-06 20:47:40 +00:00
|
|
|
mempcpy-sse2-unaligned memmove-sse2-unaligned \
|
|
|
|
strcspn-c strpbrk-c strspn-c
|
2010-08-28 00:11:38 +00:00
|
|
|
CFLAGS-varshift.c += -msse4
|
2009-08-04 19:13:43 +00:00
|
|
|
CFLAGS-strcspn-c.c += -msse4
|
|
|
|
CFLAGS-strpbrk-c.c += -msse4
|
|
|
|
CFLAGS-strspn-c.c += -msse4
|
|
|
|
endif
|
2010-04-15 05:27:59 +00:00
|
|
|
|
2011-10-28 09:39:07 +00:00
|
|
|
ifeq ($(subdir),wcsmbs)
|
|
|
|
sysdep_routines += wcscmp-sse2 wcscmp-c wcslen-sse2 wcslen-c \
|
2011-12-17 19:39:23 +00:00
|
|
|
wmemcmp-sse4 wmemcmp-ssse3 wmemcmp-c wcschr-sse2 \
|
|
|
|
wcschr-c wcsrchr-sse2 wcsrchr-c wcscpy-ssse3 wcscpy-c
|
2011-10-28 09:39:07 +00:00
|
|
|
endif
|
|
|
|
|
2010-04-15 05:27:59 +00:00
|
|
|
ifeq (mathyes,$(subdir)$(config-cflags-avx))
|
|
|
|
libm-sysdep_routines += s_fma-fma s_fmaf-fma
|
|
|
|
CFLAGS-s_fma-fma.c += -mavx -mfpmath=sse
|
|
|
|
CFLAGS-s_fmaf-fma.c += -mavx -mfpmath=sse
|
|
|
|
endif
|