glibc/sysdeps/powerpc/powerpc64/multiarch/strchr-power8.S
Rajalakshmi Srinivasaraghavan 9314d3545e powerpc64: strchr/strchrnul optimization for power8
The P7 code is used for strings of <= 32 bytes; for strings > 32 bytes,
vectorized loops are used.  This shows an average 25% improvement, depending
on the position of the search character.  The performance is the same for
shorter strings.
Tested on ppc64 and ppc64le.
2016-12-28 11:44:31 -02:00

40 lines
1.3 KiB
ArmAsm

/* Optimized strchr implementation for POWER8.
Copyright (C) 2016 Free Software Foundation, Inc.
This file is part of the GNU C Library.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library; if not, see
<http://www.gnu.org/licenses/>. */
#include <sysdep.h>
/* Replace whatever definition of ENTRY was in effect up to this point.
   After this, any use of ENTRY (...) -- presumably including the ones in
   the implementation file included at the end of this file -- opens a
   function under the fixed symbol __strchr_power8.  The NAME argument is
   accepted but never referenced in the expansion.

   The expansion, in order: switches to the ".text" section, invokes
   ENTRY_2, applies .align ALIGNARG(2), places the BODY_LABEL label,
   issues cfi_startproc, and invokes LOCALENTRY.  ENTRY_2, ALIGNARG,
   BODY_LABEL and LOCALENTRY are not defined in this file (presumably they
   come from <sysdep.h>; check there for what each one emits).  */
#undef ENTRY
#define ENTRY(name) \
.section ".text"; \
ENTRY_2(__strchr_power8) \
.align ALIGNARG(2); \
BODY_LABEL(__strchr_power8): \
cfi_startproc; \
LOCALENTRY(__strchr_power8)
/* Replace whatever definition of END was in effect up to this point, as
   the counterpart of the ENTRY override: any use of END (...) after this
   closes the function under the fixed symbol __strchr_power8.  The NAME
   argument is accepted but never referenced in the expansion.

   The expansion, in order: issues cfi_endproc, then invokes TRACEBACK and
   END_2.  TRACEBACK and END_2 are not defined in this file (presumably
   they come from <sysdep.h>; check there for what each one emits).  */
#undef END
#define END(name) \
cfi_endproc; \
TRACEBACK(__strchr_power8) \
END_2(__strchr_power8)
/* Redefine libc_hidden_builtin_def to expand to nothing, so any use of it
   after this point (presumably in the implementation file included below)
   produces no output.
   NOTE(review): the apparent intent is to keep this variant from emitting
   the hidden definition for the generic name -- confirm against the
   original definition of the macro.  */
#undef libc_hidden_builtin_def
#define libc_hidden_builtin_def(name)
#include <sysdeps/powerpc/powerpc64/power8/strchr.S>