mirror of
https://sourceware.org/git/glibc.git
synced 2024-11-15 01:21:06 +00:00
7e8283170c
The AVX2 strrchr and wcsrchr implementation uses the 'blsmsk'
instruction which belongs to the BMI1 CPU feature and the 'shrx'
instruction, which belongs to the BMI2 CPU feature.
Fixes: df7e295d18
("x86: Optimize {str|wcs}rchr-avx2")
Partially resolves: BZ #29611
Reviewed-by: Noah Goldstein <goldstein.w.n@gmail.com>
148 lines
5.3 KiB
C
148 lines
5.3 KiB
C
/* Header defining the minimum x86 ISA level
|
|
Copyright (C) 2022 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
In addition to the permissions in the GNU Lesser General Public
|
|
License, the Free Software Foundation gives you unlimited
|
|
permission to link the compiled version of this file with other
|
|
programs, and to distribute those programs without any restriction
|
|
coming from the use of this file. (The Lesser General Public
|
|
License restrictions do apply in other respects; for example, they
|
|
cover modification of the file, and distribution when not linked
|
|
into another program.)
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<https://www.gnu.org/licenses/>. */
|
|
|
|
#ifndef _ISA_LEVEL_H
|
|
#define _ISA_LEVEL_H
|
|
|
|
#if defined __SSE__ && defined __SSE2__
|
|
/* NB: ISAs, excluding MMX, in x86-64 ISA level baseline are used. */
|
|
# define __X86_ISA_V1 1
|
|
#else
|
|
# define __X86_ISA_V1 0
|
|
#endif
|
|
|
|
#if __X86_ISA_V1 && defined __GCC_HAVE_SYNC_COMPARE_AND_SWAP_16 \
|
|
&& defined HAVE_X86_LAHF_SAHF && defined __POPCNT__ && defined __SSE3__ \
|
|
&& defined __SSSE3__ && defined __SSE4_1__ && defined __SSE4_2__
|
|
/* NB: ISAs in x86-64 ISA level v2 are used. */
|
|
# define __X86_ISA_V2 1
|
|
#else
|
|
# define __X86_ISA_V2 0
|
|
#endif
|
|
|
|
#if __X86_ISA_V2 && defined __AVX__ && defined __AVX2__ && defined __F16C__ \
|
|
&& defined __FMA__ && defined __LZCNT__ && defined HAVE_X86_MOVBE \
|
|
&& defined __BMI__ && defined __BMI2__
|
|
/* NB: ISAs in x86-64 ISA level v3 are used. */
|
|
# define __X86_ISA_V3 1
|
|
#else
|
|
# define __X86_ISA_V3 0
|
|
#endif
|
|
|
|
#if __X86_ISA_V3 && defined __AVX512F__ && defined __AVX512BW__ \
|
|
&& defined __AVX512CD__ && defined __AVX512DQ__ && defined __AVX512VL__
|
|
/* NB: ISAs in x86-64 ISA level v4 are used. */
|
|
# define __X86_ISA_V4 1
|
|
#else
|
|
# define __X86_ISA_V4 0
|
|
#endif
|
|
|
|
#define MINIMUM_X86_ISA_LEVEL \
|
|
(__X86_ISA_V1 + __X86_ISA_V2 + __X86_ISA_V3 + __X86_ISA_V4)
|
|
|
|
/* Depending on the minimum ISA level, a feature check result can be a
|
|
compile-time constant.. */
|
|
|
|
|
|
/* For CPU_FEATURE_USABLE_P. */
|
|
|
|
/* ISA level >= 4 guaranteed includes. */
|
|
#define AVX512F_X86_ISA_LEVEL 4
|
|
#define AVX512VL_X86_ISA_LEVEL 4
|
|
#define AVX512BW_X86_ISA_LEVEL 4
|
|
#define AVX512DQ_X86_ISA_LEVEL 4
|
|
|
|
/* ISA level >= 3 guaranteed includes. */
|
|
#define AVX_X86_ISA_LEVEL 3
|
|
#define AVX2_X86_ISA_LEVEL 3
|
|
#define BMI1_X86_ISA_LEVEL 3
|
|
#define BMI2_X86_ISA_LEVEL 3
|
|
#define LZCNT_X86_ISA_LEVEL 3
|
|
#define MOVBE_X86_ISA_LEVEL 3
|
|
|
|
/* ISA level >= 2 guaranteed includes. */
|
|
#define SSE4_2_X86_ISA_LEVEL 2
|
|
#define SSE4_1_X86_ISA_LEVEL 2
|
|
#define SSSE3_X86_ISA_LEVEL 2
|
|
|
|
|
|
/* For X86_ISA_CPU_FEATURES_ARCH_P. */
|
|
|
|
/* NB: This feature is enabled when ISA level >= 3, which was disabled
|
|
for the following CPUs:
|
|
- AMD Excavator
|
|
when ISA level < 3. */
|
|
#define AVX_Fast_Unaligned_Load_X86_ISA_LEVEL 3
|
|
|
|
/* NB: This feature is disabled when ISA level >= 3, which was enabled
|
|
for the following CPUs:
|
|
- Intel KNL
|
|
when ISA level < 3. */
|
|
#define Prefer_No_VZEROUPPER_X86_ISA_LEVEL 3
|
|
|
|
/* NB: This feature is disable when ISA level >= 3. All CPUs with
|
|
this feature don't run on glibc built with ISA level >= 3. */
|
|
#define Slow_SSE42_X86_ISA_LEVEL 3
|
|
|
|
/* Feature(s) enabled when ISA level >= 2. */
|
|
#define Fast_Unaligned_Load_X86_ISA_LEVEL 2
|
|
|
|
/* NB: This feature is disable when ISA level >= 2, which was enabled
|
|
for the early Atom CPUs. */
|
|
#define Slow_BSF_X86_ISA_LEVEL 2
|
|
|
|
|
|
/* Both X86_ISA_CPU_FEATURE_USABLE_P and X86_ISA_CPU_FEATURES_ARCH_P
|
|
macros are wrappers for the respective CPU_FEATURE{S}_{USABLE|ARCH}_P
|
|
runtime checks. They differ in two ways.
|
|
|
|
1. The USABLE_P version is evaluated to true when the feature
|
|
is enabled.
|
|
|
|
2. The ARCH_P version has a third argument `not`. The `not`
|
|
argument can either be `!` or empty. If the feature is
|
|
enabled above an ISA level, the third argument should be empty
|
|
and the expression is evaluated to true when the feature is
|
|
enabled. If the feature is disabled above an ISA level, the
|
|
third argument should be `!` and the expression is evaluated
|
|
to true when the feature is disabled.
|
|
*/
|
|
|
|
#define X86_ISA_CPU_FEATURE_USABLE_P(ptr, name) \
|
|
(((name##_X86_ISA_LEVEL) <= MINIMUM_X86_ISA_LEVEL) \
|
|
|| CPU_FEATURE_USABLE_P (ptr, name))
|
|
|
|
#define X86_ISA_CPU_FEATURES_ARCH_P(ptr, name, not) \
|
|
(((name##_X86_ISA_LEVEL) <= MINIMUM_X86_ISA_LEVEL) \
|
|
|| not CPU_FEATURES_ARCH_P (ptr, name))
|
|
|
|
#define ISA_SHOULD_BUILD(isa_build_level) \
|
|
(MINIMUM_X86_ISA_LEVEL <= (isa_build_level) && IS_IN (libc)) \
|
|
|| defined ISA_DEFAULT_IMPL
|
|
|
|
#endif
|