mirror of
https://sourceware.org/git/glibc.git
synced 2024-11-26 23:10:06 +00:00
2193311288
Here is an implementation of cos containing SSE, AVX, AVX2 and AVX512 versions according to the Vector ABI, which was discussed in <https://groups.google.com/forum/#!topic/x86-64-abi/LmppCfN1rZ4>. Vector math library build and ABI testing are enabled by default for x86_64. * sysdeps/x86_64/fpu/Makefile: New file. * sysdeps/x86_64/fpu/Versions: New file. * sysdeps/x86_64/fpu/svml_d_cos_data.S: New file. * sysdeps/x86_64/fpu/svml_d_cos_data.h: New file. * sysdeps/x86_64/fpu/svml_d_cos2_core.S: New file. * sysdeps/x86_64/fpu/svml_d_cos4_core.S: New file. * sysdeps/x86_64/fpu/svml_d_cos4_core_avx.S: New file. * sysdeps/x86_64/fpu/svml_d_cos8_core.S: New file. * sysdeps/x86_64/fpu/svml_d_wrapper_impl.h: New file. * sysdeps/x86_64/fpu/multiarch/svml_d_cos2_core.S: New file. * sysdeps/x86_64/fpu/multiarch/svml_d_cos2_core_sse4.S: New file. * sysdeps/x86_64/fpu/multiarch/svml_d_cos4_core.S: New file. * sysdeps/x86_64/fpu/multiarch/svml_d_cos4_core_avx2.S: New file. * sysdeps/x86_64/fpu/multiarch/svml_d_cos8_core.S: New file. * sysdeps/x86_64/fpu/multiarch/svml_d_cos8_core_avx512.S: New file. * sysdeps/x86_64/fpu/multiarch/Makefile (libmvec-sysdep_routines): Added build of SSE, AVX2 and AVX512 IFUNC versions. * sysdeps/x86/fpu/bits/math-vector.h: Added SIMD declaration for cos. * math/bits/mathcalls.h: Added cos declaration with __MATHCALL_VEC. * sysdeps/x86_64/configure.ac: Options for libmvec build. * sysdeps/x86_64/configure: Regenerated. * sysdeps/x86_64/sysdep.h (cfi_offset_rel_rsp): New macro. * sysdeps/unix/sysv/linux/x86_64/libmvec.abilist: New file. * manual/install.texi (Configuring and compiling): Document --disable-mathvec. * INSTALL: Regenerated. * NEWS: Mention addition of libmvec and x86_64 vector cos.
285 lines
8.5 KiB
Plaintext
285 lines
8.5 KiB
Plaintext
|
|
# ac_fn_c_check_header_compile LINENO HEADER VAR INCLUDES
# -------------------------------------------------------
# Tests whether HEADER exists and can be compiled using the include files in
# INCLUDES, setting the cache variable VAR accordingly.
#
#   $1 LINENO    line number used in the log messages when as_lineno is unset
#   $2 HEADER    header name placed inside `#include <...>`
#   $3 VAR       name of the cache variable; receives `yes` or `no`
#   $4 INCLUDES  text written into the test program before the #include
#
# Progress messages go to file descriptors 5 and 6.  The compile itself is
# delegated to ac_fn_c_try_compile, which is defined outside this fragment.
ac_fn_c_check_header_compile ()
{
  # Push the caller's line number; the matching pop is at the end.
  as_lineno=${as_lineno-"$1"} as_lineno_stack=as_lineno_stack=$as_lineno_stack
  { $as_echo "$as_me:${as_lineno-$LINENO}: checking for $2" >&5
    $as_echo_n "checking for $2... " >&6; }
  # A VAR that is already set (to any value) is treated as a cached answer.
  if eval \${$3+:} false; then :
    $as_echo_n "(cached) " >&6
  else
    # Test program = confdefs.h + INCLUDES + the header under test.
    # The here-document delimiter is unquoted so $4 and $2 are expanded.
    cat confdefs.h - <<_ACEOF >conftest.$ac_ext
/* end confdefs.h. */
$4
#include <$2>
_ACEOF
    if ac_fn_c_try_compile "$LINENO"; then :
      eval "$3=yes"
    else
      eval "$3=no"
    fi
    rm -f core conftest.err conftest.$ac_objext conftest.$ac_ext
  fi
  eval ac_res=\$$3
  { $as_echo "$as_me:${as_lineno-$LINENO}: result: $ac_res" >&5
    $as_echo "$ac_res" >&6; }
  # Pop the entry pushed above; as_lineno is unset once the stack is empty.
  eval $as_lineno_stack; ${as_lineno_stack:+:} unset as_lineno

} # ac_fn_c_check_header_compile

# This file is generated from configure.ac by Autoconf. DO NOT EDIT!
# Local configure fragment for sysdeps/x86_64.

# <cpuid.h> is required.  The header is compiled with no default includes
# (the fourth argument is only a C comment plus a newline); if the result is
# not "yes", as_fn_error is called with exit status 5.
ac_fn_c_check_header_compile "$LINENO" "cpuid.h" "ac_cv_header_cpuid_h" "/* No default includes. */
"
if test "x$ac_cv_header_cpuid_h" = xyes; then :

else
  as_fn_error $? "gcc must provide the <cpuid.h> header" "$LINENO" 5
fi

# Check whether the compiler accepts -msse4.
# The result is kept in the cache variable libc_cv_cc_sse4 (a value that is
# already set is reused), HAVE_SSE4_SUPPORT is appended to confdefs.h on
# success, and the result is appended to config_vars as config-cflags-sse4.
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for SSE4 support" >&5
  $as_echo_n "checking for SSE4 support... " >&6; }
if ${libc_cv_cc_sse4+:} false; then :
  $as_echo_n "(cached) " >&6
else
  # Compile /dev/null as C with the flag; only the exit status matters.
  if { ac_try='${CC-cc} -msse4 -xc /dev/null -S -o /dev/null'
       { { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
         (eval $ac_try) 2>&5
         ac_status=$?
         $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
         test $ac_status = 0; }; }; then :
    libc_cv_cc_sse4=yes
  else
    libc_cv_cc_sse4=no
  fi

fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_cc_sse4" >&5
  $as_echo "$libc_cv_cc_sse4" >&6; }
# Quoted with an "x" prefix so an empty cache value cannot break `test`.
if test "x$libc_cv_cc_sse4" = xyes; then
  $as_echo "#define HAVE_SSE4_SUPPORT 1" >>confdefs.h

fi
# The second line of this string must start in column 0: it is appended
# verbatim to config_vars.
config_vars="$config_vars
config-cflags-sse4 = $libc_cv_cc_sse4"

# Check whether the compiler accepts -mavx.
# The result is kept in the cache variable libc_cv_cc_avx (a value that is
# already set is reused), HAVE_AVX_SUPPORT is appended to confdefs.h on
# success, and the result is appended to config_vars as config-cflags-avx.
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for AVX support" >&5
  $as_echo_n "checking for AVX support... " >&6; }
if ${libc_cv_cc_avx+:} false; then :
  $as_echo_n "(cached) " >&6
else
  # Compile /dev/null as C with the flag; only the exit status matters.
  if { ac_try='${CC-cc} -mavx -xc /dev/null -S -o /dev/null'
       { { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
         (eval $ac_try) 2>&5
         ac_status=$?
         $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
         test $ac_status = 0; }; }; then :
    libc_cv_cc_avx=yes
  else
    libc_cv_cc_avx=no
  fi

fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_cc_avx" >&5
  $as_echo "$libc_cv_cc_avx" >&6; }
# Quoted with an "x" prefix so an empty cache value cannot break `test`.
if test "x$libc_cv_cc_avx" = xyes; then
  $as_echo "#define HAVE_AVX_SUPPORT 1" >>confdefs.h

fi
# The second line of this string must start in column 0: it is appended
# verbatim to config_vars.
config_vars="$config_vars
config-cflags-avx = $libc_cv_cc_avx"

# Check whether the assembler accepts an AVX512 instruction.
# A one-instruction file (vmovdqu64 with a %zmm register) is assembled through
# the compiler driver with $ASFLAGS.  The result is kept in the cache variable
# libc_cv_asm_avx512; HAVE_AVX512_ASM_SUPPORT is appended to confdefs.h on
# success.
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for AVX512 support in assembler" >&5
  $as_echo_n "checking for AVX512 support in assembler... " >&6; }
if ${libc_cv_asm_avx512+:} false; then :
  $as_echo_n "(cached) " >&6
else
  # Quoted delimiter: the assembly text is written without any expansion.
  cat > conftest.s <<\EOF
        vmovdqu64 %zmm0, (%rsp)
EOF
  if { ac_try='${CC-cc} -c $ASFLAGS conftest.s 1>&5'
       { { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
         (eval $ac_try) 2>&5
         ac_status=$?
         $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
         test $ac_status = 0; }; }; then
    libc_cv_asm_avx512=yes
  else
    libc_cv_asm_avx512=no
  fi
  # Removes the source and anything the compile produced from it.
  rm -f conftest*
fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_asm_avx512" >&5
  $as_echo "$libc_cv_asm_avx512" >&6; }
# Use POSIX "=" here: "==" is not a portable `test` operator and some shells
# reject it.  The "x" prefix keeps the test valid for an empty value.
if test "x$libc_cv_asm_avx512" = xyes; then
  $as_echo "#define HAVE_AVX512_ASM_SUPPORT 1" >>confdefs.h

fi

# Check whether the compiler accepts -mavx512f.
# The result is kept in the cache variable libc_cv_cc_avx512 (a value that is
# already set is reused), HAVE_AVX512_SUPPORT is appended to confdefs.h on
# success, and the result is appended to config_vars as config-cflags-avx512.
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for AVX512 support" >&5
  $as_echo_n "checking for AVX512 support... " >&6; }
if ${libc_cv_cc_avx512+:} false; then :
  $as_echo_n "(cached) " >&6
else
  # Compile /dev/null as C with the flag; only the exit status matters.
  if { ac_try='${CC-cc} -mavx512f -xc /dev/null -S -o /dev/null'
       { { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
         (eval $ac_try) 2>&5
         ac_status=$?
         $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
         test $ac_status = 0; }; }; then :
    # Even when the compiler accepts the flag, the answer is whatever the
    # assembler check recorded in libc_cv_asm_avx512.
    libc_cv_cc_avx512=$libc_cv_asm_avx512
  else
    libc_cv_cc_avx512=no
  fi

fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_cc_avx512" >&5
  $as_echo "$libc_cv_cc_avx512" >&6; }
# Quoted with an "x" prefix so an empty value (for example when
# libc_cv_asm_avx512 was never set) cannot break `test`.
if test "x$libc_cv_cc_avx512" = xyes; then
  $as_echo "#define HAVE_AVX512_SUPPORT 1" >>confdefs.h

fi
# The second line of this string must start in column 0: it is appended
# verbatim to config_vars.
config_vars="$config_vars
config-cflags-avx512 = $libc_cv_cc_avx512"

# Check whether the compiler accepts -msse2avx (AVX encoding of SSE
# instructions).
# The result is kept in the cache variable libc_cv_cc_sse2avx (a value that is
# already set is reused), HAVE_SSE2AVX_SUPPORT is appended to confdefs.h on
# success, and the result is appended to config_vars as config-cflags-sse2avx.
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for AVX encoding of SSE instructions" >&5
  $as_echo_n "checking for AVX encoding of SSE instructions... " >&6; }
if ${libc_cv_cc_sse2avx+:} false; then :
  $as_echo_n "(cached) " >&6
else
  # Compile /dev/null as C with the flag; only the exit status matters.
  if { ac_try='${CC-cc} -msse2avx -xc /dev/null -S -o /dev/null'
       { { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
         (eval $ac_try) 2>&5
         ac_status=$?
         $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
         test $ac_status = 0; }; }; then :
    libc_cv_cc_sse2avx=yes
  else
    libc_cv_cc_sse2avx=no
  fi

fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_cc_sse2avx" >&5
  $as_echo "$libc_cv_cc_sse2avx" >&6; }
# Quoted with an "x" prefix so an empty cache value cannot break `test`.
if test "x$libc_cv_cc_sse2avx" = xyes; then
  $as_echo "#define HAVE_SSE2AVX_SUPPORT 1" >>confdefs.h

fi
# The second line of this string must start in column 0: it is appended
# verbatim to config_vars.
config_vars="$config_vars
config-cflags-sse2avx = $libc_cv_cc_sse2avx"

# Check whether the compiler accepts -mfma4.
# The result is kept in the cache variable libc_cv_cc_fma4 (a value that is
# already set is reused), HAVE_FMA4_SUPPORT is appended to confdefs.h on
# success, and the result is appended to config_vars as have-mfma4.
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for FMA4 support" >&5
  $as_echo_n "checking for FMA4 support... " >&6; }
if ${libc_cv_cc_fma4+:} false; then :
  $as_echo_n "(cached) " >&6
else
  # Compile /dev/null as C with the flag; only the exit status matters.
  if { ac_try='${CC-cc} -mfma4 -xc /dev/null -S -o /dev/null'
       { { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
         (eval $ac_try) 2>&5
         ac_status=$?
         $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
         test $ac_status = 0; }; }; then :
    libc_cv_cc_fma4=yes
  else
    libc_cv_cc_fma4=no
  fi

fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_cc_fma4" >&5
  $as_echo "$libc_cv_cc_fma4" >&6; }
# Quoted with an "x" prefix so an empty cache value cannot break `test`.
if test "x$libc_cv_cc_fma4" = xyes; then
  $as_echo "#define HAVE_FMA4_SUPPORT 1" >>confdefs.h

fi
# The second line of this string must start in column 0: it is appended
# verbatim to config_vars.
config_vars="$config_vars
have-mfma4 = $libc_cv_cc_fma4"

# Check whether the compiler accepts -mno-vzeroupper.
# The result is kept in the cache variable libc_cv_cc_novzeroupper (a value
# that is already set is reused) and appended to config_vars as
# config-cflags-novzeroupper.  No preprocessor macro is defined for it.
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for -mno-vzeroupper support" >&5
  $as_echo_n "checking for -mno-vzeroupper support... " >&6; }
if ${libc_cv_cc_novzeroupper+:} false; then :
  $as_echo_n "(cached) " >&6
else
  # Compile /dev/null as C with the flag; only the exit status matters.
  if { ac_try='${CC-cc} -mno-vzeroupper -xc /dev/null -S -o /dev/null'
       { { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
         (eval $ac_try) 2>&5
         ac_status=$?
         $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
         test $ac_status = 0; }; }; then :
    libc_cv_cc_novzeroupper=yes
  else
    libc_cv_cc_novzeroupper=no
  fi

fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_cc_novzeroupper" >&5
  $as_echo "$libc_cv_cc_novzeroupper" >&6; }
# The second line of this string must start in column 0: it is appended
# verbatim to config_vars.
config_vars="$config_vars
config-cflags-novzeroupper = $libc_cv_cc_novzeroupper"

# Check whether the assembler accepts an Intel MPX instruction.
# A one-instruction file (bndmov with a %bnd register) is assembled through
# the compiler driver with $ASFLAGS.  The result is kept in the cache variable
# libc_cv_asm_mpx; HAVE_MPX_SUPPORT is appended to confdefs.h on success.
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for Intel MPX support" >&5
  $as_echo_n "checking for Intel MPX support... " >&6; }
if ${libc_cv_asm_mpx+:} false; then :
  $as_echo_n "(cached) " >&6
else
  # Quoted delimiter: the assembly text is written without any expansion.
  cat > conftest.s <<\EOF
        bndmov %bnd0,(%rsp)
EOF
  if { ac_try='${CC-cc} -c $ASFLAGS conftest.s 1>&5'
       { { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
         (eval $ac_try) 2>&5
         ac_status=$?
         $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
         test $ac_status = 0; }; }; then
    libc_cv_asm_mpx=yes
  else
    libc_cv_asm_mpx=no
  fi
  # Removes the source and anything the compile produced from it.
  rm -f conftest*
fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_asm_mpx" >&5
  $as_echo "$libc_cv_asm_mpx" >&6; }
# Use POSIX "=" here: "==" is not a portable `test` operator and some shells
# reject it.  The "x" prefix keeps the test valid for an empty value.
if test "x$libc_cv_asm_mpx" = xyes; then
  $as_echo "#define HAVE_MPX_SUPPORT 1" >>confdefs.h

fi

# Check whether the compiler accepts -mavx2.
# The result is kept in the cache variable libc_cv_cc_avx2 (a value that is
# already set is reused), HAVE_AVX2_SUPPORT is appended to confdefs.h on
# success, and the result is appended to config_vars as config-cflags-avx2.
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for AVX2 support" >&5
  $as_echo_n "checking for AVX2 support... " >&6; }
if ${libc_cv_cc_avx2+:} false; then :
  $as_echo_n "(cached) " >&6
else
  # Compile /dev/null as C with the flag; only the exit status matters.
  if { ac_try='${CC-cc} -mavx2 -xc /dev/null -S -o /dev/null'
       { { eval echo "\"\$as_me\":${as_lineno-$LINENO}: \"$ac_try\""; } >&5
         (eval $ac_try) 2>&5
         ac_status=$?
         $as_echo "$as_me:${as_lineno-$LINENO}: \$? = $ac_status" >&5
         test $ac_status = 0; }; }; then :
    libc_cv_cc_avx2=yes
  else
    libc_cv_cc_avx2=no
  fi

fi
{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_cc_avx2" >&5
  $as_echo "$libc_cv_cc_avx2" >&6; }
# Quoted with an "x" prefix so an empty cache value cannot break `test`.
if test "x$libc_cv_cc_avx2" = xyes; then
  $as_echo "#define HAVE_AVX2_SUPPORT 1" >>confdefs.h

fi
# The second line of this string must start in column 0: it is appended
# verbatim to config_vars.
config_vars="$config_vars
config-cflags-avx2 = $libc_cv_cc_avx2"

# Default build_mathvec to "yes" when it still holds the placeholder value
# "notset"; any other value is left untouched.
if test x"$build_mathvec" = xnotset; then
  build_mathvec=yes
fi

# Unconditionally record PI_STATIC_AND_HIDDEN in confdefs.h.
$as_echo "#define PI_STATIC_AND_HIDDEN 1" >>confdefs.h

# work around problem with autoconf and empty lines at the end of files