mirror of
https://sourceware.org/git/glibc.git
synced 2025-01-08 18:30:18 +00:00
2d63a517e4
AVX-512 ISA adds 512-bit zmm registers. This patch updates _dl_runtime_profile to pass zmm registers to run-time audit. It also changes _dl_x86_64_save_sse and _dl_x86_64_restore_sse to upport zmm registers, which are called when only when RTLD_PREPARE_FOREIGN_CALL is used. Its performance impact is minimum. * config.h.in (HAVE_AVX512_SUPPORT): New #undef. (HAVE_AVX512_ASM_SUPPORT): Likewise. * sysdeps/x86_64/bits/link.h (La_x86_64_zmm): New. (La_x86_64_vector): Add zmm. * sysdeps/x86_64/Makefile (tests): Add tst-audit10. (modules-names): Add tst-auditmod10a and tst-auditmod10b. ($(objpfx)tst-audit10): New target. ($(objpfx)tst-audit10.out): Likewise. (tst-audit10-ENV): New. (AVX512-CFLAGS): Likewise. (CFLAGS-tst-audit10.c): Likewise. (CFLAGS-tst-auditmod10a.c): Likewise. (CFLAGS-tst-auditmod10b.c): Likewise. * sysdeps/x86_64/configure.ac: Set config-cflags-avx512, HAVE_AVX512_SUPPORT and HAVE_AVX512_ASM_SUPPORT. * sysdeps/x86_64/configure: Regenerated. * sysdeps/x86_64/dl-trampoline.S (_dl_runtime_profile): Add AVX-512 zmm register support. (_dl_x86_64_save_sse): Likewise. (_dl_x86_64_restore_sse): Likewise. * sysdeps/x86_64/dl-trampoline.h: Updated to support different size vector registers. * sysdeps/x86_64/link-defines.sym (YMM_SIZE): New. (ZMM_SIZE): Likewise. * sysdeps/x86_64/tst-audit10.c: New file. * sysdeps/x86_64/tst-auditmod10a.c: Likewise. * sysdeps/x86_64/tst-auditmod10b.c: Likewise.
151 lines
4.0 KiB
C
151 lines
4.0 KiB
C
/* Copyright (C) 2004-2014 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#ifndef _LINK_H
|
|
# error "Never include <bits/link.h> directly; use <link.h> instead."
|
|
#endif
|
|
|
|
|
|
#ifndef __x86_64__
|
|
/* Registers for entry into PLT on IA-32. */
|
|
typedef struct La_i86_regs
|
|
{
|
|
uint32_t lr_edx;
|
|
uint32_t lr_ecx;
|
|
uint32_t lr_eax;
|
|
uint32_t lr_ebp;
|
|
uint32_t lr_esp;
|
|
} La_i86_regs;
|
|
|
|
/* Return values for calls from PLT on IA-32. */
|
|
typedef struct La_i86_retval
|
|
{
|
|
uint32_t lrv_eax;
|
|
uint32_t lrv_edx;
|
|
long double lrv_st0;
|
|
long double lrv_st1;
|
|
} La_i86_retval;
|
|
|
|
|
|
__BEGIN_DECLS
|
|
|
|
extern Elf32_Addr la_i86_gnu_pltenter (Elf32_Sym *__sym, unsigned int __ndx,
|
|
uintptr_t *__refcook,
|
|
uintptr_t *__defcook,
|
|
La_i86_regs *__regs,
|
|
unsigned int *__flags,
|
|
const char *__symname,
|
|
long int *__framesizep);
|
|
extern unsigned int la_i86_gnu_pltexit (Elf32_Sym *__sym, unsigned int __ndx,
|
|
uintptr_t *__refcook,
|
|
uintptr_t *__defcook,
|
|
const La_i86_regs *__inregs,
|
|
La_i86_retval *__outregs,
|
|
const char *symname);
|
|
|
|
__END_DECLS
|
|
|
|
#else
|
|
|
|
/* Registers for entry into PLT on x86-64. */
|
|
# if __GNUC_PREREQ (4,0)
|
|
typedef float La_x86_64_xmm __attribute__ ((__vector_size__ (16)));
|
|
typedef float La_x86_64_ymm
|
|
__attribute__ ((__vector_size__ (32), __aligned__ (16)));
|
|
typedef double La_x86_64_zmm
|
|
__attribute__ ((__vector_size__ (64), __aligned__ (16)));
|
|
# else
|
|
typedef float La_x86_64_xmm __attribute__ ((__mode__ (__V4SF__)));
|
|
# endif
|
|
|
|
typedef union
|
|
{
|
|
# if __GNUC_PREREQ (4,0)
|
|
La_x86_64_ymm ymm[2];
|
|
La_x86_64_zmm zmm[1];
|
|
# endif
|
|
La_x86_64_xmm xmm[4];
|
|
} La_x86_64_vector __attribute__ ((__aligned__ (16)));
|
|
|
|
typedef struct La_x86_64_regs
|
|
{
|
|
uint64_t lr_rdx;
|
|
uint64_t lr_r8;
|
|
uint64_t lr_r9;
|
|
uint64_t lr_rcx;
|
|
uint64_t lr_rsi;
|
|
uint64_t lr_rdi;
|
|
uint64_t lr_rbp;
|
|
uint64_t lr_rsp;
|
|
La_x86_64_xmm lr_xmm[8];
|
|
La_x86_64_vector lr_vector[8];
|
|
} La_x86_64_regs;
|
|
|
|
/* Return values for calls from PLT on x86-64. */
|
|
typedef struct La_x86_64_retval
|
|
{
|
|
uint64_t lrv_rax;
|
|
uint64_t lrv_rdx;
|
|
La_x86_64_xmm lrv_xmm0;
|
|
La_x86_64_xmm lrv_xmm1;
|
|
long double lrv_st0;
|
|
long double lrv_st1;
|
|
La_x86_64_vector lrv_vector0;
|
|
La_x86_64_vector lrv_vector1;
|
|
} La_x86_64_retval;
|
|
|
|
#define La_x32_regs La_x86_64_regs
|
|
#define La_x32_retval La_x86_64_retval
|
|
|
|
__BEGIN_DECLS
|
|
|
|
extern Elf64_Addr la_x86_64_gnu_pltenter (Elf64_Sym *__sym,
|
|
unsigned int __ndx,
|
|
uintptr_t *__refcook,
|
|
uintptr_t *__defcook,
|
|
La_x86_64_regs *__regs,
|
|
unsigned int *__flags,
|
|
const char *__symname,
|
|
long int *__framesizep);
|
|
extern unsigned int la_x86_64_gnu_pltexit (Elf64_Sym *__sym,
|
|
unsigned int __ndx,
|
|
uintptr_t *__refcook,
|
|
uintptr_t *__defcook,
|
|
const La_x86_64_regs *__inregs,
|
|
La_x86_64_retval *__outregs,
|
|
const char *__symname);
|
|
|
|
extern Elf32_Addr la_x32_gnu_pltenter (Elf32_Sym *__sym,
|
|
unsigned int __ndx,
|
|
uintptr_t *__refcook,
|
|
uintptr_t *__defcook,
|
|
La_x32_regs *__regs,
|
|
unsigned int *__flags,
|
|
const char *__symname,
|
|
long int *__framesizep);
|
|
extern unsigned int la_x32_gnu_pltexit (Elf32_Sym *__sym,
|
|
unsigned int __ndx,
|
|
uintptr_t *__refcook,
|
|
uintptr_t *__defcook,
|
|
const La_x32_regs *__inregs,
|
|
La_x32_retval *__outregs,
|
|
const char *__symname);
|
|
|
|
__END_DECLS
|
|
|
|
#endif
|