mirror of
https://sourceware.org/git/glibc.git
synced 2024-11-24 22:10:13 +00:00
9b7091415a
_dl_tlsdesc_dynamic should also preserve AMX registers which are caller-saved. Add X86_XSTATE_TILECFG_ID and X86_XSTATE_TILEDATA_ID to x86-64 TLSDESC_CALL_STATE_SAVE_MASK. Compute the AMX state size and save it in xsave_state_full_size which is only used by _dl_tlsdesc_dynamic_xsave and _dl_tlsdesc_dynamic_xsavec. This fixes the AMX part of BZ #31372. Tested on AMX processor. AMX test is enabled only for compilers with the fix for https://gcc.gnu.org/bugzilla/show_bug.cgi?id=114098 GCC 14 and GCC 11/12/13 branches have the bug fix. Reviewed-by: Sunil K Pandey <skpgkp2@gmail.com>
137 lines
4.4 KiB
C
137 lines
4.4 KiB
C
/* Assembler macros for x86.
|
|
Copyright (C) 2017-2024 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<https://www.gnu.org/licenses/>. */
|
|
|
|
#ifndef _X86_SYSDEP_H
|
|
#define _X86_SYSDEP_H 1
|
|
|
|
#include <sysdeps/generic/sysdep.h>
|
|
|
|
/* The extended state feature IDs in the state component bitmap. */
|
|
#define X86_XSTATE_X87_ID 0
|
|
#define X86_XSTATE_SSE_ID 1
|
|
#define X86_XSTATE_AVX_ID 2
|
|
#define X86_XSTATE_BNDREGS_ID 3
|
|
#define X86_XSTATE_BNDCFG_ID 4
|
|
#define X86_XSTATE_K_ID 5
|
|
#define X86_XSTATE_ZMM_H_ID 6
|
|
#define X86_XSTATE_ZMM_ID 7
|
|
#define X86_XSTATE_PKRU_ID 9
|
|
#define X86_XSTATE_TILECFG_ID 17
|
|
#define X86_XSTATE_TILEDATA_ID 18
|
|
#define X86_XSTATE_APX_F_ID 19
|
|
|
|
#ifdef __x86_64__
|
|
/* Offset for fxsave/xsave area used by _dl_runtime_resolve. Also need
|
|
space to preserve RCX, RDX, RSI, RDI, R8, R9 and RAX. It must be
|
|
aligned to 16 bytes for fxsave and 64 bytes for xsave.
|
|
|
|
NB: Is is non-zero because of the 128-byte red-zone. Some registers
|
|
are saved on stack without adjusting stack pointer first. When we
|
|
update stack pointer to allocate more space, we need to take the
|
|
red-zone into account. */
|
|
# define STATE_SAVE_OFFSET (8 * 7 + 8)
|
|
|
|
/* Save SSE, AVX, AVX512, mask, bound and APX registers. Bound and APX
|
|
registers are mutually exclusive. */
|
|
# define STATE_SAVE_MASK \
|
|
((1 << X86_XSTATE_SSE_ID) \
|
|
| (1 << X86_XSTATE_AVX_ID) \
|
|
| (1 << X86_XSTATE_BNDREGS_ID) \
|
|
| (1 << X86_XSTATE_K_ID) \
|
|
| (1 << X86_XSTATE_ZMM_H_ID) \
|
|
| (1 << X86_XSTATE_ZMM_ID) \
|
|
| (1 << X86_XSTATE_APX_F_ID))
|
|
|
|
/* AMX state mask. */
|
|
# define AMX_STATE_SAVE_MASK \
|
|
((1 << X86_XSTATE_TILECFG_ID) | (1 << X86_XSTATE_TILEDATA_ID))
|
|
|
|
/* States to be included in xsave_state_full_size. */
|
|
# define FULL_STATE_SAVE_MASK \
|
|
(STATE_SAVE_MASK | AMX_STATE_SAVE_MASK)
|
|
#else
|
|
/* Offset for fxsave/xsave area used by _dl_tlsdesc_dynamic. Since i386
|
|
doesn't have red-zone, use 0 here. */
|
|
# define STATE_SAVE_OFFSET 0
|
|
|
|
/* Save SSE, AVX, AXV512, mask and bound registers. */
|
|
# define STATE_SAVE_MASK \
|
|
((1 << X86_XSTATE_SSE_ID) \
|
|
| (1 << X86_XSTATE_AVX_ID) \
|
|
| (1 << X86_XSTATE_BNDREGS_ID) \
|
|
| (1 << X86_XSTATE_K_ID) \
|
|
| (1 << X86_XSTATE_ZMM_H_ID))
|
|
|
|
/* States to be included in xsave_state_size. */
|
|
# define FULL_STATE_SAVE_MASK STATE_SAVE_MASK
|
|
#endif
|
|
|
|
/* States which should be saved for TLSDESC_CALL and TLS_DESC_CALL.
|
|
Compiler assumes that all registers, including AMX and x87 FPU
|
|
stack registers, are unchanged after CALL, except for EFLAGS and
|
|
RAX/EAX. */
|
|
#define TLSDESC_CALL_STATE_SAVE_MASK \
|
|
(FULL_STATE_SAVE_MASK | (1 << X86_XSTATE_X87_ID))
|
|
|
|
/* Constants for bits in __x86_string_control: */
|
|
|
|
/* Avoid short distance REP MOVSB. */
|
|
#define X86_STRING_CONTROL_AVOID_SHORT_DISTANCE_REP_MOVSB (1 << 0)
|
|
|
|
#ifdef __ASSEMBLER__
|
|
|
|
/* Syntactic details of assembler. */
|
|
|
|
/* ELF uses byte-counts for .align, most others use log2 of count of bytes. */
|
|
#define ALIGNARG(log2) 1<<log2
|
|
#define ASM_SIZE_DIRECTIVE(name) .size name,.-name;
|
|
|
|
/* Common entry 16 byte aligns. */
|
|
#define ENTRY(name) ENTRY_P2ALIGN (name, 4)
|
|
|
|
#undef END
|
|
#define END(name) \
|
|
cfi_endproc; \
|
|
ASM_SIZE_DIRECTIVE(name)
|
|
|
|
#define ENTRY_CHK(name) ENTRY (name)
|
|
#define END_CHK(name) END (name)
|
|
|
|
/* Since C identifiers are not normally prefixed with an underscore
|
|
on this system, the asm identifier `syscall_error' intrudes on the
|
|
C name space. Make sure we use an innocuous name. */
|
|
#define syscall_error __syscall_error
|
|
#define mcount _mcount
|
|
|
|
#undef PSEUDO_END
|
|
#define PSEUDO_END(name) \
|
|
END (name)
|
|
|
|
/* Local label name for asm code. */
|
|
#ifndef L
|
|
/* ELF-like local names start with `.L'. */
|
|
# define LOCAL_LABEL(name) .L##name
|
|
# define L(name) LOCAL_LABEL(name)
|
|
#endif
|
|
|
|
#define atom_text_section .section ".text.atom", "ax"
|
|
|
|
#endif /* __ASSEMBLER__ */
|
|
|
|
#endif /* _X86_SYSDEP_H */
|