mirror of
https://sourceware.org/git/glibc.git
synced 2024-11-30 08:40:07 +00:00
5cdd1989d1
Starting with z13, vector registers can also occur as argument registers. Thus the passed input/output register structs for la_s390_[32|64]_gnu_plt[enter|exit] functions should reflect those new registers. This patch extends these structs La_s390_regs and La_s390_retval and adjusts _dl_runtime_profile() to handle those fields in case of running on a z13 machine. ChangeLog: * sysdeps/s390/bits/link.h: (La_s390_vr) New typedef. (La_s390_32_regs): Append vector register lr_v24-lr_v31. (La_s390_64_regs): Likewise. (La_s390_32_retval): Append vector register lrv_v24. (La_s390_64_retval): Likewise. * sysdeps/s390/s390-32/dl-trampoline.h (_dl_runtime_profile): Handle extended structs La_s390_32_regs and La_s390_32_retval. * sysdeps/s390/s390-64/dl-trampoline.h (_dl_runtime_profile): Handle extended structs La_s390_64_regs and La_s390_64_retval.
226 lines
6.8 KiB
C
226 lines
6.8 KiB
C
/* PLT trampolines.  s390x version.
   Copyright (C) 2016 Free Software Foundation, Inc.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <http://www.gnu.org/licenses/>.  */

/* The PLT stubs will call _dl_runtime_resolve/_dl_runtime_profile
 * with the following linkage:
 *   r2 - r6 : parameter registers
 *   f0, f2, f4, f6 : floating point parameter registers
 *   v24, v26, v28, v30, v25, v27, v29, v31 : vector parameter registers
 *   48(r15), 56(r15) : PLT arguments PLT1, PLT2
 *   160(r15) : additional stack parameters
 * The normal clobber rules for function calls apply:
 *   r0 - r5 : call clobbered
 *   r6 - r13 : call saved
 *   r14 : return address (call clobbered)
 *   r15 : stack pointer (call saved)
 *   f0 - f7 : call clobbered
 *   f8 - f15 : call saved
 *   v0 - v7 : bytes 0-7 overlap with f0-f7: call clobbered
 *             bytes 8-15: call clobbered
 *   v8 - v15 : bytes 0-7 overlap with f8-f15: call saved
 *              bytes 8-15: call clobbered
 *   v16 - v31 : call clobbered
 */

/* _dl_runtime_resolve -- lazy-binding trampoline entered from a PLT stub.

   On entry r2-r5 may hold arguments of the function that is still to
   be resolved, f0/f2/f4/f6 may hold floating point arguments and
   48(r15)/56(r15) hold the two PLT arguments.  The routine

     1. stores r2-r5, r14 and f0/f2/f4/f6 at offsets 64..128 from the
	incoming r15,
     2. allocates its own frame: 160 bytes, or 288 bytes when
	RESTORE_VRS is defined so that v24-v31 fit at 160..287,
     3. calls _dl_fixup with the two PLT arguments in r2/r3,
     4. restores the saved registers and branches to the address that
	_dl_fixup returned in r2.

   r6 is call saved and therefore not stored here.  All cfi_offset
   values are relative to a CFA of "incoming r15 + 160".  */
	.globl _dl_runtime_resolve
	.type _dl_runtime_resolve, @function
	cfi_startproc
	.align 16
_dl_runtime_resolve:
	stmg   %r2,%r5,64(%r15)		# save call-clobbered argument gprs
	cfi_offset (r2, -96)
	cfi_offset (r3, -88)
	cfi_offset (r4, -80)
	cfi_offset (r5, -72)
	std    %f0,104(%r15)		# save floating point argument regs
	cfi_offset (f0, -56)
	std    %f2,112(%r15)
	cfi_offset (f2, -48)
	std    %f4,120(%r15)
	cfi_offset (f4, -40)
	std    %f6,128(%r15)
	cfi_offset (f6, -32)
	stg    %r14,96(%r15)		# return address is clobbered by brasl
	cfi_offset (r14, -64)
	lmg    %r2,%r3,48(%r15)		# load args for fixup saved by PLT
	lgr    %r0,%r15			# keep incoming r15 for the backchain
#ifdef RESTORE_VRS
	aghi   %r15,-288		# create stack frame: 160 + 8 * 16
	cfi_adjust_cfa_offset (288)
	.machine push
	.machine "z13"
	vstm   %v24,%v31,160(%r15)	# store call-clobbered vector arg regs
	cfi_offset (v24, -288)
	cfi_offset (v25, -272)
	cfi_offset (v26, -256)
	cfi_offset (v27, -240)
	cfi_offset (v28, -224)
	cfi_offset (v29, -208)
	cfi_offset (v30, -192)
	cfi_offset (v31, -176)
	.machine pop
#else
	aghi   %r15,-160		# create stack frame
	cfi_adjust_cfa_offset (160)
#endif
	stg    %r0,0(%r15)		# write backchain
	brasl  %r14,_dl_fixup		# call _dl_fixup
	lgr    %r1,%r2			# function addr returned in r2
#ifdef RESTORE_VRS
	.machine push
	.machine "z13"
	vlm    %v24,%v31,160(%r15)	# restore vector argument registers
	.machine pop
	aghi   %r15,288			# remove stack frame
	cfi_adjust_cfa_offset (-288)
#else
	aghi   %r15,160			# remove stack frame
	cfi_adjust_cfa_offset (-160)
#endif
	lg     %r14,96(%r15)		# restore registers saved on entry
	ld     %f0,104(%r15)
	ld     %f2,112(%r15)
	ld     %f4,120(%r15)
	ld     %f6,128(%r15)
	lmg    %r2,%r5,64(%r15)
	br     %r1			# continue in the resolved function
	cfi_endproc
	.size _dl_runtime_resolve, .-_dl_runtime_resolve

#ifndef PROF
/* _dl_runtime_profile -- PLT trampoline that calls _dl_profile_fixup
   and, if requested, _dl_call_pltexit around the resolved function.

   r12 is set to the incoming r15 and stays the CFA base register
   (CFA = r12 + 160) while the stack pointer moves.

   Slots used relative to r12 (the incoming r15):
      24  saved r12
      32  saved r14
      40  long int framesize, written by _dl_profile_fixup
      48  PLT argument PLT1
      56  PLT argument PLT2
      64  pointer to struct La_s390_64_regs
      72  struct La_s390_64_retval: r2, then f0 at 80 and, when
	  RESTORE_VRS is defined, v24 at 88

   Own frame of 360 bytes relative to the new r15:
       0  backchain
     160  struct La_s390_64_regs: r2-r6, then f0/f2/f4/f6 at 200 and,
	  when RESTORE_VRS is defined, v24-v31 at 232

   After _dl_profile_fixup returns:
     framesize <  0  tail-call the resolved function, no pltexit call
     framesize == 0  call the function, then _dl_call_pltexit
     framesize >  0  as for 0, but first copy framesize bytes
		     (rounded up to a multiple of 8) of stack
		     parameters from 160(r12) into a new frame.  */
	.globl _dl_runtime_profile
	.type _dl_runtime_profile, @function
	cfi_startproc
	.align 16
_dl_runtime_profile:
	stg    %r12,24(%r15)		# r12 is used as backup of r15
	cfi_offset (r12, -136)
	stg    %r14,32(%r15)
	cfi_offset (r14, -128)
	lgr    %r12,%r15		# backup stack pointer
	cfi_def_cfa_register (12)
	aghi   %r15,-360		# frame: 160 + sizeof (La_s390_64_regs)
	stg    %r12,0(%r15)		# save backchain

	/* Fill struct La_s390_64_regs.  r6 is stored as well because it
	   is overwritten below with the fifth _dl_profile_fixup argument.  */
	stmg   %r2,%r6,160(%r15)
	cfi_offset (r2, -360)
	cfi_offset (r3, -352)
	cfi_offset (r4, -344)
	cfi_offset (r5, -336)
	cfi_offset (r6, -328)
	std    %f0,200(%r15)
	cfi_offset (f0, -320)
	std    %f2,208(%r15)
	cfi_offset (f2, -312)
	std    %f4,216(%r15)
	cfi_offset (f4, -304)
	std    %f6,224(%r15)
	cfi_offset (f6, -296)
#ifdef RESTORE_VRS
	.machine push
	.machine "z13"
	vstm   %v24,%v31,232(%r15)	# store call-clobbered vector arguments
	cfi_offset (v24, -288)
	cfi_offset (v25, -272)
	cfi_offset (v26, -256)
	cfi_offset (v27, -240)
	cfi_offset (v28, -224)
	cfi_offset (v29, -208)
	cfi_offset (v30, -192)
	cfi_offset (v31, -176)
	.machine pop
#endif
	lmg    %r2,%r3,48(%r12)		# load arguments saved by PLT
	lgr    %r4,%r14			# return address as third parameter
	la     %r5,160(%r15)		# pointer to struct La_s390_64_regs
	la     %r6,40(%r12)		# long int * framesize
	brasl  %r14,_dl_profile_fixup	# call resolver
	lgr    %r1,%r2			# function addr returned in r2
	ld     %f0,200(%r15)		# restore call-clobbered arg fprs
	ld     %f2,208(%r15)
	ld     %f4,216(%r15)
	ld     %f6,224(%r15)
#ifdef RESTORE_VRS
	.machine push
	.machine "z13"
	vlm    %v24,%v31,232(%r15)	# restore call-clobbered arg vrs
	.machine pop
#endif
	lg     %r0,40(%r12)		# load framesize
	ltgr   %r0,%r0			# set condition code from framesize
	jnm    1f			# framesize >= 0: pltexit path

	/* framesize < 0 means no pltexit call, so we can do a tail call
	   without copying the arg overflow area.  */
	lmg    %r2,%r6,160(%r15)	# restore arg gprs and r6
	lgr    %r15,%r12		# remove stack frame
	cfi_def_cfa_register (15)
	lg     %r14,32(%r15)		# restore registers
	lg     %r12,24(%r15)
	br     %r1			# tail-call to resolved function

	/* Unwind state for the code below: the frame still exists and
	   r12 is the CFA base register again.  */
	cfi_def_cfa_register (12)
1:	la     %r4,160(%r15)		# pointer to struct La_s390_64_regs
	stg    %r4,64(%r12)		# kept for the _dl_call_pltexit call
	/* la and stg do not change the condition code, so this branch
	   still tests the result of the ltgr above.  */
	jz     4f			# framesize == 0 ?
	aghi   %r0,7			# align framesize to 8
	nill   %r0,0xfff8		# and-immediate on the low 16 bits only
	slgr   %r15,%r0			# make room for framesize bytes
	stg    %r12,0(%r15)		# save backchain
	la     %r2,160(%r15)		# destination of the parameter copy
	la     %r3,160(%r12)		# source: stack parameters of caller
	srlg   %r0,%r0,3		# number of 8 byte chunks to copy
3:	mvc    0(8,%r2),0(%r3)		# copy additional parameters
	la     %r2,8(%r2)		# depending on framesize
	la     %r3,8(%r3)
	brctg  %r0,3b
4:	lmg    %r2,%r6,0(%r4)		# restore call-clobbered arg gprs
	basr   %r14,%r1			# call resolved function
	stg    %r2,72(%r12)		# store return values r2, f0
	std    %f0,80(%r12)		# to struct La_s390_64_retval
#ifdef RESTORE_VRS
	.machine push
	.machine "z13"
	vst    %v24,88(%r12)		# store return value v24
	.machine pop
#endif
	/* r2, r3: arguments saved by PLT.
	   r4: pointer to struct La_s390_64_regs stored at 64(r12).  */
	lmg    %r2,%r4,48(%r12)
	la     %r5,72(%r12)		# pointer to struct La_s390_64_retval
	brasl  %r14,_dl_call_pltexit

	lgr    %r15,%r12		# remove stack frame
	cfi_def_cfa_register (15)
	lg     %r14,32(%r15)		# restore registers
	lg     %r12,24(%r15)
	lg     %r2,72(%r15)		# restore return values
	ld     %f0,80(%r15)
#ifdef RESTORE_VRS
	.machine push
	.machine "z13"
	vl     %v24,88(%r15)		# restore return value v24
	.machine pop
#endif
	br     %r14			# Jump back to caller

	cfi_endproc
	.size _dl_runtime_profile, .-_dl_runtime_profile
#endif