gcc/libgcc/config/rs6000/morestack.S
Alan Modra cd6ca96f5d [POWER10] __morestack calls from pcrel code
Compiling gcc/testsuite/gcc.dg/split-*.c and others with -mcpu=power10
and linking with a non-pcrel libgcc results in crashes due to the
power10 pcrel code not having r2 set for the generic-morestack.c
functions called from __morestack.  There is also a problem when
non-pcrel code calls a pcrel libgcc.  See the patch comments.

A similar situation theoretically occurs with ELFv1 multi-toc
executables, when __morestack might be located in a different toc
group to its caller.  This patch makes no attempt to fix that, since
the gold linker does not support multi-toc (gold is needed for proper
support of -fsplit-stack code) nor does gcc emit __morestack calls
that support multi-toc.

	* config/rs6000/morestack.S (R2_SAVE): Define.
	(__morestack): Save and restore r2.  Set up r2 for called
	functions.
2021-07-15 15:27:09 +09:30

408 lines
11 KiB
ArmAsm

#ifdef __powerpc64__
# PowerPC64 support for -fsplit-stack.
# Copyright (C) 2009-2021 Free Software Foundation, Inc.
# Contributed by Alan Modra <amodra@gmail.com>.
# This file is part of GCC.
# GCC is free software; you can redistribute it and/or modify it under
# the terms of the GNU General Public License as published by the Free
# Software Foundation; either version 3, or (at your option) any later
# version.
# GCC is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
# for more details.
# Under Section 7 of GPL version 3, you are granted additional
# permissions described in the GCC Runtime Library Exception, version
# 3.1, as published by the Free Software Foundation.
# You should have received a copy of the GNU General Public License and
# a copy of the GCC Runtime Library Exception along with this program;
# see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
# <http://www.gnu.org/licenses/>.
#if _CALL_ELF == 2
.abiversion 2
#define PARAMS 32
#else
#define PARAMS 48
#endif
#define MORESTACK_FRAMESIZE (PARAMS+96)
#define R2_SAVE -MORESTACK_FRAMESIZE+PARAMS-8
#define PARAMREG_SAVE -MORESTACK_FRAMESIZE+PARAMS+0
#define STATIC_CHAIN_SAVE -MORESTACK_FRAMESIZE+PARAMS+64
#define R29_SAVE -MORESTACK_FRAMESIZE+PARAMS+72
#define LINKREG_SAVE -MORESTACK_FRAMESIZE+PARAMS+80
#define NEWSTACKSIZE_SAVE -MORESTACK_FRAMESIZE+PARAMS+88
# Excess space needed to call ld.so resolver for lazy plt
# resolution. Go uses sigaltstack so this doesn't need to
# also cover signal frame size.
#define BACKOFF 4096
# Large excess allocated when calling non-split-stack code.
#define NON_SPLIT_STACK 0x100000
#if _CALL_ELF == 2
#define BODY_LABEL(name) name
#define ENTRY0(name) \
.global name; \
.hidden name; \
.type name,@function; \
name##:
#ifdef __PCREL__
#define ENTRY(name) \
ENTRY0(name); \
.localentry name, 1
#define JUMP_TARGET(name) name##@notoc
#else
#define ENTRY(name) \
ENTRY0(name); \
0: addis %r2,%r12,.TOC.-0b@ha; \
addi %r2,%r2,.TOC.-0b@l; \
.localentry name, .-name
#endif
#else
#define BODY_LABEL(name) .L.##name
#define ENTRY0(name) \
.global name; \
.hidden name; \
.type name,@function; \
.pushsection ".opd","aw"; \
.p2align 3; \
name##: .quad BODY_LABEL (name), .TOC.@tocbase, 0; \
.popsection; \
BODY_LABEL(name)##:
#define ENTRY(name) ENTRY0(name)
#endif
#define SIZE(name) .size name, .-BODY_LABEL(name)
#ifndef JUMP_TARGET
#define JUMP_TARGET(name) name
#endif
.text
# Just like __morestack, but with larger excess allocation
ENTRY0(__morestack_non_split)
.LFB1:
.cfi_startproc
# We use a cleanup to restore the tcbhead_t.__private_ss if
# an exception is thrown through this code.
#ifdef __PIC__
.cfi_personality 0x9b,DW.ref.__gcc_personality_v0
.cfi_lsda 0x1b,.LLSDA1
#else
.cfi_personality 0x3,__gcc_personality_v0
.cfi_lsda 0x3,.LLSDA1
#endif
# LR is already saved by the split-stack prologue code.
# We may as well have the unwinder skip over the call in the
# prologue too.
.cfi_offset %lr,16
addis %r12,%r12,-NON_SPLIT_STACK@h
SIZE (__morestack_non_split)
# Fall through into __morestack
# This function is called with non-standard calling conventions.
# On entry, r12 is the requested stack pointer. One version of the
# split-stack prologue that calls __morestack looks like
# ld %r0,-0x7000-64(%r13)
# addis %r12,%r1,-allocate@ha
# addi %r12,%r12,-allocate@l
# cmpld %r12,%r0
# bge+ enough
# mflr %r0
# std %r0,16(%r1)
# bl __morestack
# ld %r0,16(%r1)
# mtlr %r0
# blr
# enough:
# The normal function prologue follows here, with a small addition at
# the end to set up the arg pointer. The arg pointer is set up with:
# addi %r12,%r1,offset
# bge %cr7,.+8
# mr %r12,%r29
#
# Note that the lr save slot 16(%r1) has already been used.
# r3 thru r11 possibly contain arguments and a static chain
# pointer for the function we're calling, so must be preserved.
# cr7 must also be preserved.
ENTRY0(__morestack)
#if _CALL_ELF == 2
# Functions with localentry bits of zero cannot make calls if those
# calls might change r2. This is true generally, and also true for
# __morestack with its special calling convention. When __morestack's
# caller is non-pcrel but libgcc is pcrel, the functions called here
# might modify r2. r2 must be preserved on exit, and also restored
# for the call back to our caller.
std %r2,R2_SAVE(%r1)
#endif
# Save parameter passing registers, our arguments, lr, r29
# and use r29 as a frame pointer.
std %r3,PARAMREG_SAVE+0(%r1)
sub %r3,%r1,%r12 # calculate requested stack size
mflr %r12
std %r4,PARAMREG_SAVE+8(%r1)
std %r5,PARAMREG_SAVE+16(%r1)
std %r6,PARAMREG_SAVE+24(%r1)
std %r7,PARAMREG_SAVE+32(%r1)
addi %r3,%r3,BACKOFF
std %r8,PARAMREG_SAVE+40(%r1)
std %r9,PARAMREG_SAVE+48(%r1)
std %r10,PARAMREG_SAVE+56(%r1)
std %r11,STATIC_CHAIN_SAVE(%r1)
std %r29,R29_SAVE(%r1)
std %r12,LINKREG_SAVE(%r1)
std %r3,NEWSTACKSIZE_SAVE(%r1) # new stack size
mr %r29,%r1
#if _CALL_ELF == 2
.cfi_offset %r2,R2_SAVE
#endif
.cfi_offset %r29,R29_SAVE
.cfi_def_cfa_register %r29
stdu %r1,-MORESTACK_FRAMESIZE(%r1)
#if _CALL_ELF == 2 && !defined __PCREL__
# If this isn't a pcrel libgcc then the functions we call here will
# require r2 to be valid. If __morestack is called from pcrel code r2
# won't be valid. Set it up.
bcl 20,31,1f
1:
mflr %r12
addis %r2,%r12,.TOC.-1b@ha
addi %r2,%r2,.TOC.-1b@l
#endif
# void __morestack_block_signals (void)
bl JUMP_TARGET(__morestack_block_signals)
# void *__generic_morestack (size_t *pframe_size,
# void *old_stack,
# size_t param_size)
addi %r3,%r29,NEWSTACKSIZE_SAVE
mr %r4,%r29
li %r5,0 # no copying from old stack
bl JUMP_TARGET(__generic_morestack)
# Start using new stack
stdu %r29,-32(%r3) # back-chain
mr %r1,%r3
# Set __private_ss stack guard for the new stack.
ld %r12,NEWSTACKSIZE_SAVE(%r29) # modified size
addi %r3,%r3,BACKOFF-32
sub %r3,%r3,%r12
# Note that a signal frame has $pc pointing at the instruction
# where the signal occurred. For something like a timer
# interrupt this means the instruction has already executed,
# thus the region starts at the instruction modifying
# __private_ss, not one instruction after.
.LEHB0:
std %r3,-0x7000-64(%r13) # tcbhead_t.__private_ss
# void __morestack_unblock_signals (void)
bl JUMP_TARGET(__morestack_unblock_signals)
# Set up for a call to the target function, located 3
# instructions after __morestack's return address.
#
ld %r12,LINKREG_SAVE(%r29)
#if _CALL_ELF == 2
ld %r2,R2_SAVE(%r29)
#endif
ld %r3,PARAMREG_SAVE+0(%r29) # restore arg regs
ld %r4,PARAMREG_SAVE+8(%r29)
ld %r5,PARAMREG_SAVE+16(%r29)
ld %r6,PARAMREG_SAVE+24(%r29)
ld %r7,PARAMREG_SAVE+32(%r29)
ld %r8,PARAMREG_SAVE+40(%r29)
ld %r9,PARAMREG_SAVE+48(%r29)
addi %r0,%r12,12 # add 3 instructions
ld %r10,PARAMREG_SAVE+56(%r29)
ld %r11,STATIC_CHAIN_SAVE(%r29)
cmpld %cr7,%r12,%r0 # indicate we were called
mtctr %r0
bctrl # call caller!
# On return, save regs possibly used to return a value, and
# possibly trashed by calls to __morestack_block_signals,
# __generic_releasestack and __morestack_unblock_signals.
# Assume those calls don't use vector or floating point regs.
std %r3,PARAMREG_SAVE+0(%r29)
std %r4,PARAMREG_SAVE+8(%r29)
std %r5,PARAMREG_SAVE+16(%r29)
std %r6,PARAMREG_SAVE+24(%r29)
#if _CALL_ELF == 2
std %r7,PARAMREG_SAVE+32(%r29)
std %r8,PARAMREG_SAVE+40(%r29)
std %r9,PARAMREG_SAVE+48(%r29)
std %r10,PARAMREG_SAVE+56(%r29)
#endif
#if _CALL_ELF == 2 && !defined __PCREL__
# r2 was restored for calling back into our caller. Set it up again.
bcl 20,31,1f
1:
mflr %r12
addis %r2,%r12,.TOC.-1b@ha
addi %r2,%r2,.TOC.-1b@l
#endif
bl JUMP_TARGET(__morestack_block_signals)
# void *__generic_releasestack (size_t *pavailable)
addi %r3,%r29,NEWSTACKSIZE_SAVE
bl JUMP_TARGET(__generic_releasestack)
# Reset __private_ss stack guard to value for old stack
ld %r12,NEWSTACKSIZE_SAVE(%r29)
addi %r3,%r3,BACKOFF
sub %r3,%r3,%r12
.LEHE0:
std %r3,-0x7000-64(%r13) # tcbhead_t.__private_ss
bl JUMP_TARGET(__morestack_unblock_signals)
# Use old stack again.
mr %r1,%r29
# Restore return value regs, and return.
ld %r0,LINKREG_SAVE(%r29)
mtlr %r0
#if _CALL_ELF == 2
ld %r2,R2_SAVE(%r29)
#endif
ld %r3,PARAMREG_SAVE+0(%r29)
ld %r4,PARAMREG_SAVE+8(%r29)
ld %r5,PARAMREG_SAVE+16(%r29)
ld %r6,PARAMREG_SAVE+24(%r29)
#if _CALL_ELF == 2
ld %r7,PARAMREG_SAVE+32(%r29)
ld %r8,PARAMREG_SAVE+40(%r29)
ld %r9,PARAMREG_SAVE+48(%r29)
ld %r10,PARAMREG_SAVE+56(%r29)
#endif
ld %r29,R29_SAVE(%r29)
.cfi_def_cfa_register %r1
blr
# This is the cleanup code called by the stack unwinder when
# unwinding through code between .LEHB0 and .LEHE0 above.
cleanup:
.cfi_def_cfa_register %r29
std %r3,PARAMREG_SAVE(%r29) # Save exception header
# size_t __generic_findstack (void *stack)
mr %r3,%r29
bl JUMP_TARGET(__generic_findstack)
sub %r3,%r29,%r3
addi %r3,%r3,BACKOFF
std %r3,-0x7000-64(%r13) # tcbhead_t.__private_ss
ld %r3,PARAMREG_SAVE(%r29)
bl JUMP_TARGET(_Unwind_Resume)
#ifndef __PCREL__
nop
#endif
.cfi_endproc
SIZE (__morestack)
.section .gcc_except_table,"a",@progbits
.p2align 2
.LLSDA1:
.byte 0xff # @LPStart format (omit)
.byte 0xff # @TType format (omit)
.byte 0x1 # call-site format (uleb128)
.uleb128 .LLSDACSE1-.LLSDACSB1 # Call-site table length
.LLSDACSB1:
.uleb128 .LEHB0-.LFB1 # region 0 start
.uleb128 .LEHE0-.LEHB0 # length
.uleb128 cleanup-.LFB1 # landing pad
.uleb128 0 # no action, ie. a cleanup
.LLSDACSE1:
#ifdef __PIC__
# Build a position independent reference to the personality function.
.hidden DW.ref.__gcc_personality_v0
.weak DW.ref.__gcc_personality_v0
.section .data.DW.ref.__gcc_personality_v0,"awG",@progbits,DW.ref.__gcc_personality_v0,comdat
.p2align 3
DW.ref.__gcc_personality_v0:
.quad __gcc_personality_v0
.type DW.ref.__gcc_personality_v0, @object
.size DW.ref.__gcc_personality_v0, 8
#endif
.text
# Initialize the stack guard when the program starts or when a
# new thread starts. This is called from a constructor.
# void __stack_split_initialize (void)
ENTRY(__stack_split_initialize)
.cfi_startproc
addi %r3,%r1,-0x4000 # We should have at least 16K.
std %r3,-0x7000-64(%r13) # tcbhead_t.__private_ss
# void __generic_morestack_set_initial_sp (void *sp, size_t len)
mr %r3,%r1
li %r4, 0x4000
b JUMP_TARGET(__generic_morestack_set_initial_sp)
# The lack of .cfi_endproc here is deliberate. This function and the
# following ones can all use the default FDE.
SIZE (__stack_split_initialize)
# Return current __private_ss
# void *__morestack_get_guard (void)
ENTRY0(__morestack_get_guard)
ld %r3,-0x7000-64(%r13) # tcbhead_t.__private_ss
blr
SIZE (__morestack_get_guard)
# Set __private_ss
# void __morestack_set_guard (void *ptr)
ENTRY0(__morestack_set_guard)
std %r3,-0x7000-64(%r13) # tcbhead_t.__private_ss
blr
SIZE (__morestack_set_guard)
# Return the stack guard value for given stack
# void *__morestack_make_guard (void *stack, size_t size)
ENTRY0(__morestack_make_guard)
sub %r3,%r3,%r4
addi %r3,%r3,BACKOFF
blr
.cfi_endproc
SIZE (__morestack_make_guard)
# Make __stack_split_initialize a high priority constructor.
.section .ctors.65535,"aw",@progbits
.p2align 3
.quad __stack_split_initialize
.quad __morestack_load_mmap
.section .note.GNU-stack,"",@progbits
.section .note.GNU-split-stack,"",@progbits
.section .note.GNU-no-split-stack,"",@progbits
#endif /* __powerpc64__ */