/* Copyright (C) 2008-2021 Free Software Foundation, Inc. Contributed by Richard Henderson . This file is part of the GNU Transactional Memory Library (libitm). Libitm is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3 of the License, or (at your option) any later version. Libitm is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. Under Section 7 of GPL version 3, you are granted additional permissions described in the GCC Runtime Library Exception, version 3.1, as published by the Free Software Foundation. You should have received a copy of the GNU General Public License and a copy of the GCC Runtime Library Exception along with this program; see the files COPYING3 and COPYING.RUNTIME respectively. If not, see . */ #include "asmcfi.h" #include "config.h" #include "cet.h" #define CONCAT1(a, b) CONCAT2(a, b) #define CONCAT2(a, b) a ## b #ifdef __USER_LABEL_PREFIX__ # define SYM(x) CONCAT1 (__USER_LABEL_PREFIX__, x) #else # define SYM(x) x #endif #ifdef __ELF__ # define TYPE(x) .type SYM(x), @function # define SIZE(x) .size SYM(x), . - SYM(x) # ifdef HAVE_ATTRIBUTE_VISIBILITY # define HIDDEN(x) .hidden SYM(x) # else # define HIDDEN(x) # endif #else # define TYPE(x) # define SIZE(x) # ifdef __MACH__ # define HIDDEN(x) .private_extern SYM(x) # else # define HIDDEN(x) # endif #endif /* These are duplicates of the canonical definitions in libitm.h. Note that the code relies on pr_uninstrumentedCode == a_runUninstrumentedCode. */ #define pr_uninstrumentedCode 0x02 #define pr_hasNoAbort 0x08 #define pr_HTMRetryableAbort 0x800000 #define pr_HTMRetriedAfterAbort 0x1000000 #define a_runInstrumentedCode 0x01 #define a_runUninstrumentedCode 0x02 #define a_tryHTMFastPath 0x20 #define _XABORT_EXPLICIT (1 << 0) #define _XABORT_RETRY (1 << 1) .text .align 4 .globl SYM(_ITM_beginTransaction) SYM(_ITM_beginTransaction): cfi_startproc _CET_ENDBR #ifdef __x86_64__ #ifdef HAVE_AS_RTM /* Custom HTM fast path. We start the HW transaction here and let gtm_thread::begin_transaction (aka GTM_begin_transaction) decide how to proceed on aborts: We either retry the fast path, or fall back to another execution method. RTM restores all registers after a HW transaction abort, so we can do the SW setjmp after aborts, and we have to because we might choose a SW fall back. However, we have to explicitly save/restore the first argument (edi). The htm_fastpath field is the second int in gtm_rwlock. */ cmpl $0, (SYM(gtm_serial_lock)+4)(%rip) jz .Lno_htm testl $pr_hasNoAbort, %edi jz .Lno_htm .Lhtm_fastpath: xbegin .Ltxn_abort /* Monitor the serial lock (specifically, the 32b writer/summary field at its start), and only continue if there is no serial-mode transaction. Note that we might be just a nested transaction and our outermost transaction might be in serial mode; we check for this case in the retry policy implementation. */ cmpl $0, SYM(gtm_serial_lock)(%rip) jnz 1f /* Now also check that HW transactions are still allowed to run (see gtm_thread::begin_transaction for why this is necessary). */ cmpl $0, (SYM(gtm_serial_lock)+4)(%rip) jz 1f /* Everything is good. Run the transaction, preferably using the uninstrumented code path. Note that the following works because pr_uninstrumentedCode == a_runUninstrumentedCode. */ andl $pr_uninstrumentedCode, %edi mov $a_runInstrumentedCode, %eax cmovnz %edi, %eax ret /* There is a serial-mode transaction or HW transactions are not allowed anymore, so abort (see htm_abort() regarding the abort code). */ 1: xabort $0xff .Ltxn_abort: /* If it might make sense to retry the HTM fast path, let the C++ code decide. */ testl $(_XABORT_RETRY|_XABORT_EXPLICIT), %eax jz .Lno_htm orl $pr_HTMRetryableAbort, %edi /* Let the C++ code handle the retry policy. */ .Lno_htm: #endif leaq 8(%rsp), %rax subq $72, %rsp cfi_adjust_cfa_offset(72) /* Store edi for future HTM fast path retries. We use a stack slot lower than the jmpbuf so that the jmpbuf's rip field will overlap with the proper return address on the stack. */ movl %edi, (%rsp) /* Save the jmpbuf for any non-HTM-fastpath execution method. Because rsp-based addressing is 1 byte larger and we've got rax handy, use it. */ movq %rax, -72(%rax) movq %rbx, -64(%rax) movq %rbp, -56(%rax) movq %r12, -48(%rax) movq %r13, -40(%rax) movq %r14, -32(%rax) movq %r15, -24(%rax) xorq %rdx, %rdx /* Save zero or shadow stack pointer in the new field. */ #if defined __SHSTK__ && defined __CET__ && (__CET__ & 2) != 0 rdsspq %rdx #endif movq %rdx, -16(%rax) leaq -72(%rax), %rsi call SYM(GTM_begin_transaction) movl (%rsp), %edi addq $72, %rsp cfi_adjust_cfa_offset(-72) #ifdef HAVE_AS_RTM /* If a_tryHTMFastPath was returned, then we need to retry the fast path. We also restore edi and set pr_HTMRetriedAfterAbort to state that we have retried the fast path already (it's harmless if this bit is set even if we don't retry the fast path because it is checked iff pr_HTMRetryableAbort is set). We clear pr_HTMRetryableAbort because it applies to a previous HW transaction attempt. */ cmpl $a_tryHTMFastPath, %eax jnz 2f andl $(0xffffffff-pr_HTMRetryableAbort), %edi orl $pr_HTMRetriedAfterAbort, %edi jmp .Lhtm_fastpath 2: #endif #else leal 4(%esp), %ecx movl 4(%esp), %eax subl $28, %esp cfi_def_cfa_offset(32) movl %ecx, 4(%esp) movl %ebx, 8(%esp) movl %esi, 12(%esp) movl %edi, 16(%esp) movl %ebp, 20(%esp) xorl %edx, %edx /* Save zero or shadow stack pointer in the new field. */ #if defined __SHSTK__ && defined __CET__ && (__CET__ & 2) != 0 rdsspd %edx #endif movl %edx, 24(%esp) leal 4(%esp), %edx #if defined HAVE_ATTRIBUTE_VISIBILITY || !defined __PIC__ call SYM(GTM_begin_transaction) #elif defined __ELF__ call 1f 1: popl %ebx addl $_GLOBAL_OFFSET_TABLE_+[.-1b], %ebx call SYM(GTM_begin_transaction)@PLT movl 8(%esp), %ebx #else # error "Unsupported PIC sequence" #endif addl $28, %esp cfi_def_cfa_offset(4) #endif ret cfi_endproc TYPE(_ITM_beginTransaction) SIZE(_ITM_beginTransaction) .align 4 .globl SYM(GTM_longjmp) SYM(GTM_longjmp): cfi_startproc _CET_ENDBR #ifdef __x86_64__ movq (%rsi), %rcx movq 8(%rsi), %rbx movq 16(%rsi), %rbp movq 24(%rsi), %r12 movq 32(%rsi), %r13 movq 40(%rsi), %r14 movq 48(%rsi), %r15 movl %edi, %eax cfi_def_cfa(%rsi, 0) cfi_offset(%rip, 64) cfi_register(%rsp, %rcx) movq %rcx, %rsp #if defined __SHSTK__ && defined __CET__ && (__CET__ & 2) != 0 /* Check if Shadow Stack is enabled. */ xorq %rcx, %rcx rdsspq %rcx testq %rcx, %rcx je .L1 /* Calculate number of frames to skip. */ subq 56(%rsi), %rcx negq %rcx shrq $3, %rcx incq %rcx /* If # of frames is greater 255 then loop and adjust. */ cmpq $255, %rcx jbe .L3 movl $255, %edi .p2align 4,,10 .p2align 3 .L4: incsspq %rdi subq $255, %rcx cmpq $255, %rcx ja .L4 .L3: incsspq %rcx .L1: #endif jmp *64(%rsi) #else movl (%edx), %ecx movl 4(%edx), %ebx movl 8(%edx), %esi movl 12(%edx), %edi movl 16(%edx), %ebp cfi_def_cfa(%edx, 0) cfi_offset(%eip, 24) cfi_register(%esp, %ecx) movl %ecx, %esp #if defined __SHSTK__ && defined __CET__ && (__CET__ & 2) != 0 /* Check if Shadow Stack is enabled. */ xorl %ecx, %ecx rdsspd %ecx testl %ecx, %ecx je .L1 /* Calculate # of frames to skip. */ subl 20(%edx), %ecx negl %ecx shrl $2, %ecx incl %ecx /* If # of frames is greater 255 then loop and adjust. */ cmpl $255, %ecx jbe .L3 pushl %eax movl $255, %eax .p2align 4,,10 .p2align 3 .L4: incsspd %eax subl $255, %ecx cmpl $255, %ecx ja .L4 popl %eax .L3: incsspd %ecx .L1: #endif jmp *24(%edx) #endif cfi_endproc TYPE(GTM_longjmp) HIDDEN(GTM_longjmp) SIZE(GTM_longjmp) #ifdef __linux__ .section .note.GNU-stack, "", @progbits #endif