2005-04-17 00:20:36 +02:00
|
|
|
/*
|
|
|
|
* Compatibility mode system call entry point for x86-64.
|
|
|
|
*
|
|
|
|
* Copyright 2000-2002 Andi Kleen, SuSE Labs.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <asm/dwarf2.h>
|
|
|
|
#include <asm/calling.h>
|
2005-09-09 21:28:48 +02:00
|
|
|
#include <asm/asm-offsets.h>
|
2005-04-17 00:20:36 +02:00
|
|
|
#include <asm/current.h>
|
|
|
|
#include <asm/errno.h>
|
|
|
|
#include <asm/ia32_unistd.h>
|
|
|
|
#include <asm/thread_info.h>
|
|
|
|
#include <asm/segment.h>
|
2006-07-03 09:24:45 +02:00
|
|
|
#include <asm/irqflags.h>
|
2012-04-20 21:19:50 +02:00
|
|
|
#include <asm/asm.h>
|
2012-09-21 21:43:12 +02:00
|
|
|
#include <asm/smap.h>
|
2005-04-17 00:20:36 +02:00
|
|
|
#include <linux/linkage.h>
|
2012-01-03 20:23:06 +01:00
|
|
|
#include <linux/err.h>
|
2005-04-17 00:20:36 +02:00
|
|
|
|
2008-06-24 10:13:31 +02:00
|
|
|
/*
 * Audit architecture tag passed to __audit_syscall_entry for compat
 * (i386) system calls.
 *
 * Avoid __ASSEMBLER__'ifying <linux/audit.h> just for this.
 */
#include <linux/elf-em.h>
#define __AUDIT_ARCH_LE	   0x40000000
#define AUDIT_ARCH_I386	   (EM_386|__AUDIT_ARCH_LE)

/*
 * Without CONFIG_AUDITSYSCALL there are no dedicated audit exit paths,
 * so both fast-path "work pending" branches go straight to the common
 * ia32_ret_from_sys_call return path.
 */
#ifndef CONFIG_AUDITSYSCALL
#define sysexit_audit	ia32_ret_from_sys_call
#define sysretl_audit	ia32_ret_from_sys_call
#endif
|
|
|
|
|
2011-03-07 19:10:39 +01:00
|
|
|
.section .entry.text, "ax"
|
|
|
|
|
2005-04-17 00:20:36 +02:00
|
|
|
/*
 * IA32_ARG_FIXUP - move 32-bit syscall arguments into the 64-bit
 * C argument registers before dispatching through the syscall table.
 *
 *	%ebx (arg1) -> %edi
 *	%ecx (arg2) -> %esi   \  done with a single xchg
 *	%esi (arg4) -> %ecx   /
 *	%edx (arg3) -> %edx   (zero extended in place)
 *	%edi (arg5) -> %r8d
 *	%ebp (arg6) -> %r9d   (skipped when \noebp is non-zero)
 *
 * \noebp: pass a non-zero value when arg6 is already in %r9d and %ebp
 *	   must not be used as its source.
 *
 * All moves are 32-bit, so the upper halves of the destination
 * registers end up zero.  %edi must be copied to %r8d before it is
 * overwritten with arg1, which is why that move comes first.
 */
	.macro IA32_ARG_FIXUP noebp=0
	movl	%edi,%r8d		/* arg5; must precede the %edi overwrite */
	.if \noebp
	.else
	movl	%ebp,%r9d		/* arg6 */
	.endif
	xchg	%ecx,%esi		/* arg2 -> %esi, arg4 -> %ecx */
	movl	%ebx,%edi		/* arg1 */
	movl	%edx,%edx		/* zero extension */
	.endm
|
|
|
|
|
|
|
|
/*
 * CLEAR_RREGS - overwrite the saved R8-R11 slots of the register frame.
 *
 * \offset: added to the R8..R11 frame offsets (relative to %rsp).
 * \_r9:    register whose value is stored into the R9 slot.  Defaults
 *	    to rax, which is zero at that point, so by default all four
 *	    slots are zeroed.  Callers pass r9 to keep a live value.
 *
 * Clobbers %eax (all of %rax becomes zero) and the flags.
 */
	.macro CLEAR_RREGS offset=0, _r9=rax
	xorl	%eax,%eax
	movq	%rax,\offset+R11(%rsp)
	movq	%rax,\offset+R10(%rsp)
	movq	%\_r9,\offset+R9(%rsp)
	movq	%rax,\offset+R8(%rsp)
	.endm
|
|
|
|
|
2008-07-09 11:38:07 +02:00
|
|
|
/*
|
|
|
|
* Reload arg registers from stack in case ptrace changed them.
|
|
|
|
* We don't reload %eax because syscall_trace_enter() returned
|
2010-09-14 21:22:58 +02:00
|
|
|
* the %rax value we should see. Instead, we just truncate that
|
|
|
|
* value to 32 bits again as we did on entry from user mode.
|
|
|
|
* If it's a new value set by user_regset during entry tracing,
|
|
|
|
* this matches the normal truncation of the user-mode value.
|
|
|
|
* If it's -1 to make us punt the syscall, then (u32)-1 is still
|
|
|
|
* an appropriately invalid value.
|
2008-07-09 11:38:07 +02:00
|
|
|
*/
|
2008-08-29 14:21:11 +02:00
|
|
|
.macro LOAD_ARGS32 offset, _r9=0
|
|
|
|
.if \_r9
|
2007-09-21 16:16:18 +02:00
|
|
|
movl \offset+16(%rsp),%r9d
|
2008-08-29 14:21:11 +02:00
|
|
|
.endif
|
2007-09-21 16:16:18 +02:00
|
|
|
movl \offset+40(%rsp),%ecx
|
|
|
|
movl \offset+48(%rsp),%edx
|
|
|
|
movl \offset+56(%rsp),%esi
|
|
|
|
movl \offset+64(%rsp),%edi
|
2010-09-14 21:22:58 +02:00
|
|
|
movl %eax,%eax /* zero extension */
|
2007-09-21 16:16:18 +02:00
|
|
|
.endm
|
|
|
|
|
2006-01-11 22:41:59 +01:00
|
|
|
/*
 * CFI_STARTPROC32 - open a CFI region for a compat entry point.
 *
 * Forwards \simple to CFI_STARTPROC and then marks r8-r15 as undefined
 * for the unwinder.
 */
	.macro CFI_STARTPROC32 simple
	CFI_STARTPROC	\simple
	CFI_UNDEFINED	r8
	CFI_UNDEFINED	r9
	CFI_UNDEFINED	r10
	CFI_UNDEFINED	r11
	CFI_UNDEFINED	r12
	CFI_UNDEFINED	r13
	CFI_UNDEFINED	r14
	CFI_UNDEFINED	r15
	.endm
|
|
|
|
|
2008-06-25 06:19:28 +02:00
|
|
|
#ifdef CONFIG_PARAVIRT
/*
 * Native (bare-metal) implementations of the two 32-bit fast return
 * sequences, built only when CONFIG_PARAVIRT is enabled.
 */

/* Switch back to the user GS base and return with SYSRETL. */
ENTRY(native_usergs_sysret32)
	swapgs
	sysretl
ENDPROC(native_usergs_sysret32)

/*
 * Switch back to the user GS base, set the interrupt flag and
 * return with SYSEXIT.
 */
ENTRY(native_irq_enable_sysexit)
	swapgs
	sti
	sysexit
ENDPROC(native_irq_enable_sysexit)
#endif
|
|
|
|
|
2005-04-17 00:20:36 +02:00
|
|
|
/*
 * 32bit SYSENTER instruction entry.
 *
 * Arguments:
 * %eax	System call number.
 * %ebx Arg1
 * %ecx Arg2
 * %edx Arg3
 * %esi Arg4
 * %edi Arg5
 * %ebp user stack
 * 0(%ebp) Arg6
 *
 * Interrupts off.
 *
 * This is purely a fast path. For anything complicated we use the int 0x80
 * path below.	Set up a complete hardware stack frame to share code
 * with the int 0x80 path.
 */
ENTRY(ia32_sysenter_target)
	CFI_STARTPROC32	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,0
	CFI_REGISTER	rsp,rbp
	SWAPGS_UNSAFE_STACK
	/* Switch to the per-CPU kernel stack. */
	movq	PER_CPU_VAR(kernel_stack), %rsp
	addq	$(KERNEL_STACK_OFFSET),%rsp
	/*
	 * No need to follow this irqs on/off section: the syscall
	 * disabled irqs, here we enable it straight after entry:
	 */
	ENABLE_INTERRUPTS(CLBR_NONE)
	movl	%ebp,%ebp		/* zero extension */
	/*
	 * Build the frame by hand, in push order:
	 * SS, user RSP (from %ebp), RFLAGS, CS, RIP, orig %rax.
	 */
	pushq_cfi $__USER32_DS
	/*CFI_REL_OFFSET ss,0*/
	pushq_cfi %rbp
	CFI_REL_OFFSET rsp,0
	pushfq_cfi
	/*CFI_REL_OFFSET rflags,0*/
	/*
	 * Three quadwords have been pushed so far, hence the 3*8
	 * adjustment.  %r10d receives the thread's sysenter return
	 * address, which is pushed below as the user RIP.
	 */
	movl	TI_sysenter_return+THREAD_INFO(%rsp,3*8-KERNEL_STACK_OFFSET),%r10d
	CFI_REGISTER rip,r10
	pushq_cfi $__USER32_CS
	/*CFI_REL_OFFSET cs,0*/
	movl	%eax, %eax		/* zero extend the syscall number */
	pushq_cfi %r10
	CFI_REL_OFFSET rip,0
	pushq_cfi %rax
	cld
	SAVE_ARGS 0,1,0
	/* no need to do an access_ok check here because rbp has been
	   32bit zero extended */
	ASM_STAC
	/* Fetch arg6 from the user stack; a fault goes to ia32_badarg. */
1:	movl	(%rbp),%ebp
	_ASM_EXTABLE(1b,ia32_badarg)
	ASM_CLAC
	orl	$TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	testl	$_TIF_WORK_SYSCALL_ENTRY,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	CFI_REMEMBER_STATE
	jnz	sysenter_tracesys
	/*
	 * Bound-check the full %rax, not just %eax: the dispatch below
	 * indexes the table with %rax, and ptrace can introduce a value
	 * that is not zero extended.
	 */
	cmpq	$(IA32_NR_syscalls-1),%rax
	ja	ia32_badsys
sysenter_do_call:
	IA32_ARG_FIXUP
sysenter_dispatch:
	call	*ia32_sys_call_table(,%rax,8)
	movq	%rax,RAX-ARGOFFSET(%rsp)	/* store the return value */
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	/* Any pending exit work leaves the fast path. */
	testl	$_TIF_ALLWORK_MASK,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	jnz	sysexit_audit
sysexit_from_sys_call:
	andl	$~TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	/* clear IF (bit 0x200) so that popfq doesn't enable interrupts early */
	andl	$~0x200,EFLAGS-R11(%rsp)
	movl	RIP-R11(%rsp),%edx		/* User %eip */
	CFI_REGISTER rip,rdx
	RESTORE_ARGS 0,24,0,0,0,0
	/* Clear the 64-bit-only scratch registers before leaving. */
	xorq	%r8,%r8
	xorq	%r9,%r9
	xorq	%r10,%r10
	xorq	%r11,%r11
	popfq_cfi
	/*CFI_RESTORE rflags*/
	popq_cfi %rcx				/* User %esp */
	CFI_REGISTER rsp,rcx
	TRACE_IRQS_ON
	/* SYSEXIT resumes user mode at %edx with the stack in %ecx. */
	ENABLE_INTERRUPTS_SYSEXIT32
|
2005-04-17 00:20:36 +02:00
|
|
|
|
2008-06-24 10:13:31 +02:00
|
|
|
#ifdef CONFIG_AUDITSYSCALL
|
|
|
|
/*
 * auditsys_entry_common - report syscall entry to the audit code and
 * then set up the registers for the table dispatch.
 *
 * Expects the 32-bit entry register layout (%eax = syscall number,
 * %ebx/%ecx/%edx/%esi = args 1-4).  On exit %rax holds the bound-checked
 * syscall number and %edi/%esi/%edx/%ecx/%r8d hold syscall args 1-5.
 * %r9d (arg6) is NOT set up here; each caller reloads it itself.
 * Jumps to ia32_badsys if the syscall number is out of range.
 */
	.macro auditsys_entry_common
	movl	%esi,%r9d		/* 6th arg: 4th syscall arg */
	movl	%edx,%r8d		/* 5th arg: 3rd syscall arg */
	/* (already in %ecx)		   4th arg: 2nd syscall arg */
	movl	%ebx,%edx		/* 3rd arg: 1st syscall arg */
	movl	%eax,%esi		/* 2nd arg: syscall number */
	movl	$AUDIT_ARCH_I386,%edi	/* 1st arg: audit arch */
	call	__audit_syscall_entry
	movl	RAX-ARGOFFSET(%rsp),%eax	/* reload syscall number */
	/* The dispatch indexes with %rax, so check the full register. */
	cmpq	$(IA32_NR_syscalls-1),%rax
	ja	ia32_badsys
	/* %ebx is callee-saved, so arg1 survived the call above. */
	movl	%ebx,%edi		/* reload 1st syscall arg */
	movl	RCX-ARGOFFSET(%rsp),%esi	/* reload 2nd syscall arg */
	movl	RDX-ARGOFFSET(%rsp),%edx	/* reload 3rd syscall arg */
	movl	RSI-ARGOFFSET(%rsp),%ecx	/* reload 4th syscall arg */
	movl	RDI-ARGOFFSET(%rsp),%r8d	/* reload 5th syscall arg */
	.endm
|
|
|
|
|
2009-10-26 16:20:29 +01:00
|
|
|
/*
 * auditsys_exit - report syscall exit to the audit code, then resume
 * the fast return path if nothing else is pending.
 *
 * \exit: label of the fast return path to resume (taken when no work
 *	  flag other than _TIF_SYSCALL_AUDIT is set after the audit call).
 *
 * Expects the syscall return value in %eax and in the RAX frame slot.
 * If any work flag other than _TIF_SYSCALL_AUDIT is set on entry, the
 * audit call is skipped and control goes to ia32_ret_from_sys_call.
 */
	.macro auditsys_exit exit
	testl	$(_TIF_ALLWORK_MASK & ~_TIF_SYSCALL_AUDIT),TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	jnz	ia32_ret_from_sys_call
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	movl	%eax,%esi		/* second arg, syscall return value */
	cmpl	$-MAX_ERRNO,%eax	/* is it an error ? */
	jbe	1f
	movslq	%eax, %rsi		/* if error sign extend to 64 bits */
	/*
	 * The flags from the cmpl above are still live here (the moves
	 * do not modify them): "below or equal" means the value is not
	 * in the errno range.
	 * NOTE(review): a return of exactly -MAX_ERRNO is therefore
	 * reported as success; confirm against IS_ERR_VALUE().
	 */
1:	setbe	%al			/* 1 if success, 0 if error */
	movzbl	%al,%edi		/* zero-extend that into %edi */
	call	__audit_syscall_exit
	movq	RAX-ARGOFFSET(%rsp),%rax	/* reload syscall return value */
	movl	$(_TIF_ALLWORK_MASK & ~_TIF_SYSCALL_AUDIT),%edi
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	/* Re-check for work that showed up while interrupts were enabled. */
	testl	%edi,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	jz	\exit
	CLEAR_RREGS -ARGOFFSET
	jmp	int_with_check
	.endm
|
|
|
|
|
|
|
|
/*
 * SYSENTER entry with only syscall auditing pending: report the entry,
 * reload arg6 from %ebp and rejoin the fast path at the dispatch.
 */
sysenter_auditsys:
	CFI_RESTORE_STATE
	auditsys_entry_common
	movl	%ebp,%r9d			/* reload 6th syscall arg */
	jmp	sysenter_dispatch

/* SYSENTER exit with work flags set: audit the exit, then try SYSEXIT. */
sysexit_audit:
	auditsys_exit sysexit_from_sys_call
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/*
 * SYSENTER slow entry: some _TIF_WORK_SYSCALL_ENTRY flag is set.
 * If auditing is the only work, take the lighter sysenter_auditsys
 * path; otherwise complete the register frame and call
 * syscall_trace_enter before dispatching.
 */
sysenter_tracesys:
#ifdef CONFIG_AUDITSYSCALL
	testl	$(_TIF_WORK_SYSCALL_ENTRY & ~_TIF_SYSCALL_AUDIT),TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	jz	sysenter_auditsys
#endif
	SAVE_REST
	CLEAR_RREGS
	movq	$-ENOSYS,RAX(%rsp)/* ptrace can change this for a bad syscall */
	movq	%rsp,%rdi        /* &pt_regs -> arg1 */
	call	syscall_trace_enter
	LOAD_ARGS32 ARGOFFSET  /* reload args from stack in case ptrace changed it */
	RESTORE_REST
	/*
	 * Check the full %rax: the dispatch indexes the table with %rax
	 * and ptrace can supply a number that is not zero extended.
	 */
	cmpq	$(IA32_NR_syscalls-1),%rax
	ja	int_ret_from_sys_call /* sysenter_tracesys has set RAX(%rsp) */
	jmp	sysenter_do_call
	CFI_ENDPROC
ENDPROC(ia32_sysenter_target)
|
2005-04-17 00:20:36 +02:00
|
|
|
|
|
|
|
/*
 * 32bit SYSCALL instruction entry.
 *
 * Arguments:
 * %eax	System call number.
 * %ebx Arg1
 * %ecx return EIP
 * %edx Arg3
 * %esi Arg4
 * %edi Arg5
 * %ebp Arg2    [note: not saved in the stack frame, should not be touched]
 * %esp user stack
 * 0(%esp) Arg6
 *
 * Interrupts off.
 *
 * This is purely a fast path. For anything complicated we use the int 0x80
 * path below.	Set up a complete hardware stack frame to share code
 * with the int 0x80 path.
 */
ENTRY(ia32_cstar_target)
	CFI_STARTPROC32	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,KERNEL_STACK_OFFSET
	CFI_REGISTER	rip,rcx
	/*CFI_REGISTER	rflags,r11*/
	SWAPGS_UNSAFE_STACK
	movl	%esp,%r8d		/* user stack pointer, zero extended */
	CFI_REGISTER	rsp,r8
	movq	PER_CPU_VAR(kernel_stack),%rsp
	/*
	 * No need to follow this irqs on/off section: the syscall
	 * disabled irqs and here we enable it straight after entry:
	 */
	ENABLE_INTERRUPTS(CLBR_NONE)
	SAVE_ARGS 8,0,0
	movl	%eax,%eax	/* zero extension */
	/* Fill in the frame slots by hand. */
	movq	%rax,ORIG_RAX-ARGOFFSET(%rsp)
	movq	%rcx,RIP-ARGOFFSET(%rsp)
	CFI_REL_OFFSET rip,RIP-ARGOFFSET
	/* Arg2 arrives in %ebp; record it in the RCX slot and in %ecx. */
	movq	%rbp,RCX-ARGOFFSET(%rsp) /* this lies slightly to ptrace */
	movl	%ebp,%ecx
	movq	$__USER32_CS,CS-ARGOFFSET(%rsp)
	movq	$__USER32_DS,SS-ARGOFFSET(%rsp)
	movq	%r11,EFLAGS-ARGOFFSET(%rsp)
	/*CFI_REL_OFFSET rflags,EFLAGS-ARGOFFSET*/
	movq	%r8,RSP-ARGOFFSET(%rsp)
	CFI_REL_OFFSET rsp,RSP-ARGOFFSET
	/* no need to do an access_ok check here because r8 has been
	   32bit zero extended */
	/* hardware stack frame is complete now */
	ASM_STAC
	/* Fetch arg6 from the user stack; a fault goes to ia32_badarg. */
1:	movl	(%r8),%r9d
	_ASM_EXTABLE(1b,ia32_badarg)
	ASM_CLAC
	orl	$TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	testl	$_TIF_WORK_SYSCALL_ENTRY,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	CFI_REMEMBER_STATE
	jnz	cstar_tracesys
	/*
	 * Bound-check the full %rax, not just %eax: the dispatch below
	 * indexes the table with %rax, and ptrace can introduce a value
	 * that is not zero extended.
	 */
	cmpq	$(IA32_NR_syscalls-1),%rax
	ja	ia32_badsys
cstar_do_call:
	IA32_ARG_FIXUP 1		/* arg6 is already in %r9d */
cstar_dispatch:
	call	*ia32_sys_call_table(,%rax,8)
	movq	%rax,RAX-ARGOFFSET(%rsp)	/* store the return value */
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	/* Any pending exit work leaves the fast path. */
	testl	$_TIF_ALLWORK_MASK,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	jnz	sysretl_audit
sysretl_from_sys_call:
	andl	$~TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	RESTORE_ARGS 0,-ARG_SKIP,0,0,0
	/* SYSRET takes the return address from %rcx and flags from %r11. */
	movl	RIP-ARGOFFSET(%rsp),%ecx
	CFI_REGISTER rip,rcx
	movl	EFLAGS-ARGOFFSET(%rsp),%r11d
	/*CFI_REGISTER rflags,r11*/
	/* Clear the remaining 64-bit-only scratch registers. */
	xorq	%r10,%r10
	xorq	%r9,%r9
	xorq	%r8,%r8
	TRACE_IRQS_ON
	movl	RSP-ARGOFFSET(%rsp),%esp	/* back to the user stack */
	CFI_RESTORE rsp
	USERGS_SYSRET32
|
2005-04-17 00:20:36 +02:00
|
|
|
|
2008-06-24 10:13:31 +02:00
|
|
|
#ifdef CONFIG_AUDITSYSCALL
/*
 * SYSCALL entry with only syscall auditing pending: report the entry
 * and rejoin the fast path at the dispatch.  Arg6 lives in %r9d, which
 * auditsys_entry_common overwrites, so it is parked in the R9 frame
 * slot around the macro.
 */
cstar_auditsys:
	CFI_RESTORE_STATE
	movl	%r9d,R9-ARGOFFSET(%rsp)	/* register to be clobbered by call */
	auditsys_entry_common
	movl	R9-ARGOFFSET(%rsp),%r9d	/* reload 6th syscall arg */
	jmp	cstar_dispatch

/* SYSCALL exit with work flags set: audit the exit, then try SYSRET. */
sysretl_audit:
	auditsys_exit sysretl_from_sys_call
#endif
|
|
|
|
|
|
|
|
/*
 * SYSCALL slow entry: some _TIF_WORK_SYSCALL_ENTRY flag is set.
 * If auditing is the only work, take the lighter cstar_auditsys path;
 * otherwise complete the register frame and call syscall_trace_enter
 * before dispatching.
 *
 * On this path arg6 is in %r9d and arg2 is in %ebp.  The two are
 * swapped around the tracing call so that SAVE_REST/RESTORE_REST see
 * arg6 in %ebp, and CLEAR_RREGS is told to store %r9 (then holding
 * arg2) into the R9 slot, which LOAD_ARGS32 reloads afterwards.
 */
cstar_tracesys:
#ifdef CONFIG_AUDITSYSCALL
	testl	$(_TIF_WORK_SYSCALL_ENTRY & ~_TIF_SYSCALL_AUDIT),TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	jz	cstar_auditsys
#endif
	xchgl	%r9d,%ebp
	SAVE_REST
	CLEAR_RREGS 0, r9
	movq	$-ENOSYS,RAX(%rsp)	/* ptrace can change this for a bad syscall */
	movq	%rsp,%rdi        /* &pt_regs -> arg1 */
	call	syscall_trace_enter
	LOAD_ARGS32 ARGOFFSET, 1  /* reload args from stack in case ptrace changed it */
	RESTORE_REST
	xchgl	%ebp,%r9d
	/*
	 * Check the full %rax: the dispatch indexes the table with %rax
	 * and ptrace can supply a number that is not zero extended.
	 */
	cmpq	$(IA32_NR_syscalls-1),%rax
	ja	int_ret_from_sys_call /* cstar_tracesys has set RAX(%rsp) */
	jmp	cstar_do_call
END(ia32_cstar_target)
|
2005-04-17 00:20:36 +02:00
|
|
|
|
|
|
|
/*
 * Exception-table fixup target for the user-stack reads of arg6 in the
 * SYSENTER and SYSCALL entry paths: fail the system call with -EFAULT.
 * ASM_CLAC is repeated here because the faulting load sits between
 * ASM_STAC and ASM_CLAC in both callers.
 * The CFI_ENDPROC below closes the CFI region opened in
 * ia32_cstar_target.
 */
ia32_badarg:
	ASM_CLAC
	movq	$-EFAULT,%rax
	jmp	ia32_sysret
	CFI_ENDPROC
|
|
|
|
|
|
|
|
/*
 * Emulated IA32 system calls via int 0x80.
 *
 * Arguments:
 * %eax	System call number.
 * %ebx Arg1
 * %ecx Arg2
 * %edx Arg3
 * %esi Arg4
 * %edi Arg5
 * %ebp Arg6    [note: not saved in the stack frame, should not be touched]
 *
 * Notes:
 * Uses the same stack frame as the x86-64 version.
 * All registers except %eax must be saved (but ptrace may violate that)
 * Arguments are zero extended. For system calls that want sign extension and
 * take long arguments a wrapper is needed. Most calls can just be called
 * directly.
 * Assumes it is only called from user space and entered with interrupts off.
 */

ENTRY(ia32_syscall)
	CFI_STARTPROC32	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,SS+8-RIP
	/*CFI_REL_OFFSET	ss,SS-RIP*/
	CFI_REL_OFFSET	rsp,RSP-RIP
	/*CFI_REL_OFFSET	rflags,EFLAGS-RIP*/
	/*CFI_REL_OFFSET	cs,CS-RIP*/
	CFI_REL_OFFSET	rip,RIP-RIP
	PARAVIRT_ADJUST_EXCEPTION_FRAME
	SWAPGS
	/*
	 * No need to follow this irqs on/off section: the syscall
	 * disabled irqs and here we enable it straight after entry:
	 */
	ENABLE_INTERRUPTS(CLBR_NONE)
	movl	%eax,%eax		/* zero extend the syscall number */
	pushq_cfi %rax			/* orig %rax slot */
	cld
	/* note the registers are not zero extended to the sf.
	   this could be a problem. */
	SAVE_ARGS 0,1,0
	orl	$TS_COMPAT,TI_status+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	testl	$_TIF_WORK_SYSCALL_ENTRY,TI_flags+THREAD_INFO(%rsp,RIP-ARGOFFSET)
	jnz	ia32_tracesys
	/*
	 * Bound-check the full %rax, not just %eax: the dispatch below
	 * indexes the table with %rax, and ptrace can introduce a value
	 * that is not zero extended.
	 */
	cmpq	$(IA32_NR_syscalls-1),%rax
	ja	ia32_badsys
ia32_do_call:
	IA32_ARG_FIXUP
	call	*ia32_sys_call_table(,%rax,8) # xxx: rip relative
	/* Common exit: %rax holds the value to return to user space. */
ia32_sysret:
	movq	%rax,RAX-ARGOFFSET(%rsp)
	/* Entered here when the RAX slot has already been written. */
ia32_ret_from_sys_call:
	CLEAR_RREGS -ARGOFFSET
	jmp	int_ret_from_sys_call
|
|
|
|
|
|
|
|
/*
 * int 0x80 slow entry: some _TIF_WORK_SYSCALL_ENTRY flag is set.
 * Complete the register frame, call syscall_trace_enter, reload the
 * (possibly modified) arguments and dispatch.
 */
ia32_tracesys:
	SAVE_REST
	CLEAR_RREGS
	movq	$-ENOSYS,RAX(%rsp)	/* ptrace can change this for a bad syscall */
	movq	%rsp,%rdi        /* &pt_regs -> arg1 */
	call	syscall_trace_enter
	LOAD_ARGS32 ARGOFFSET  /* reload args from stack in case ptrace changed it */
	RESTORE_REST
	/*
	 * Check the full %rax: the dispatch indexes the table with %rax
	 * and ptrace can supply a number that is not zero extended.
	 */
	cmpq	$(IA32_NR_syscalls-1),%rax
	ja	int_ret_from_sys_call	/* ia32_tracesys has set RAX(%rsp) */
	jmp	ia32_do_call
END(ia32_syscall)
|
2005-04-17 00:20:36 +02:00
|
|
|
|
|
|
|
/*
 * Out-of-range system call number on a fast entry path: zero the
 * ORIG_RAX slot and return -ENOSYS through the common exit.
 * The CFI_ENDPROC below closes the CFI region opened in ia32_syscall.
 */
ia32_badsys:
	movq	$0,ORIG_RAX-ARGOFFSET(%rsp)
	movq	$-ENOSYS,%rax
	jmp	ia32_sysret

	CFI_ENDPROC
|
|
|
|
|
|
|
|
/*
 * PTREGSCALL - emit a global stub \label that loads the address of
 * \func into %rax and jumps to ia32_ptregs_common, which calls it with
 * the full register frame saved.
 *
 * \arg is not referenced by the macro body; it is kept so that any
 * caller still passing a third argument continues to assemble.
 */
	.macro PTREGSCALL label, func, arg
	ALIGN
GLOBAL(\label)
	leaq	\func(%rip),%rax
	jmp	ia32_ptregs_common
	.endm
|
|
|
|
|
2006-01-11 22:41:59 +01:00
|
|
|
CFI_STARTPROC32
|
2005-09-12 18:49:24 +02:00
|
|
|
|
2012-11-12 20:32:42 +01:00
|
|
|
PTREGSCALL stub32_rt_sigreturn, sys32_rt_sigreturn
|
|
|
|
PTREGSCALL stub32_sigreturn, sys32_sigreturn
|
|
|
|
PTREGSCALL stub32_execve, compat_sys_execve
|
|
|
|
PTREGSCALL stub32_fork, sys_fork
|
|
|
|
PTREGSCALL stub32_vfork, sys_vfork
|
2005-04-17 00:20:36 +02:00
|
|
|
|
2012-10-23 04:34:11 +02:00
|
|
|
ALIGN
|
|
|
|
GLOBAL(stub32_clone)
|
|
|
|
leaq sys_clone(%rip),%rax
|
|
|
|
mov %r8, %rcx
|
|
|
|
jmp ia32_ptregs_common
|
|
|
|
|
2011-11-29 12:24:10 +01:00
|
|
|
ALIGN
|
|
|
|
ia32_ptregs_common:
|
2005-04-17 00:20:36 +02:00
|
|
|
popq %r11
|
2006-01-11 22:41:59 +01:00
|
|
|
CFI_ENDPROC
|
|
|
|
CFI_STARTPROC32 simple
|
2006-09-26 10:52:41 +02:00
|
|
|
CFI_SIGNAL_FRAME
|
2006-01-11 22:41:59 +01:00
|
|
|
CFI_DEF_CFA rsp,SS+8-ARGOFFSET
|
|
|
|
CFI_REL_OFFSET rax,RAX-ARGOFFSET
|
|
|
|
CFI_REL_OFFSET rcx,RCX-ARGOFFSET
|
|
|
|
CFI_REL_OFFSET rdx,RDX-ARGOFFSET
|
|
|
|
CFI_REL_OFFSET rsi,RSI-ARGOFFSET
|
|
|
|
CFI_REL_OFFSET rdi,RDI-ARGOFFSET
|
|
|
|
CFI_REL_OFFSET rip,RIP-ARGOFFSET
|
|
|
|
/* CFI_REL_OFFSET cs,CS-ARGOFFSET*/
|
|
|
|
/* CFI_REL_OFFSET rflags,EFLAGS-ARGOFFSET*/
|
|
|
|
CFI_REL_OFFSET rsp,RSP-ARGOFFSET
|
|
|
|
/* CFI_REL_OFFSET ss,SS-ARGOFFSET*/
|
2005-04-17 00:20:36 +02:00
|
|
|
SAVE_REST
|
|
|
|
call *%rax
|
|
|
|
RESTORE_REST
|
|
|
|
jmp ia32_sysret /* misbalances the return cache */
|
|
|
|
CFI_ENDPROC
|
2006-06-26 13:56:55 +02:00
|
|
|
END(ia32_ptregs_common)
|