1a338ac32c
Remove the bloat of the C calling convention out of the preempt_enable() sites by creating an ASM wrapper which allows us to do an asm("call ___preempt_schedule") instead. calling.h bits by Andi Kleen Suggested-by: Linus Torvalds <torvalds@linux-foundation.org> Signed-off-by: Peter Zijlstra <peterz@infradead.org> Link: http://lkml.kernel.org/n/tip-tk7xdi1cvvxewixzke8t8le1@git.kernel.org [ Fixed build error. ] Signed-off-by: Ingo Molnar <mingo@kernel.org>
245 lines
5.9 KiB
C
245 lines
5.9 KiB
C
/*

 x86 function call convention, 64-bit:
 -------------------------------------
  arguments           |  callee-saved      | extra caller-saved | return
 [callee-clobbered]   |                    | [callee-clobbered] |
 ---------------------------------------------------------------------------
 rdi rsi rdx rcx r8-9 | rbx rbp [*] r12-15 | r10-11             | rax, rdx [**]

 ( rsp is obviously invariant across normal function calls. (gcc can 'merge'
   functions when it sees tail-call optimization possibilities) rflags is
   clobbered. Leftover arguments are passed over the stack frame.)

 [*]  In the frame-pointers case rbp is fixed to the stack frame.

 [**] for struct return values wider than 64 bits the return convention is a
      bit more complex: up to 128 bits width we return small structures
      straight in rax, rdx. For structures larger than that (3 words or
      larger) the caller puts a pointer to an on-stack return struct
      [allocated in the caller's stack frame] into the first argument - i.e.
      into rdi. All other arguments shift up by one in this case.
      Fortunately this case is rare in the kernel.

For 32-bit we have the following conventions - kernel is built with
-mregparm=3 and -freg-struct-return:

 x86 function calling convention, 32-bit:
 ----------------------------------------
  arguments         | callee-saved        | extra caller-saved | return
 [callee-clobbered] |                     | [callee-clobbered] |
 -------------------------------------------------------------------------
 eax edx ecx        | ebx edi esi ebp [*] | <none>             | eax, edx [**]

 ( here too esp is obviously invariant across normal function calls. eflags
   is clobbered. Leftover arguments are passed over the stack frame. )

 [*]  In the frame-pointers case ebp is fixed to the stack frame.

 [**] We build with -freg-struct-return, which on 32-bit means similar
      semantics as on 64-bit: edx can be used for a second return value
      (i.e. covering integer and structure sizes up to 64 bits) - after that
      it gets more complex and more expensive: 3-word or larger struct returns
      get done in the caller's frame and the pointer to the return struct goes
      into regparm0, i.e. eax - the other arguments shift up and the
      function's register parameters degenerate to regparm=2 in essence.

*/
|
|
|
|
#include <asm/dwarf2.h>
|
|
|
|
#ifdef CONFIG_X86_64
|
|
|
|
/*
 * 64-bit system call stack frame layout defines and helpers,
 * for assembly code.
 *
 * Every value below is a byte offset into the frame.  Consecutive slots
 * are 8 bytes apart, starting with R15 at offset 0 and ending with SS at
 * offset 160.
 */

/* These six slots line up with what SAVE_REST stores (6*8 bytes): */
#define R15		  0
#define R14		  8
#define R13		 16
#define R12		 24
#define RBP		 32
#define RBX		 40

/* arguments: interrupts/non tracing syscalls only save up to here: */
#define R11		 48
#define R10		 56
#define R9		 64
#define R8		 72
#define RAX		 80
#define RCX		 88
#define RDX		 96
#define RSI		104
#define RDI		112
#define ORIG_RAX	120	/* + error_code */
/* end of arguments */

/* cpu exception frame or undefined in case of fast syscall: */
#define RIP		128
#define CS		136
#define EFLAGS		144
#define RSP		152
#define SS		160

/* Offset of the lowest slot of the argument area (the R11 slot). */
#define ARGOFFSET	R11
/* NOTE(review): SWFRAME aliases ORIG_RAX; its users are not visible here. */
#define SWFRAME		ORIG_RAX
|
|
|
|
/*
 * SAVE_ARGS - reserve the nine-slot argument area and fill it.
 *
 * Lowers %rsp by 9*8+addskip bytes, then hands each register to movq_cfi
 * together with its slot offset:
 *
 *	8*8 rdi   7*8 rsi   6*8 rdx   5*8 rcx   4*8 rax
 *	3*8 r8    2*8 r9    1*8 r10   0*8 r11
 *
 * These offsets equal the RDI..R11 frame offsets minus ARGOFFSET.
 * movq_cfi comes from <asm/dwarf2.h>; presumably it stores the register
 * at offset(%rsp) and emits the matching CFI annotation - confirm there.
 *
 * Parameters:
 *   addskip      - extra bytes reserved on top of the nine slots (default 0)
 *   save_rcx     - if 0, the rcx slot is reserved but left unwritten
 *   save_r891011 - if 0, the r8/r9/r10/r11 slots are reserved but left
 *                  unwritten
 *
 * rdi, rsi, rdx and rax are always passed to movq_cfi.  The subq changes
 * the arithmetic flags.
 */
.macro SAVE_ARGS addskip=0, save_rcx=1, save_r891011=1
	subq  $9*8+\addskip, %rsp
	CFI_ADJUST_CFA_OFFSET	9*8+\addskip

	movq_cfi rdi, 8*8
	movq_cfi rsi, 7*8
	movq_cfi rdx, 6*8

	.if \save_rcx
	movq_cfi rcx, 5*8
	.endif

	movq_cfi rax, 4*8

	.if \save_r891011
	movq_cfi r8,  3*8
	movq_cfi r9,  2*8
	movq_cfi r10, 1*8
	movq_cfi r11, 0*8
	.endif
.endm
|
|
|
|
/* Size in bytes of the nine-slot argument area (same 9*8 SAVE_ARGS reserves). */
#define ARG_SKIP	(9*8)

/*
 * RESTORE_ARGS - reload registers from the argument area and release it.
 *
 * Each register is handed to movq_cfi_restore with the slot offset that
 * SAVE_ARGS uses for it (0*8 r11 ... 8*8 rdi).  movq_cfi_restore comes from
 * <asm/dwarf2.h>; presumably it loads the register from offset(%rsp) and
 * emits the matching CFI restore - confirm there.
 *
 * Parameters (each guard skips its registers when 0):
 *   rstor_rax   - reload rax			(default 1)
 *   addskip     - extra bytes to release along with ARG_SKIP (default 0)
 *   rstor_rcx   - reload rcx			(default 1)
 *   rstor_r11   - reload r11			(default 1)
 *   rstor_r8910 - reload r10, r9 and r8	(default 1)
 *   rstor_rdx   - reload rdx			(default 1)
 *
 * rsi and rdi are reloaded unconditionally.  %rsp is raised by
 * ARG_SKIP+addskip only when that sum is positive, so a caller can pass
 * addskip=-ARG_SKIP to keep the area on the stack.  The addq changes the
 * arithmetic flags.
 */
.macro RESTORE_ARGS rstor_rax=1, addskip=0, rstor_rcx=1, rstor_r11=1, \
		    rstor_r8910=1, rstor_rdx=1
	.if \rstor_r11
	movq_cfi_restore 0*8, r11
	.endif

	.if \rstor_r8910
	movq_cfi_restore 1*8, r10
	movq_cfi_restore 2*8, r9
	movq_cfi_restore 3*8, r8
	.endif

	.if \rstor_rax
	movq_cfi_restore 4*8, rax
	.endif

	.if \rstor_rcx
	movq_cfi_restore 5*8, rcx
	.endif

	.if \rstor_rdx
	movq_cfi_restore 6*8, rdx
	.endif

	movq_cfi_restore 7*8, rsi
	movq_cfi_restore 8*8, rdi

	/* Release the area only if there is something to release. */
	.if ARG_SKIP+\addskip > 0
	addq $ARG_SKIP+\addskip, %rsp
	CFI_ADJUST_CFA_OFFSET	-(ARG_SKIP+\addskip)
	.endif
.endm
|
|
|
|
/*
 * LOAD_ARGS - reload registers from a frame that stays on the stack.
 *
 * Reads eight quadwords relative to offset(%rsp):
 *
 *	+0 r11   +8 r10   +16 r9   +24 r8
 *	+40 rcx  +48 rdx  +56 rsi  +64 rdi
 *
 * and, unless skiprax is non-zero, a ninth from +72 into rax.  The slot at
 * +32 is never read.  %rsp is not modified, nothing is stored, and no CFI
 * annotations are emitted.
 *
 * Parameters:
 *   offset  - displacement from %rsp to the first slot read (required)
 *   skiprax - non-zero leaves rax untouched (default 0)
 *
 * NOTE(review): if offset addresses the R11 slot, +72 is the ORIG_RAX slot
 * (120 - ARGOFFSET) and the skipped +32 is the RAX slot - confirm against
 * the callers that this is intended.
 */
.macro LOAD_ARGS offset, skiprax=0
	movq \offset(%rsp),    %r11
	movq \offset+8(%rsp),  %r10
	movq \offset+16(%rsp), %r9
	movq \offset+24(%rsp), %r8
	movq \offset+40(%rsp), %rcx
	movq \offset+48(%rsp), %rdx
	movq \offset+56(%rsp), %rsi
	movq \offset+64(%rsp), %rdi

	/* Only touch rax when the caller did not ask to skip it. */
	.ifeq \skiprax
	movq \offset+72(%rsp), %rax
	.endif
.endm
|
|
|
|
/* Size in bytes of the six-slot area used by SAVE_REST / RESTORE_REST. */
#define REST_SKIP	(6*8)

/*
 * SAVE_REST - reserve REST_SKIP bytes and record the remaining registers.
 *
 * Lowers %rsp by REST_SKIP, then hands rbx, rbp, r12, r13, r14 and r15 to
 * movq_cfi with slot offsets 5*8 down to 0*8.  Those offsets are the
 * RBX..R15 frame offsets.  movq_cfi comes from <asm/dwarf2.h>; presumably
 * it stores the register at offset(%rsp) and emits the matching CFI
 * annotation - confirm there.
 *
 * Takes no parameters.  The subq changes the arithmetic flags.
 */
.macro SAVE_REST
	subq $REST_SKIP, %rsp
	CFI_ADJUST_CFA_OFFSET	REST_SKIP

	movq_cfi rbx, 5*8
	movq_cfi rbp, 4*8
	movq_cfi r12, 3*8
	movq_cfi r13, 2*8
	movq_cfi r14, 1*8
	movq_cfi r15, 0*8
.endm
|
|
|
|
/*
 * RESTORE_REST - counterpart of SAVE_REST.
 *
 * Hands r15, r14, r13, r12, rbp and rbx to movq_cfi_restore with slot
 * offsets 0*8 up to 5*8 (the same slots SAVE_REST uses), then raises %rsp
 * by REST_SKIP and adjusts the CFA offset to match.  movq_cfi_restore comes
 * from <asm/dwarf2.h>; presumably it loads the register from offset(%rsp)
 * and emits the matching CFI restore - confirm there.
 *
 * Takes no parameters.  The addq changes the arithmetic flags.
 */
.macro RESTORE_REST
	movq_cfi_restore 0*8, r15
	movq_cfi_restore 1*8, r14
	movq_cfi_restore 2*8, r13
	movq_cfi_restore 3*8, r12
	movq_cfi_restore 4*8, rbp
	movq_cfi_restore 5*8, rbx

	addq $REST_SKIP, %rsp
	CFI_ADJUST_CFA_OFFSET	-(REST_SKIP)
.endm
|
|
|
|
/*
 * SAVE_ALL (64-bit) - expand SAVE_ARGS and then SAVE_REST.
 *
 * SAVE_ARGS is expanded with all of its defaults (addskip=0, every slot
 * written), so together the two macros lower %rsp by 9*8 + REST_SKIP =
 * 15*8 bytes and cover the R15..RDI frame slots.
 */
.macro SAVE_ALL
	SAVE_ARGS			/* rdi..r11: upper nine slots */
	SAVE_REST			/* rbx..r15: lower six slots  */
.endm
|
|
|
|
/*
 * RESTORE_ALL (64-bit) - expand RESTORE_REST and then RESTORE_ARGS.
 *
 * This is the reverse order of SAVE_ALL.  RESTORE_ARGS is expanded with
 * rstor_rax=1 and the caller's addskip; its remaining parameters keep
 * their defaults, so every argument register is reloaded.
 *
 * Parameters:
 *   addskip - forwarded to RESTORE_ARGS as its addskip argument (default 0)
 */
.macro RESTORE_ALL addskip=0
	RESTORE_REST			/* lower six slots first      */
	RESTORE_ARGS 1, \addskip	/* then the nine argument slots */
.endm
|
|
|
|
/*
 * icebp - emit the single raw opcode byte 0xf1 at the current location.
 *
 * The byte is spelled out with .byte instead of a mnemonic.  0xf1 is the
 * one-byte ICEBP/INT1 encoding, which the macro name refers to.
 */
.macro icebp
	.byte 0xf1
.endm
|
|
|
|
#else /* CONFIG_X86_64 */
|
|
|
|
/*
 * For 32-bit, only simplified versions of SAVE_ALL/RESTORE_ALL are
 * provided. These are different from the entry_32.S versions in not
 * changing the segment registers. So they are only suitable for in-kernel
 * use, not when transitioning from or to user space. The resulting stack
 * frame is not a standard pt_regs frame. The main use case is calling C
 * code from assembler when all the registers need to be preserved.
 */
|
|
|
|
/*
 * SAVE_ALL (32-bit) - push the seven general-purpose registers.
 *
 * Push order: eax, ebp, edi, esi, edx, ecx, ebx, so ebx ends up at the
 * lowest address.  Every push is followed by CFI_REL_OFFSET <reg>, 0 to
 * record that the register now lives at the top of the stack.
 * pushl_cfi and CFI_REL_OFFSET come from <asm/dwarf2.h>.
 *
 * Takes no parameters and does not touch the segment registers.
 */
.macro SAVE_ALL
	pushl_cfi %eax
	CFI_REL_OFFSET eax, 0
	pushl_cfi %ebp
	CFI_REL_OFFSET ebp, 0
	pushl_cfi %edi
	CFI_REL_OFFSET edi, 0
	pushl_cfi %esi
	CFI_REL_OFFSET esi, 0
	pushl_cfi %edx
	CFI_REL_OFFSET edx, 0
	pushl_cfi %ecx
	CFI_REL_OFFSET ecx, 0
	pushl_cfi %ebx
	CFI_REL_OFFSET ebx, 0
.endm
|
|
|
|
/*
 * RESTORE_ALL (32-bit) - pop the seven registers pushed by SAVE_ALL.
 *
 * Pop order: ebx, ecx, edx, esi, edi, ebp, eax - the exact reverse of the
 * SAVE_ALL push order.  Every pop is followed by CFI_RESTORE <reg>.
 * popl_cfi and CFI_RESTORE come from <asm/dwarf2.h>.
 *
 * Takes no parameters and does not touch the segment registers.
 */
.macro RESTORE_ALL
	popl_cfi %ebx
	CFI_RESTORE ebx
	popl_cfi %ecx
	CFI_RESTORE ecx
	popl_cfi %edx
	CFI_RESTORE edx
	popl_cfi %esi
	CFI_RESTORE esi
	popl_cfi %edi
	CFI_RESTORE edi
	popl_cfi %ebp
	CFI_RESTORE ebp
	popl_cfi %eax
	CFI_RESTORE eax
.endm
|
|
|
|
#endif /* CONFIG_X86_64 */
|
|
|