arm64: Implement stack trace termination record

Reliable stacktracing requires that we identify when a stacktrace is
terminated early. We can do this by ensuring all tasks have a final
frame record at a known location on their task stack, and checking
that this is the final frame record in the chain.

We'd like to use task_pt_regs(task)->stackframe as the final frame
record, as this is already set up upon exception entry from EL0. For
kernel tasks we need to consistently reserve the pt_regs and point x29
at this, which we can do with small changes to __primary_switched,
__secondary_switched, and copy_thread().

Since the final frame record must be at a specific location, we must
create the final frame record in __primary_switched and
__secondary_switched rather than leaving this to start_kernel and
secondary_start_kernel. Thus, __primary_switched and
__secondary_switched will now show up in stacktraces for the idle tasks.

Since the final frame record is now identified by its location rather
than by its contents, we identify it at the start of unwind_frame(),
before we read any values from it.

External debuggers may terminate the stack trace when FP == 0. In the
pt_regs->stackframe, the PC is 0 as well. So, stack traces taken in the
debugger may print an extra record 0x0 at the end. While this is not
pretty, this does not do any harm. This is a small price to pay for
having reliable stack trace termination in the kernel. That said, gdb
does not show the extra record, probably because it uses DWARF rather
than frame pointers for stack traces.

Signed-off-by: Madhavan T. Venkataraman <madvenka@linux.microsoft.com>
Reviewed-by: Mark Brown <broonie@kernel.org>
[Mark: rebase, use ASM_BUG(), update comments, update commit message]
Signed-off-by: Mark Rutland <mark.rutland@arm.com>
Link: https://lore.kernel.org/r/20210510110026.18061-1-mark.rutland@arm.com
Signed-off-by: Will Deacon <will@kernel.org>
This commit is contained in:
Madhavan T. Venkataraman 2021-05-10 12:00:26 +01:00 committed by Will Deacon
parent c4681547bc
commit 7d7b720a4b
4 changed files with 32 additions and 16 deletions

View File

@ -285,7 +285,7 @@ alternative_else_nop_endif
stp lr, x21, [sp, #S_LR] stp lr, x21, [sp, #S_LR]
/* /*
* For exceptions from EL0, create a terminal frame record. * For exceptions from EL0, create a final frame record.
* For exceptions from EL1, create a synthetic frame record so the * For exceptions from EL1, create a synthetic frame record so the
* interrupted code shows up in the backtrace. * interrupted code shows up in the backtrace.
*/ */

View File

@ -16,6 +16,7 @@
#include <asm/asm_pointer_auth.h> #include <asm/asm_pointer_auth.h>
#include <asm/assembler.h> #include <asm/assembler.h>
#include <asm/boot.h> #include <asm/boot.h>
#include <asm/bug.h>
#include <asm/ptrace.h> #include <asm/ptrace.h>
#include <asm/asm-offsets.h> #include <asm/asm-offsets.h>
#include <asm/cache.h> #include <asm/cache.h>
@ -393,6 +394,18 @@ SYM_FUNC_START_LOCAL(__create_page_tables)
ret x28 ret x28
SYM_FUNC_END(__create_page_tables) SYM_FUNC_END(__create_page_tables)
/*
* Create a final frame record at task_pt_regs(current)->stackframe, so
* that the unwinder can identify the final frame record of any task by
* its location in the task stack. We reserve the entire pt_regs space
* for consistency with user tasks and kthreads.
*
* Takes no arguments. Modifies sp (lowered by PT_REGS_SIZE) and x29
* (left pointing at the new record); both slots of the record are zero.
*/
.macro setup_final_frame
sub sp, sp, #PT_REGS_SIZE		// reserve PT_REGS_SIZE bytes below the current sp
stp xzr, xzr, [sp, #S_STACKFRAME]	// write a pair of zeros at offset S_STACKFRAME
add x29, sp, #S_STACKFRAME		// x29 = address of the record just written
.endm
/* /*
* The following fragment of code is executed with the MMU enabled. * The following fragment of code is executed with the MMU enabled.
* *
@ -447,9 +460,9 @@ SYM_FUNC_START_LOCAL(__primary_switched)
#endif #endif
bl switch_to_vhe // Prefer VHE if possible bl switch_to_vhe // Prefer VHE if possible
add sp, sp, #16 add sp, sp, #16
mov x29, #0 setup_final_frame
mov x30, #0 bl start_kernel
b start_kernel ASM_BUG()
SYM_FUNC_END(__primary_switched) SYM_FUNC_END(__primary_switched)
.pushsection ".rodata", "a" .pushsection ".rodata", "a"
@ -639,14 +652,14 @@ SYM_FUNC_START_LOCAL(__secondary_switched)
cbz x2, __secondary_too_slow cbz x2, __secondary_too_slow
msr sp_el0, x2 msr sp_el0, x2
scs_load x2, x3 scs_load x2, x3
mov x29, #0 setup_final_frame
mov x30, #0
#ifdef CONFIG_ARM64_PTR_AUTH #ifdef CONFIG_ARM64_PTR_AUTH
ptrauth_keys_init_cpu x2, x3, x4, x5 ptrauth_keys_init_cpu x2, x3, x4, x5
#endif #endif
b secondary_start_kernel bl secondary_start_kernel
ASM_BUG()
SYM_FUNC_END(__secondary_switched) SYM_FUNC_END(__secondary_switched)
SYM_FUNC_START_LOCAL(__secondary_too_slow) SYM_FUNC_START_LOCAL(__secondary_too_slow)

View File

@ -435,6 +435,11 @@ int copy_thread(unsigned long clone_flags, unsigned long stack_start,
} }
p->thread.cpu_context.pc = (unsigned long)ret_from_fork; p->thread.cpu_context.pc = (unsigned long)ret_from_fork;
p->thread.cpu_context.sp = (unsigned long)childregs; p->thread.cpu_context.sp = (unsigned long)childregs;
/*
* For the benefit of the unwinder, set up childregs->stackframe
* as the final frame for the new task.
*/
p->thread.cpu_context.fp = (unsigned long)childregs->stackframe;
ptrace_hw_copy_thread(p); ptrace_hw_copy_thread(p);

View File

@ -68,12 +68,16 @@ int notrace unwind_frame(struct task_struct *tsk, struct stackframe *frame)
unsigned long fp = frame->fp; unsigned long fp = frame->fp;
struct stack_info info; struct stack_info info;
if (fp & 0xf)
return -EINVAL;
if (!tsk) if (!tsk)
tsk = current; tsk = current;
/* Final frame; nothing to unwind */
if (fp == (unsigned long)task_pt_regs(tsk)->stackframe)
return -ENOENT;
if (fp & 0xf)
return -EINVAL;
if (!on_accessible_stack(tsk, fp, &info)) if (!on_accessible_stack(tsk, fp, &info))
return -EINVAL; return -EINVAL;
@ -128,12 +132,6 @@ int notrace unwind_frame(struct task_struct *tsk, struct stackframe *frame)
frame->pc = ptrauth_strip_insn_pac(frame->pc); frame->pc = ptrauth_strip_insn_pac(frame->pc);
/*
* This is a terminal record, so we have finished unwinding.
*/
if (!frame->fp && !frame->pc)
return -ENOENT;
return 0; return 0;
} }
NOKPROBE_SYMBOL(unwind_frame); NOKPROBE_SYMBOL(unwind_frame);