Commit 2507bc13 authored by Haavard Skinnemoen's avatar Haavard Skinnemoen

[AVR32] Follow the rules when dealing with the OCD system

The current debug trap handling code does a number of things that are
illegal according to the AVR32 Architecture manual. Most importantly,
it may try to schedule from Debug Mode, thus clearing the D bit, which
can lead to "undefined behaviour".

It seems like this works in most cases, but several people have
observed somewhat unstable behaviour when debugging programs,
including soft lockups. So there's definitely something which is not
right with the existing code.

The new code will never schedule from Debug mode, it will always exit
Debug mode with a "retd" instruction, and if something not running in
Debug mode needs to do something debug-related (like doing a single
step), it will enter debug mode through a "breakpoint" instruction.
The monitor code will then return directly to user space, bypassing
its own saved registers if necessary (since we don't actually care
about the trapped context, only the one that came before.)

This adds three instructions to the common exception handling code,
including one branch. It does not touch super-hot paths like the TLB
miss handler.
Signed-off-by: default avatarHaavard Skinnemoen <hskinnemoen@atmel.com>
parent 8dfe8f29
...@@ -21,5 +21,7 @@ void foo(void) ...@@ -21,5 +21,7 @@ void foo(void)
OFFSET(TI_flags, thread_info, flags); OFFSET(TI_flags, thread_info, flags);
OFFSET(TI_cpu, thread_info, cpu); OFFSET(TI_cpu, thread_info, cpu);
OFFSET(TI_preempt_count, thread_info, preempt_count); OFFSET(TI_preempt_count, thread_info, preempt_count);
OFFSET(TI_rar_saved, thread_info, rar_saved);
OFFSET(TI_rsr_saved, thread_info, rsr_saved);
OFFSET(TI_restart_block, thread_info, restart_block); OFFSET(TI_restart_block, thread_info, restart_block);
} }
...@@ -264,16 +264,7 @@ syscall_exit_work: ...@@ -264,16 +264,7 @@ syscall_exit_work:
3: bld r1, TIF_BREAKPOINT 3: bld r1, TIF_BREAKPOINT
brcc syscall_exit_cont brcc syscall_exit_cont
mfsr r3, SYSREG_TLBEHI rjmp enter_monitor_mode
lddsp r2, sp[REG_PC]
andl r3, 0xff, COH
lsl r3, 1
sbr r3, 30
sbr r3, 0
mtdr OCD_BWA2A, r2
mtdr OCD_BWC2A, r3
rjmp syscall_exit_cont
/* The slow path of the TLB miss handler */ /* The slow path of the TLB miss handler */
page_table_not_present: page_table_not_present:
...@@ -288,11 +279,16 @@ page_not_present: ...@@ -288,11 +279,16 @@ page_not_present:
rjmp ret_from_exception rjmp ret_from_exception
/* This function expects to find offending PC in SYSREG_RAR_EX */ /* This function expects to find offending PC in SYSREG_RAR_EX */
.type save_full_context_ex, @function
.align 2
save_full_context_ex: save_full_context_ex:
mfsr r11, SYSREG_RAR_EX
sub r9, pc, . - debug_trampoline
mfsr r8, SYSREG_RSR_EX mfsr r8, SYSREG_RSR_EX
cp.w r9, r11
breq 3f
mov r12, r8 mov r12, r8
andh r8, (MODE_MASK >> 16), COH andh r8, (MODE_MASK >> 16), COH
mfsr r11, SYSREG_RAR_EX
brne 2f brne 2f
1: pushm r11, r12 /* PC and SR */ 1: pushm r11, r12 /* PC and SR */
...@@ -303,6 +299,21 @@ save_full_context_ex: ...@@ -303,6 +299,21 @@ save_full_context_ex:
stdsp sp[4], r10 /* replace saved SP */ stdsp sp[4], r10 /* replace saved SP */
rjmp 1b rjmp 1b
/*
* The debug handler set up a trampoline to make us
* automatically enter monitor mode upon return, but since
* we're saving the full context, we must assume that the
* exception handler might want to alter the return address
* and/or status register. So we need to restore the original
* context and enter monitor mode manually after the exception
* has been handled.
*/
3: get_thread_info r8
ld.w r11, r8[TI_rar_saved]
ld.w r12, r8[TI_rsr_saved]
rjmp 1b
.size save_full_context_ex, . - save_full_context_ex
/* Low-level exception handlers */ /* Low-level exception handlers */
handle_critical: handle_critical:
pushm r12 pushm r12
...@@ -439,6 +450,7 @@ do_fpe_ll: ...@@ -439,6 +450,7 @@ do_fpe_ll:
ret_from_exception: ret_from_exception:
mask_interrupts mask_interrupts
lddsp r4, sp[REG_SR] lddsp r4, sp[REG_SR]
andh r4, (MODE_MASK >> 16), COH andh r4, (MODE_MASK >> 16), COH
brne fault_resume_kernel brne fault_resume_kernel
...@@ -515,34 +527,76 @@ fault_exit_work: ...@@ -515,34 +527,76 @@ fault_exit_work:
2: bld r1, TIF_BREAKPOINT 2: bld r1, TIF_BREAKPOINT
brcc fault_resume_user brcc fault_resume_user
mfsr r3, SYSREG_TLBEHI rjmp enter_monitor_mode
lddsp r2, sp[REG_PC]
andl r3, 0xff, COH .section .kprobes.text, "ax", @progbits
lsl r3, 1 .type handle_debug, @function
sbr r3, 30 handle_debug:
sbr r3, 0 sub sp, 4 /* r12_orig */
mtdr OCD_BWA2A, r2 stmts --sp, r0-lr
mtdr OCD_BWC2A, r3 mfsr r8, SYSREG_RAR_DBG
rjmp fault_resume_user mfsr r9, SYSREG_RSR_DBG
unmask_exceptions
/* If we get a debug trap from privileged context we end up here */ pushm r8-r9
handle_debug_priv: bfextu r9, r9, SYSREG_MODE_OFFSET, SYSREG_MODE_SIZE
/* Fix up LR and SP in regs. r1 contains the mode we came from */ brne debug_fixup_regs
mfsr r2, SYSREG_SR
mov r3, r2 .Ldebug_fixup_cont:
bfins r2, r1, SYSREG_MODE_OFFSET, SYSREG_MODE_SIZE #ifdef CONFIG_TRACE_IRQFLAGS
mtsr SYSREG_SR, r2 rcall trace_hardirqs_off
#endif
mov r12, sp
rcall do_debug
mov sp, r12
lddsp r2, sp[REG_SR]
bfextu r3, r2, SYSREG_MODE_OFFSET, SYSREG_MODE_SIZE
brne debug_resume_kernel
get_thread_info r0
ld.w r1, r0[TI_flags]
mov r2, _TIF_DBGWORK_MASK
tst r1, r2
brne debug_exit_work
bld r1, TIF_SINGLE_STEP
brcc 1f
mfdr r4, OCD_DC
sbr r4, OCD_DC_SS_BIT
mtdr OCD_DC, r4
1: popm r10,r11
mask_exceptions
mtsr SYSREG_RSR_DBG, r11
mtsr SYSREG_RAR_DBG, r10
#ifdef CONFIG_TRACE_IRQFLAGS
rcall trace_hardirqs_on
1:
#endif
ldmts sp++, r0-lr
sub sp, -4
retd
.size handle_debug, . - handle_debug
/* Mode of the trapped context is in r9 */
.type debug_fixup_regs, @function
debug_fixup_regs:
mfsr r8, SYSREG_SR
mov r10, r8
bfins r8, r9, SYSREG_MODE_OFFSET, SYSREG_MODE_SIZE
mtsr SYSREG_SR, r8
sub pc, -2 sub pc, -2
stdsp sp[REG_LR], lr stdsp sp[REG_LR], lr
mtsr SYSREG_SR, r3 mtsr SYSREG_SR, r10
sub pc, -2 sub pc, -2
sub r10, sp, -FRAME_SIZE_FULL sub r8, sp, -FRAME_SIZE_FULL
stdsp sp[REG_SP], r10 stdsp sp[REG_SP], r8
mov r12, sp rjmp .Ldebug_fixup_cont
rcall do_debug_priv .size debug_fixup_regs, . - debug_fixup_regs
/* Now, put everything back */ .type debug_resume_kernel, @function
ssrf SR_EM_BIT debug_resume_kernel:
mask_exceptions
popm r10, r11 popm r10, r11
mtsr SYSREG_RAR_DBG, r10 mtsr SYSREG_RAR_DBG, r10
mtsr SYSREG_RSR_DBG, r11 mtsr SYSREG_RSR_DBG, r11
...@@ -553,93 +607,44 @@ handle_debug_priv: ...@@ -553,93 +607,44 @@ handle_debug_priv:
1: 1:
#endif #endif
mfsr r2, SYSREG_SR mfsr r2, SYSREG_SR
mov r3, r2 mov r1, r2
bfins r2, r1, SYSREG_MODE_OFFSET, SYSREG_MODE_SIZE bfins r2, r3, SYSREG_MODE_OFFSET, SYSREG_MODE_SIZE
mtsr SYSREG_SR, r2 mtsr SYSREG_SR, r2
sub pc, -2 sub pc, -2
popm lr popm lr
mtsr SYSREG_SR, r3 mtsr SYSREG_SR, r1
sub pc, -2 sub pc, -2
sub sp, -4 /* skip SP */ sub sp, -4 /* skip SP */
popm r0-r12 popm r0-r12
sub sp, -4 sub sp, -4
retd retd
.size debug_resume_kernel, . - debug_resume_kernel
.type debug_exit_work, @function
debug_exit_work:
/* /*
* At this point, everything is masked, that is, interrupts, * We must return from Monitor Mode using a retd, and we must
* exceptions and debugging traps. We might get called from * not schedule since that involves the D bit in SR getting
* interrupt or exception context in some rare cases, but this * cleared by something other than the debug hardware. This
* will be taken care of by do_debug(), so we're not going to * may cause undefined behaviour according to the Architecture
* do a 100% correct context save here. * manual.
*
* So we fix up the return address and status and return to a
* stub below in Exception mode. From there, we can follow the
* normal exception return path.
*
* The real return address and status registers are stored on
* the stack in the way the exception return path understands,
* so no need to fix anything up there.
*/ */
handle_debug: sub r8, pc, . - fault_exit_work
sub sp, 4 /* r12_orig */ mtsr SYSREG_RAR_DBG, r8
stmts --sp, r0-lr mov r9, 0
mfsr r0, SYSREG_RAR_DBG orh r9, hi(SR_EM | SR_GM | MODE_EXCEPTION)
mfsr r1, SYSREG_RSR_DBG mtsr SYSREG_RSR_DBG, r9
#ifdef CONFIG_TRACE_IRQFLAGS sub pc, -2
rcall trace_hardirqs_off
#endif
unmask_exceptions
stm --sp, r0, r1
bfextu r1, r1, SYSREG_MODE_OFFSET, SYSREG_MODE_SIZE
brne handle_debug_priv
mov r12, sp
rcall do_debug
lddsp r10, sp[REG_SR]
andh r10, (MODE_MASK >> 16), COH
breq debug_resume_user
debug_restore_all:
popm r10,r11
mask_exceptions
mtsr SYSREG_RSR_DBG, r11
mtsr SYSREG_RAR_DBG, r10
#ifdef CONFIG_TRACE_IRQFLAGS
bld r11, SYSREG_GM_OFFSET
brcc 1f
rcall trace_hardirqs_on
1:
#endif
ldmts sp++, r0-lr
sub sp, -4
retd retd
.size debug_exit_work, . - debug_exit_work
debug_resume_user:
get_thread_info r0
mask_interrupts
ld.w r1, r0[TI_flags]
andl r1, _TIF_DBGWORK_MASK, COH
breq debug_restore_all
1: bld r1, TIF_NEED_RESCHED
brcc 2f
unmask_interrupts
rcall schedule
mask_interrupts
ld.w r1, r0[TI_flags]
rjmp 1b
2: mov r2, _TIF_SIGPENDING | _TIF_RESTORE_SIGMASK
tst r1, r2
breq 3f
unmask_interrupts
mov r12, sp
mov r11, r0
rcall do_notify_resume
mask_interrupts
ld.w r1, r0[TI_flags]
rjmp 1b
3: bld r1, TIF_SINGLE_STEP
brcc debug_restore_all
mfdr r2, OCD_DC
sbr r2, OCD_DC_SS_BIT
mtdr OCD_DC, r2
rjmp debug_restore_all
.set rsr_int0, SYSREG_RSR_INT0 .set rsr_int0, SYSREG_RSR_INT0
.set rsr_int1, SYSREG_RSR_INT1 .set rsr_int1, SYSREG_RSR_INT1
...@@ -764,3 +769,53 @@ cpu_idle_enable_int_and_exit: ...@@ -764,3 +769,53 @@ cpu_idle_enable_int_and_exit:
IRQ_LEVEL 1 IRQ_LEVEL 1
IRQ_LEVEL 2 IRQ_LEVEL 2
IRQ_LEVEL 3 IRQ_LEVEL 3
.section .kprobes.text, "ax", @progbits
.type enter_monitor_mode, @function
enter_monitor_mode:
/*
* We need to enter monitor mode to do a single step. The
* monitor code will alter the return address so that we
* return directly to the user instead of returning here.
*/
breakpoint
rjmp breakpoint_failed
.size enter_monitor_mode, . - enter_monitor_mode
.type debug_trampoline, @function
.global debug_trampoline
debug_trampoline:
/*
* Save the registers on the stack so that the monitor code
* can find them easily.
*/
sub sp, 4 /* r12_orig */
stmts --sp, r0-lr
get_thread_info r0
ld.w r8, r0[TI_rar_saved]
ld.w r9, r0[TI_rsr_saved]
pushm r8-r9
/*
* The monitor code will alter the return address so we don't
* return here.
*/
breakpoint
rjmp breakpoint_failed
.size debug_trampoline, . - debug_trampoline
.type breakpoint_failed, @function
breakpoint_failed:
/*
* Something went wrong. Perhaps the debug hardware isn't
* enabled?
*/
lda.w r12, msg_breakpoint_failed
mov r11, sp
mov r10, 9 /* SIGKILL */
call die
1: rjmp 1b
msg_breakpoint_failed:
.asciz "Failed to enter Debug Mode"
This diff is collapsed.
...@@ -77,10 +77,10 @@ SECTIONS ...@@ -77,10 +77,10 @@ SECTIONS
. = 0x100; . = 0x100;
*(.scall.text) *(.scall.text)
*(.irq.text) *(.irq.text)
KPROBES_TEXT
TEXT_TEXT TEXT_TEXT
SCHED_TEXT SCHED_TEXT
LOCK_TEXT LOCK_TEXT
KPROBES_TEXT
*(.fixup) *(.fixup)
*(.gnu.warning) *(.gnu.warning)
_etext = .; _etext = .;
......
...@@ -139,6 +139,9 @@ extern void show_regs_log_lvl(struct pt_regs *regs, const char *log_lvl); ...@@ -139,6 +139,9 @@ extern void show_regs_log_lvl(struct pt_regs *regs, const char *log_lvl);
extern void show_stack_log_lvl(struct task_struct *tsk, unsigned long sp, extern void show_stack_log_lvl(struct task_struct *tsk, unsigned long sp,
struct pt_regs *regs, const char *log_lvl); struct pt_regs *regs, const char *log_lvl);
#define task_pt_regs(p) \
((struct pt_regs *)(THREAD_SIZE + task_stack_page(p)) - 1)
#define KSTK_EIP(tsk) ((tsk)->thread.cpu_context.pc) #define KSTK_EIP(tsk) ((tsk)->thread.cpu_context.pc)
#define KSTK_ESP(tsk) ((tsk)->thread.cpu_context.ksp) #define KSTK_ESP(tsk) ((tsk)->thread.cpu_context.ksp)
......
...@@ -25,6 +25,11 @@ struct thread_info { ...@@ -25,6 +25,11 @@ struct thread_info {
unsigned long flags; /* low level flags */ unsigned long flags; /* low level flags */
__u32 cpu; __u32 cpu;
__s32 preempt_count; /* 0 => preemptable, <0 => BUG */ __s32 preempt_count; /* 0 => preemptable, <0 => BUG */
__u32 rar_saved; /* return address... */
__u32 rsr_saved; /* ...and status register
saved by debug handler
when setting up
trampoline */
struct restart_block restart_block; struct restart_block restart_block;
__u8 supervisor_stack[0]; __u8 supervisor_stack[0];
}; };
...@@ -78,8 +83,8 @@ static inline struct thread_info *current_thread_info(void) ...@@ -78,8 +83,8 @@ static inline struct thread_info *current_thread_info(void)
#define TIF_NEED_RESCHED 2 /* rescheduling necessary */ #define TIF_NEED_RESCHED 2 /* rescheduling necessary */
#define TIF_POLLING_NRFLAG 3 /* true if poll_idle() is polling #define TIF_POLLING_NRFLAG 3 /* true if poll_idle() is polling
TIF_NEED_RESCHED */ TIF_NEED_RESCHED */
#define TIF_BREAKPOINT 4 /* true if we should break after return */ #define TIF_BREAKPOINT 4 /* enter monitor mode on return */
#define TIF_SINGLE_STEP 5 /* single step after next break */ #define TIF_SINGLE_STEP 5 /* single step in progress */
#define TIF_MEMDIE 6 #define TIF_MEMDIE 6
#define TIF_RESTORE_SIGMASK 7 /* restore signal mask in do_signal */ #define TIF_RESTORE_SIGMASK 7 /* restore signal mask in do_signal */
#define TIF_CPU_GOING_TO_SLEEP 8 /* CPU is entering sleep 0 mode */ #define TIF_CPU_GOING_TO_SLEEP 8 /* CPU is entering sleep 0 mode */
...@@ -89,7 +94,6 @@ static inline struct thread_info *current_thread_info(void) ...@@ -89,7 +94,6 @@ static inline struct thread_info *current_thread_info(void)
#define _TIF_SIGPENDING (1 << TIF_SIGPENDING) #define _TIF_SIGPENDING (1 << TIF_SIGPENDING)
#define _TIF_NEED_RESCHED (1 << TIF_NEED_RESCHED) #define _TIF_NEED_RESCHED (1 << TIF_NEED_RESCHED)
#define _TIF_POLLING_NRFLAG (1 << TIF_POLLING_NRFLAG) #define _TIF_POLLING_NRFLAG (1 << TIF_POLLING_NRFLAG)
#define _TIF_BREAKPOINT (1 << TIF_BREAKPOINT)
#define _TIF_SINGLE_STEP (1 << TIF_SINGLE_STEP) #define _TIF_SINGLE_STEP (1 << TIF_SINGLE_STEP)
#define _TIF_MEMDIE (1 << TIF_MEMDIE) #define _TIF_MEMDIE (1 << TIF_MEMDIE)
#define _TIF_RESTORE_SIGMASK (1 << TIF_RESTORE_SIGMASK) #define _TIF_RESTORE_SIGMASK (1 << TIF_RESTORE_SIGMASK)
...@@ -108,6 +112,6 @@ static inline struct thread_info *current_thread_info(void) ...@@ -108,6 +112,6 @@ static inline struct thread_info *current_thread_info(void)
/* work to do on any return to userspace */ /* work to do on any return to userspace */
#define _TIF_ALLWORK_MASK (_TIF_WORK_MASK | (1 << TIF_SYSCALL_TRACE)) #define _TIF_ALLWORK_MASK (_TIF_WORK_MASK | (1 << TIF_SYSCALL_TRACE))
/* work to do on return from debug mode */ /* work to do on return from debug mode */
#define _TIF_DBGWORK_MASK (_TIF_WORK_MASK | (1 << TIF_SINGLE_STEP)) #define _TIF_DBGWORK_MASK (_TIF_WORK_MASK & ~(1 << TIF_BREAKPOINT))
#endif /* __ASM_AVR32_THREAD_INFO_H */ #endif /* __ASM_AVR32_THREAD_INFO_H */
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment