15aae8a53SK.Prasad /* 25aae8a53SK.Prasad * HW_breakpoint: a unified kernel/user-space hardware breakpoint facility, 35aae8a53SK.Prasad * using the CPU's debug registers. Derived from 45aae8a53SK.Prasad * "arch/x86/kernel/hw_breakpoint.c" 55aae8a53SK.Prasad * 65aae8a53SK.Prasad * This program is free software; you can redistribute it and/or modify 75aae8a53SK.Prasad * it under the terms of the GNU General Public License as published by 85aae8a53SK.Prasad * the Free Software Foundation; either version 2 of the License, or 95aae8a53SK.Prasad * (at your option) any later version. 105aae8a53SK.Prasad * 115aae8a53SK.Prasad * This program is distributed in the hope that it will be useful, 125aae8a53SK.Prasad * but WITHOUT ANY WARRANTY; without even the implied warranty of 135aae8a53SK.Prasad * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 145aae8a53SK.Prasad * GNU General Public License for more details. 155aae8a53SK.Prasad * 165aae8a53SK.Prasad * You should have received a copy of the GNU General Public License 175aae8a53SK.Prasad * along with this program; if not, write to the Free Software 185aae8a53SK.Prasad * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 195aae8a53SK.Prasad * 205aae8a53SK.Prasad * Copyright 2010 IBM Corporation 215aae8a53SK.Prasad * Author: K.Prasad <prasad@linux.vnet.ibm.com> 225aae8a53SK.Prasad * 235aae8a53SK.Prasad */ 245aae8a53SK.Prasad 255aae8a53SK.Prasad #include <linux/hw_breakpoint.h> 265aae8a53SK.Prasad #include <linux/notifier.h> 275aae8a53SK.Prasad #include <linux/kprobes.h> 285aae8a53SK.Prasad #include <linux/percpu.h> 295aae8a53SK.Prasad #include <linux/kernel.h> 305aae8a53SK.Prasad #include <linux/sched.h> 315aae8a53SK.Prasad #include <linux/smp.h> 325aae8a53SK.Prasad 335aae8a53SK.Prasad #include <asm/hw_breakpoint.h> 345aae8a53SK.Prasad #include <asm/processor.h> 355aae8a53SK.Prasad #include <asm/sstep.h> 36*7c0f6ba6SLinus Torvalds #include <linux/uaccess.h> 375aae8a53SK.Prasad 385aae8a53SK.Prasad /* 395aae8a53SK.Prasad * Stores the breakpoints currently in use on each breakpoint address 405aae8a53SK.Prasad * register for every cpu 415aae8a53SK.Prasad */ 425aae8a53SK.Prasad static DEFINE_PER_CPU(struct perf_event *, bp_per_reg); 435aae8a53SK.Prasad 445aae8a53SK.Prasad /* 45d09ec738SPaul Mackerras * Returns total number of data or instruction breakpoints available. 46d09ec738SPaul Mackerras */ 47d09ec738SPaul Mackerras int hw_breakpoint_slots(int type) 48d09ec738SPaul Mackerras { 49d09ec738SPaul Mackerras if (type == TYPE_DATA) 50d09ec738SPaul Mackerras return HBP_NUM; 51d09ec738SPaul Mackerras return 0; /* no instruction breakpoints available */ 52d09ec738SPaul Mackerras } 53d09ec738SPaul Mackerras 54d09ec738SPaul Mackerras /* 555aae8a53SK.Prasad * Install a perf counter breakpoint. 565aae8a53SK.Prasad * 575aae8a53SK.Prasad * We seek a free debug address register and use it for this 585aae8a53SK.Prasad * breakpoint. 595aae8a53SK.Prasad * 605aae8a53SK.Prasad * Atomic: we hold the counter->ctx->lock and we only handle variables 615aae8a53SK.Prasad * and registers local to this cpu. 625aae8a53SK.Prasad */ 635aae8a53SK.Prasad int arch_install_hw_breakpoint(struct perf_event *bp) 645aae8a53SK.Prasad { 655aae8a53SK.Prasad struct arch_hw_breakpoint *info = counter_arch_bp(bp); 6669111bacSChristoph Lameter struct perf_event **slot = this_cpu_ptr(&bp_per_reg); 675aae8a53SK.Prasad 685aae8a53SK.Prasad *slot = bp; 695aae8a53SK.Prasad 705aae8a53SK.Prasad /* 715aae8a53SK.Prasad * Do not install DABR values if the instruction must be single-stepped. 725aae8a53SK.Prasad * If so, DABR will be populated in single_step_dabr_instruction(). 735aae8a53SK.Prasad */ 745aae8a53SK.Prasad if (current->thread.last_hit_ubp != bp) 7521f58507SPaul Gortmaker __set_breakpoint(info); 765aae8a53SK.Prasad 775aae8a53SK.Prasad return 0; 785aae8a53SK.Prasad } 795aae8a53SK.Prasad 805aae8a53SK.Prasad /* 815aae8a53SK.Prasad * Uninstall the breakpoint contained in the given counter. 825aae8a53SK.Prasad * 835aae8a53SK.Prasad * First we search the debug address register it uses and then we disable 845aae8a53SK.Prasad * it. 855aae8a53SK.Prasad * 865aae8a53SK.Prasad * Atomic: we hold the counter->ctx->lock and we only handle variables 875aae8a53SK.Prasad * and registers local to this cpu. 885aae8a53SK.Prasad */ 895aae8a53SK.Prasad void arch_uninstall_hw_breakpoint(struct perf_event *bp) 905aae8a53SK.Prasad { 9169111bacSChristoph Lameter struct perf_event **slot = this_cpu_ptr(&bp_per_reg); 925aae8a53SK.Prasad 935aae8a53SK.Prasad if (*slot != bp) { 945aae8a53SK.Prasad WARN_ONCE(1, "Can't find the breakpoint"); 955aae8a53SK.Prasad return; 965aae8a53SK.Prasad } 975aae8a53SK.Prasad 985aae8a53SK.Prasad *slot = NULL; 999422de3eSMichael Neuling hw_breakpoint_disable(); 1005aae8a53SK.Prasad } 1015aae8a53SK.Prasad 1025aae8a53SK.Prasad /* 1035aae8a53SK.Prasad * Perform cleanup of arch-specific counters during unregistration 1045aae8a53SK.Prasad * of the perf-event 1055aae8a53SK.Prasad */ 1065aae8a53SK.Prasad void arch_unregister_hw_breakpoint(struct perf_event *bp) 1075aae8a53SK.Prasad { 1085aae8a53SK.Prasad /* 1095aae8a53SK.Prasad * If the breakpoint is unregistered between a hw_breakpoint_handler() 1105aae8a53SK.Prasad * and the single_step_dabr_instruction(), then cleanup the breakpoint 1115aae8a53SK.Prasad * restoration variables to prevent dangling pointers. 112fb822e60SRavi Bangoria * FIXME, this should not be using bp->ctx at all! Sayeth peterz. 1135aae8a53SK.Prasad */ 114fb822e60SRavi Bangoria if (bp->ctx && bp->ctx->task && bp->ctx->task != ((void *)-1L)) 1155aae8a53SK.Prasad bp->ctx->task->thread.last_hit_ubp = NULL; 1165aae8a53SK.Prasad } 1175aae8a53SK.Prasad 1185aae8a53SK.Prasad /* 1195aae8a53SK.Prasad * Check for virtual address in kernel space. 1205aae8a53SK.Prasad */ 1215aae8a53SK.Prasad int arch_check_bp_in_kernelspace(struct perf_event *bp) 1225aae8a53SK.Prasad { 1235aae8a53SK.Prasad struct arch_hw_breakpoint *info = counter_arch_bp(bp); 1245aae8a53SK.Prasad 1255aae8a53SK.Prasad return is_kernel_addr(info->address); 1265aae8a53SK.Prasad } 1275aae8a53SK.Prasad 1285aae8a53SK.Prasad int arch_bp_generic_fields(int type, int *gen_bp_type) 1295aae8a53SK.Prasad { 1309422de3eSMichael Neuling *gen_bp_type = 0; 1319422de3eSMichael Neuling if (type & HW_BRK_TYPE_READ) 1329422de3eSMichael Neuling *gen_bp_type |= HW_BREAKPOINT_R; 1339422de3eSMichael Neuling if (type & HW_BRK_TYPE_WRITE) 1349422de3eSMichael Neuling *gen_bp_type |= HW_BREAKPOINT_W; 1359422de3eSMichael Neuling if (*gen_bp_type == 0) 1365aae8a53SK.Prasad return -EINVAL; 1375aae8a53SK.Prasad return 0; 1385aae8a53SK.Prasad } 1395aae8a53SK.Prasad 1405aae8a53SK.Prasad /* 1415aae8a53SK.Prasad * Validate the arch-specific HW Breakpoint register settings 1425aae8a53SK.Prasad */ 1435aae8a53SK.Prasad int arch_validate_hwbkpt_settings(struct perf_event *bp) 1445aae8a53SK.Prasad { 1454ae7ebe9SMichael Neuling int ret = -EINVAL, length_max; 1465aae8a53SK.Prasad struct arch_hw_breakpoint *info = counter_arch_bp(bp); 1475aae8a53SK.Prasad 1485aae8a53SK.Prasad if (!bp) 1495aae8a53SK.Prasad return ret; 1505aae8a53SK.Prasad 1519422de3eSMichael Neuling info->type = HW_BRK_TYPE_TRANSLATE; 1529422de3eSMichael Neuling if (bp->attr.bp_type & HW_BREAKPOINT_R) 1539422de3eSMichael Neuling info->type |= HW_BRK_TYPE_READ; 1549422de3eSMichael Neuling if (bp->attr.bp_type & HW_BREAKPOINT_W) 1559422de3eSMichael Neuling info->type |= HW_BRK_TYPE_WRITE; 1569422de3eSMichael Neuling if (info->type == HW_BRK_TYPE_TRANSLATE) 1579422de3eSMichael Neuling /* must set alteast read or write */ 1585aae8a53SK.Prasad return ret; 1599422de3eSMichael Neuling if (!(bp->attr.exclude_user)) 1609422de3eSMichael Neuling info->type |= HW_BRK_TYPE_USER; 1619422de3eSMichael Neuling if (!(bp->attr.exclude_kernel)) 1629422de3eSMichael Neuling info->type |= HW_BRK_TYPE_KERNEL; 1639422de3eSMichael Neuling if (!(bp->attr.exclude_hv)) 1649422de3eSMichael Neuling info->type |= HW_BRK_TYPE_HYP; 1655aae8a53SK.Prasad info->address = bp->attr.bp_addr; 1665aae8a53SK.Prasad info->len = bp->attr.bp_len; 1675aae8a53SK.Prasad 1685aae8a53SK.Prasad /* 1695aae8a53SK.Prasad * Since breakpoint length can be a maximum of HW_BREAKPOINT_LEN(8) 1705aae8a53SK.Prasad * and breakpoint addresses are aligned to nearest double-word 1715aae8a53SK.Prasad * HW_BREAKPOINT_ALIGN by rounding off to the lower address, the 1725aae8a53SK.Prasad * 'symbolsize' should satisfy the check below. 1735aae8a53SK.Prasad */ 1744ae7ebe9SMichael Neuling length_max = 8; /* DABR */ 1754ae7ebe9SMichael Neuling if (cpu_has_feature(CPU_FTR_DAWR)) { 1764ae7ebe9SMichael Neuling length_max = 512 ; /* 64 doublewords */ 1774ae7ebe9SMichael Neuling /* DAWR region can't cross 512 boundary */ 1784ae7ebe9SMichael Neuling if ((bp->attr.bp_addr >> 10) != 179e2a800beSMichael Neuling ((bp->attr.bp_addr + bp->attr.bp_len - 1) >> 10)) 1804ae7ebe9SMichael Neuling return -EINVAL; 1814ae7ebe9SMichael Neuling } 1825aae8a53SK.Prasad if (info->len > 1834ae7ebe9SMichael Neuling (length_max - (info->address & HW_BREAKPOINT_ALIGN))) 1845aae8a53SK.Prasad return -EINVAL; 1855aae8a53SK.Prasad return 0; 1865aae8a53SK.Prasad } 1875aae8a53SK.Prasad 1885aae8a53SK.Prasad /* 18906532a67SK.Prasad * Restores the breakpoint on the debug registers. 19006532a67SK.Prasad * Invoke this function if it is known that the execution context is 19106532a67SK.Prasad * about to change to cause loss of MSR_SE settings. 19206532a67SK.Prasad */ 19306532a67SK.Prasad void thread_change_pc(struct task_struct *tsk, struct pt_regs *regs) 19406532a67SK.Prasad { 19506532a67SK.Prasad struct arch_hw_breakpoint *info; 19606532a67SK.Prasad 19706532a67SK.Prasad if (likely(!tsk->thread.last_hit_ubp)) 19806532a67SK.Prasad return; 19906532a67SK.Prasad 20006532a67SK.Prasad info = counter_arch_bp(tsk->thread.last_hit_ubp); 20106532a67SK.Prasad regs->msr &= ~MSR_SE; 20221f58507SPaul Gortmaker __set_breakpoint(info); 20306532a67SK.Prasad tsk->thread.last_hit_ubp = NULL; 20406532a67SK.Prasad } 20506532a67SK.Prasad 20606532a67SK.Prasad /* 2075aae8a53SK.Prasad * Handle debug exception notifications. 2085aae8a53SK.Prasad */ 20903465f89SNicholas Piggin int hw_breakpoint_handler(struct die_args *args) 2105aae8a53SK.Prasad { 2115aae8a53SK.Prasad int rc = NOTIFY_STOP; 2125aae8a53SK.Prasad struct perf_event *bp; 2135aae8a53SK.Prasad struct pt_regs *regs = args->regs; 2145aae8a53SK.Prasad int stepped = 1; 2155aae8a53SK.Prasad struct arch_hw_breakpoint *info; 2165aae8a53SK.Prasad unsigned int instr; 217e3e94084SK.Prasad unsigned long dar = regs->dar; 2185aae8a53SK.Prasad 2195aae8a53SK.Prasad /* Disable breakpoints during exception handling */ 2209422de3eSMichael Neuling hw_breakpoint_disable(); 221574cb248SPaul Mackerras 2225aae8a53SK.Prasad /* 2235aae8a53SK.Prasad * The counter may be concurrently released but that can only 2245aae8a53SK.Prasad * occur from a call_rcu() path. We can then safely fetch 2255aae8a53SK.Prasad * the breakpoint, use its callback, touch its counter 2265aae8a53SK.Prasad * while we are in an rcu_read_lock() path. 2275aae8a53SK.Prasad */ 2285aae8a53SK.Prasad rcu_read_lock(); 2295aae8a53SK.Prasad 23069111bacSChristoph Lameter bp = __this_cpu_read(bp_per_reg); 2315aae8a53SK.Prasad if (!bp) 2325aae8a53SK.Prasad goto out; 2335aae8a53SK.Prasad info = counter_arch_bp(bp); 2345aae8a53SK.Prasad 2355aae8a53SK.Prasad /* 2365aae8a53SK.Prasad * Return early after invoking user-callback function without restoring 2375aae8a53SK.Prasad * DABR if the breakpoint is from ptrace which always operates in 2385aae8a53SK.Prasad * one-shot mode. The ptrace-ed process will receive the SIGTRAP signal 2395aae8a53SK.Prasad * generated in do_dabr(). 2405aae8a53SK.Prasad */ 241574cb248SPaul Mackerras if (bp->overflow_handler == ptrace_triggered) { 2425aae8a53SK.Prasad perf_bp_event(bp, regs); 2435aae8a53SK.Prasad rc = NOTIFY_DONE; 2445aae8a53SK.Prasad goto out; 2455aae8a53SK.Prasad } 2465aae8a53SK.Prasad 247e3e94084SK.Prasad /* 248e3e94084SK.Prasad * Verify if dar lies within the address range occupied by the symbol 249574cb248SPaul Mackerras * being watched to filter extraneous exceptions. If it doesn't, 250574cb248SPaul Mackerras * we still need to single-step the instruction, but we don't 251574cb248SPaul Mackerras * generate an event. 252e3e94084SK.Prasad */ 253540e07c6SMichael Neuling info->type &= ~HW_BRK_TYPE_EXTRANEOUS_IRQ; 2549422de3eSMichael Neuling if (!((bp->attr.bp_addr <= dar) && 2559422de3eSMichael Neuling (dar - bp->attr.bp_addr < bp->attr.bp_len))) 2569422de3eSMichael Neuling info->type |= HW_BRK_TYPE_EXTRANEOUS_IRQ; 257e3e94084SK.Prasad 2585aae8a53SK.Prasad /* Do not emulate user-space instructions, instead single-step them */ 2595aae8a53SK.Prasad if (user_mode(regs)) { 2606d9c00c6SMichael Neuling current->thread.last_hit_ubp = bp; 2615aae8a53SK.Prasad regs->msr |= MSR_SE; 2625aae8a53SK.Prasad goto out; 2635aae8a53SK.Prasad } 2645aae8a53SK.Prasad 2655aae8a53SK.Prasad stepped = 0; 2665aae8a53SK.Prasad instr = 0; 2675aae8a53SK.Prasad if (!__get_user_inatomic(instr, (unsigned int *) regs->nip)) 2685aae8a53SK.Prasad stepped = emulate_step(regs, instr); 2695aae8a53SK.Prasad 2705aae8a53SK.Prasad /* 2715aae8a53SK.Prasad * emulate_step() could not execute it. We've failed in reliably 2725aae8a53SK.Prasad * handling the hw-breakpoint. Unregister it and throw a warning 2735aae8a53SK.Prasad * message to let the user know about it. 2745aae8a53SK.Prasad */ 2755aae8a53SK.Prasad if (!stepped) { 2765aae8a53SK.Prasad WARN(1, "Unable to handle hardware breakpoint. Breakpoint at " 2775aae8a53SK.Prasad "0x%lx will be disabled.", info->address); 2785aab90ceSJiri Olsa perf_event_disable_inatomic(bp); 2795aae8a53SK.Prasad goto out; 2805aae8a53SK.Prasad } 2815aae8a53SK.Prasad /* 2825aae8a53SK.Prasad * As a policy, the callback is invoked in a 'trigger-after-execute' 2835aae8a53SK.Prasad * fashion 2845aae8a53SK.Prasad */ 2859422de3eSMichael Neuling if (!(info->type & HW_BRK_TYPE_EXTRANEOUS_IRQ)) 2865aae8a53SK.Prasad perf_bp_event(bp, regs); 2875aae8a53SK.Prasad 28821f58507SPaul Gortmaker __set_breakpoint(info); 2895aae8a53SK.Prasad out: 2905aae8a53SK.Prasad rcu_read_unlock(); 2915aae8a53SK.Prasad return rc; 2925aae8a53SK.Prasad } 29303465f89SNicholas Piggin NOKPROBE_SYMBOL(hw_breakpoint_handler); 2945aae8a53SK.Prasad 2955aae8a53SK.Prasad /* 2965aae8a53SK.Prasad * Handle single-step exceptions following a DABR hit. 2975aae8a53SK.Prasad */ 29803465f89SNicholas Piggin static int single_step_dabr_instruction(struct die_args *args) 2995aae8a53SK.Prasad { 3005aae8a53SK.Prasad struct pt_regs *regs = args->regs; 3015aae8a53SK.Prasad struct perf_event *bp = NULL; 3023f4693eeSMichael Neuling struct arch_hw_breakpoint *info; 3035aae8a53SK.Prasad 3045aae8a53SK.Prasad bp = current->thread.last_hit_ubp; 3055aae8a53SK.Prasad /* 3065aae8a53SK.Prasad * Check if we are single-stepping as a result of a 3075aae8a53SK.Prasad * previous HW Breakpoint exception 3085aae8a53SK.Prasad */ 3095aae8a53SK.Prasad if (!bp) 3105aae8a53SK.Prasad return NOTIFY_DONE; 3115aae8a53SK.Prasad 3123f4693eeSMichael Neuling info = counter_arch_bp(bp); 3135aae8a53SK.Prasad 3145aae8a53SK.Prasad /* 3155aae8a53SK.Prasad * We shall invoke the user-defined callback function in the single 3165aae8a53SK.Prasad * stepping handler to confirm to 'trigger-after-execute' semantics 3175aae8a53SK.Prasad */ 3189422de3eSMichael Neuling if (!(info->type & HW_BRK_TYPE_EXTRANEOUS_IRQ)) 3195aae8a53SK.Prasad perf_bp_event(bp, regs); 3205aae8a53SK.Prasad 32121f58507SPaul Gortmaker __set_breakpoint(info); 3225aae8a53SK.Prasad current->thread.last_hit_ubp = NULL; 32376b0f133SPaul Mackerras 32476b0f133SPaul Mackerras /* 32576b0f133SPaul Mackerras * If the process was being single-stepped by ptrace, let the 32676b0f133SPaul Mackerras * other single-step actions occur (e.g. generate SIGTRAP). 32776b0f133SPaul Mackerras */ 32876b0f133SPaul Mackerras if (test_thread_flag(TIF_SINGLESTEP)) 32976b0f133SPaul Mackerras return NOTIFY_DONE; 33076b0f133SPaul Mackerras 3315aae8a53SK.Prasad return NOTIFY_STOP; 3325aae8a53SK.Prasad } 33303465f89SNicholas Piggin NOKPROBE_SYMBOL(single_step_dabr_instruction); 3345aae8a53SK.Prasad 3355aae8a53SK.Prasad /* 3365aae8a53SK.Prasad * Handle debug exception notifications. 3375aae8a53SK.Prasad */ 33803465f89SNicholas Piggin int hw_breakpoint_exceptions_notify( 3395aae8a53SK.Prasad struct notifier_block *unused, unsigned long val, void *data) 3405aae8a53SK.Prasad { 3415aae8a53SK.Prasad int ret = NOTIFY_DONE; 3425aae8a53SK.Prasad 3435aae8a53SK.Prasad switch (val) { 3445aae8a53SK.Prasad case DIE_DABR_MATCH: 3455aae8a53SK.Prasad ret = hw_breakpoint_handler(data); 3465aae8a53SK.Prasad break; 3475aae8a53SK.Prasad case DIE_SSTEP: 3485aae8a53SK.Prasad ret = single_step_dabr_instruction(data); 3495aae8a53SK.Prasad break; 3505aae8a53SK.Prasad } 3515aae8a53SK.Prasad 3525aae8a53SK.Prasad return ret; 3535aae8a53SK.Prasad } 35403465f89SNicholas Piggin NOKPROBE_SYMBOL(hw_breakpoint_exceptions_notify); 3555aae8a53SK.Prasad 3565aae8a53SK.Prasad /* 3575aae8a53SK.Prasad * Release the user breakpoints used by ptrace 3585aae8a53SK.Prasad */ 3595aae8a53SK.Prasad void flush_ptrace_hw_breakpoint(struct task_struct *tsk) 3605aae8a53SK.Prasad { 3615aae8a53SK.Prasad struct thread_struct *t = &tsk->thread; 3625aae8a53SK.Prasad 3635aae8a53SK.Prasad unregister_hw_breakpoint(t->ptrace_bps[0]); 3645aae8a53SK.Prasad t->ptrace_bps[0] = NULL; 3655aae8a53SK.Prasad } 3665aae8a53SK.Prasad 3675aae8a53SK.Prasad void hw_breakpoint_pmu_read(struct perf_event *bp) 3685aae8a53SK.Prasad { 3695aae8a53SK.Prasad /* TODO */ 3705aae8a53SK.Prasad } 371