11a59d1b8SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later 20067f129SK.Prasad /* 30067f129SK.Prasad * 40067f129SK.Prasad * Copyright (C) 2007 Alan Stern 50067f129SK.Prasad * Copyright (C) 2009 IBM Corporation 624f1e32cSFrederic Weisbecker * Copyright (C) 2009 Frederic Weisbecker <fweisbec@gmail.com> 7ba6909b7SK.Prasad * 8ba6909b7SK.Prasad * Authors: Alan Stern <stern@rowland.harvard.edu> 9ba6909b7SK.Prasad * K.Prasad <prasad@linux.vnet.ibm.com> 10ba6909b7SK.Prasad * Frederic Weisbecker <fweisbec@gmail.com> 110067f129SK.Prasad */ 120067f129SK.Prasad 130067f129SK.Prasad /* 140067f129SK.Prasad * HW_breakpoint: a unified kernel/user-space hardware breakpoint facility, 150067f129SK.Prasad * using the CPU's debug registers. 160067f129SK.Prasad */ 170067f129SK.Prasad 1824f1e32cSFrederic Weisbecker #include <linux/perf_event.h> 1924f1e32cSFrederic Weisbecker #include <linux/hw_breakpoint.h> 200067f129SK.Prasad #include <linux/irqflags.h> 210067f129SK.Prasad #include <linux/notifier.h> 220067f129SK.Prasad #include <linux/kallsyms.h> 23e5779e8eSAndy Lutomirski #include <linux/kprobes.h> 240067f129SK.Prasad #include <linux/percpu.h> 250067f129SK.Prasad #include <linux/kdebug.h> 260067f129SK.Prasad #include <linux/kernel.h> 27186f4360SPaul Gortmaker #include <linux/export.h> 280067f129SK.Prasad #include <linux/sched.h> 290067f129SK.Prasad #include <linux/smp.h> 300067f129SK.Prasad 310067f129SK.Prasad #include <asm/hw_breakpoint.h> 320067f129SK.Prasad #include <asm/processor.h> 330067f129SK.Prasad #include <asm/debugreg.h> 34186f4360SPaul Gortmaker #include <asm/user.h> 3597417cb9SLai Jiangshan #include <asm/desc.h> 360067f129SK.Prasad 3724f1e32cSFrederic Weisbecker /* Per cpu debug control register value */ 3828b4e0d8STejun Heo DEFINE_PER_CPU(unsigned long, cpu_dr7); 3928b4e0d8STejun Heo EXPORT_PER_CPU_SYMBOL(cpu_dr7); 4024f1e32cSFrederic Weisbecker 4124f1e32cSFrederic Weisbecker /* Per cpu debug address registers values */ 4224f1e32cSFrederic Weisbecker static DEFINE_PER_CPU(unsigned long, cpu_debugreg[HBP_NUM]); 430067f129SK.Prasad 440067f129SK.Prasad /* 4524f1e32cSFrederic Weisbecker * Stores the breakpoints currently in use on each breakpoint address 4624f1e32cSFrederic Weisbecker * register for each cpus 470067f129SK.Prasad */ 4824f1e32cSFrederic Weisbecker static DEFINE_PER_CPU(struct perf_event *, bp_per_reg[HBP_NUM]); 490067f129SK.Prasad 500067f129SK.Prasad 512c31b795SFrederic Weisbecker static inline unsigned long 522c31b795SFrederic Weisbecker __encode_dr7(int drnum, unsigned int len, unsigned int type) 532c31b795SFrederic Weisbecker { 542c31b795SFrederic Weisbecker unsigned long bp_info; 552c31b795SFrederic Weisbecker 562c31b795SFrederic Weisbecker bp_info = (len | type) & 0xf; 572c31b795SFrederic Weisbecker bp_info <<= (DR_CONTROL_SHIFT + drnum * DR_CONTROL_SIZE); 582c31b795SFrederic Weisbecker bp_info |= (DR_GLOBAL_ENABLE << (drnum * DR_ENABLE_SIZE)); 592c31b795SFrederic Weisbecker 602c31b795SFrederic Weisbecker return bp_info; 612c31b795SFrederic Weisbecker } 622c31b795SFrederic Weisbecker 630067f129SK.Prasad /* 640067f129SK.Prasad * Encode the length, type, Exact, and Enable bits for a particular breakpoint 650067f129SK.Prasad * as stored in debug register 7. 660067f129SK.Prasad */ 6724f1e32cSFrederic Weisbecker unsigned long encode_dr7(int drnum, unsigned int len, unsigned int type) 680067f129SK.Prasad { 692c31b795SFrederic Weisbecker return __encode_dr7(drnum, len, type) | DR_GLOBAL_SLOWDOWN; 700067f129SK.Prasad } 710067f129SK.Prasad 7224f1e32cSFrederic Weisbecker /* 7324f1e32cSFrederic Weisbecker * Decode the length and type bits for a particular breakpoint as 7424f1e32cSFrederic Weisbecker * stored in debug register 7. Return the "enabled" status. 750067f129SK.Prasad */ 7624f1e32cSFrederic Weisbecker int decode_dr7(unsigned long dr7, int bpnum, unsigned *len, unsigned *type) 7724f1e32cSFrederic Weisbecker { 7824f1e32cSFrederic Weisbecker int bp_info = dr7 >> (DR_CONTROL_SHIFT + bpnum * DR_CONTROL_SIZE); 7924f1e32cSFrederic Weisbecker 8024f1e32cSFrederic Weisbecker *len = (bp_info & 0xc) | 0x40; 8124f1e32cSFrederic Weisbecker *type = (bp_info & 0x3) | 0x80; 8224f1e32cSFrederic Weisbecker 8324f1e32cSFrederic Weisbecker return (dr7 >> (bpnum * DR_ENABLE_SIZE)) & 0x3; 840067f129SK.Prasad } 850067f129SK.Prasad 860067f129SK.Prasad /* 8724f1e32cSFrederic Weisbecker * Install a perf counter breakpoint. 8824f1e32cSFrederic Weisbecker * 8924f1e32cSFrederic Weisbecker * We seek a free debug address register and use it for this 9024f1e32cSFrederic Weisbecker * breakpoint. Eventually we enable it in the debug control register. 9124f1e32cSFrederic Weisbecker * 9224f1e32cSFrederic Weisbecker * Atomic: we hold the counter->ctx->lock and we only handle variables 9324f1e32cSFrederic Weisbecker * and registers local to this cpu. 940067f129SK.Prasad */ 9524f1e32cSFrederic Weisbecker int arch_install_hw_breakpoint(struct perf_event *bp) 960067f129SK.Prasad { 9724f1e32cSFrederic Weisbecker struct arch_hw_breakpoint *info = counter_arch_bp(bp); 9824f1e32cSFrederic Weisbecker unsigned long *dr7; 9924f1e32cSFrederic Weisbecker int i; 1000067f129SK.Prasad 10124f1e32cSFrederic Weisbecker for (i = 0; i < HBP_NUM; i++) { 10289cbc767SChristoph Lameter struct perf_event **slot = this_cpu_ptr(&bp_per_reg[i]); 10324f1e32cSFrederic Weisbecker 10424f1e32cSFrederic Weisbecker if (!*slot) { 10524f1e32cSFrederic Weisbecker *slot = bp; 1060067f129SK.Prasad break; 1070067f129SK.Prasad } 10824f1e32cSFrederic Weisbecker } 1090067f129SK.Prasad 11024f1e32cSFrederic Weisbecker if (WARN_ONCE(i == HBP_NUM, "Can't find any breakpoint slot")) 11124f1e32cSFrederic Weisbecker return -EBUSY; 11224f1e32cSFrederic Weisbecker 11324f1e32cSFrederic Weisbecker set_debugreg(info->address, i); 1140a3aee0dSTejun Heo __this_cpu_write(cpu_debugreg[i], info->address); 11524f1e32cSFrederic Weisbecker 11689cbc767SChristoph Lameter dr7 = this_cpu_ptr(&cpu_dr7); 11724f1e32cSFrederic Weisbecker *dr7 |= encode_dr7(i, info->len, info->type); 11824f1e32cSFrederic Weisbecker 11924f1e32cSFrederic Weisbecker set_debugreg(*dr7, 7); 120d6d55f0bSJacob Shin if (info->mask) 121d6d55f0bSJacob Shin set_dr_addr_mask(info->mask, i); 12224f1e32cSFrederic Weisbecker 12324f1e32cSFrederic Weisbecker return 0; 1240067f129SK.Prasad } 1250067f129SK.Prasad 1260067f129SK.Prasad /* 12724f1e32cSFrederic Weisbecker * Uninstall the breakpoint contained in the given counter. 12824f1e32cSFrederic Weisbecker * 12924f1e32cSFrederic Weisbecker * First we search the debug address register it uses and then we disable 13024f1e32cSFrederic Weisbecker * it. 13124f1e32cSFrederic Weisbecker * 13224f1e32cSFrederic Weisbecker * Atomic: we hold the counter->ctx->lock and we only handle variables 13324f1e32cSFrederic Weisbecker * and registers local to this cpu. 1340067f129SK.Prasad */ 13524f1e32cSFrederic Weisbecker void arch_uninstall_hw_breakpoint(struct perf_event *bp) 1360067f129SK.Prasad { 13724f1e32cSFrederic Weisbecker struct arch_hw_breakpoint *info = counter_arch_bp(bp); 13824f1e32cSFrederic Weisbecker unsigned long *dr7; 13924f1e32cSFrederic Weisbecker int i; 1400067f129SK.Prasad 14124f1e32cSFrederic Weisbecker for (i = 0; i < HBP_NUM; i++) { 14289cbc767SChristoph Lameter struct perf_event **slot = this_cpu_ptr(&bp_per_reg[i]); 14324f1e32cSFrederic Weisbecker 14424f1e32cSFrederic Weisbecker if (*slot == bp) { 14524f1e32cSFrederic Weisbecker *slot = NULL; 14624f1e32cSFrederic Weisbecker break; 14724f1e32cSFrederic Weisbecker } 14824f1e32cSFrederic Weisbecker } 14924f1e32cSFrederic Weisbecker 15024f1e32cSFrederic Weisbecker if (WARN_ONCE(i == HBP_NUM, "Can't find any breakpoint slot")) 15124f1e32cSFrederic Weisbecker return; 15224f1e32cSFrederic Weisbecker 15389cbc767SChristoph Lameter dr7 = this_cpu_ptr(&cpu_dr7); 1542c31b795SFrederic Weisbecker *dr7 &= ~__encode_dr7(i, info->len, info->type); 15524f1e32cSFrederic Weisbecker 15624f1e32cSFrederic Weisbecker set_debugreg(*dr7, 7); 157d6d55f0bSJacob Shin if (info->mask) 158d6d55f0bSJacob Shin set_dr_addr_mask(0, i); 1590067f129SK.Prasad } 1600067f129SK.Prasad 1618e983ff9SFrederic Weisbecker static int arch_bp_generic_len(int x86_len) 1620067f129SK.Prasad { 1638e983ff9SFrederic Weisbecker switch (x86_len) { 1648e983ff9SFrederic Weisbecker case X86_BREAKPOINT_LEN_1: 1658e983ff9SFrederic Weisbecker return HW_BREAKPOINT_LEN_1; 1668e983ff9SFrederic Weisbecker case X86_BREAKPOINT_LEN_2: 1678e983ff9SFrederic Weisbecker return HW_BREAKPOINT_LEN_2; 1688e983ff9SFrederic Weisbecker case X86_BREAKPOINT_LEN_4: 1698e983ff9SFrederic Weisbecker return HW_BREAKPOINT_LEN_4; 1708e983ff9SFrederic Weisbecker #ifdef CONFIG_X86_64 1718e983ff9SFrederic Weisbecker case X86_BREAKPOINT_LEN_8: 1728e983ff9SFrederic Weisbecker return HW_BREAKPOINT_LEN_8; 1738e983ff9SFrederic Weisbecker #endif 1748e983ff9SFrederic Weisbecker default: 1758e983ff9SFrederic Weisbecker return -EINVAL; 1768e983ff9SFrederic Weisbecker } 1770067f129SK.Prasad } 1780067f129SK.Prasad 17924f1e32cSFrederic Weisbecker int arch_bp_generic_fields(int x86_len, int x86_type, 18024f1e32cSFrederic Weisbecker int *gen_len, int *gen_type) 18124f1e32cSFrederic Weisbecker { 1828e983ff9SFrederic Weisbecker int len; 1838e983ff9SFrederic Weisbecker 18489e45aacSFrederic Weisbecker /* Type */ 18589e45aacSFrederic Weisbecker switch (x86_type) { 18689e45aacSFrederic Weisbecker case X86_BREAKPOINT_EXECUTE: 18789e45aacSFrederic Weisbecker if (x86_len != X86_BREAKPOINT_LEN_X) 18889e45aacSFrederic Weisbecker return -EINVAL; 18989e45aacSFrederic Weisbecker 19089e45aacSFrederic Weisbecker *gen_type = HW_BREAKPOINT_X; 19189e45aacSFrederic Weisbecker *gen_len = sizeof(long); 19289e45aacSFrederic Weisbecker return 0; 19389e45aacSFrederic Weisbecker case X86_BREAKPOINT_WRITE: 19489e45aacSFrederic Weisbecker *gen_type = HW_BREAKPOINT_W; 19589e45aacSFrederic Weisbecker break; 19689e45aacSFrederic Weisbecker case X86_BREAKPOINT_RW: 19789e45aacSFrederic Weisbecker *gen_type = HW_BREAKPOINT_W | HW_BREAKPOINT_R; 19889e45aacSFrederic Weisbecker break; 19989e45aacSFrederic Weisbecker default: 20089e45aacSFrederic Weisbecker return -EINVAL; 20189e45aacSFrederic Weisbecker } 20289e45aacSFrederic Weisbecker 20324f1e32cSFrederic Weisbecker /* Len */ 2048e983ff9SFrederic Weisbecker len = arch_bp_generic_len(x86_len); 2058e983ff9SFrederic Weisbecker if (len < 0) 20624f1e32cSFrederic Weisbecker return -EINVAL; 2078e983ff9SFrederic Weisbecker *gen_len = len; 20824f1e32cSFrederic Weisbecker 20924f1e32cSFrederic Weisbecker return 0; 21024f1e32cSFrederic Weisbecker } 21124f1e32cSFrederic Weisbecker 2128e983ff9SFrederic Weisbecker /* 2138e983ff9SFrederic Weisbecker * Check for virtual address in kernel space. 2148e983ff9SFrederic Weisbecker */ 2158e983ff9SFrederic Weisbecker int arch_check_bp_in_kernelspace(struct arch_hw_breakpoint *hw) 2168e983ff9SFrederic Weisbecker { 2178e983ff9SFrederic Weisbecker unsigned long va; 2188e983ff9SFrederic Weisbecker int len; 2198e983ff9SFrederic Weisbecker 2208e983ff9SFrederic Weisbecker va = hw->address; 2218e983ff9SFrederic Weisbecker len = arch_bp_generic_len(hw->len); 2228e983ff9SFrederic Weisbecker WARN_ON_ONCE(len < 0); 2238e983ff9SFrederic Weisbecker 2248e983ff9SFrederic Weisbecker /* 2258e983ff9SFrederic Weisbecker * We don't need to worry about va + len - 1 overflowing: 2268e983ff9SFrederic Weisbecker * we already require that va is aligned to a multiple of len. 2278e983ff9SFrederic Weisbecker */ 2288e983ff9SFrederic Weisbecker return (va >= TASK_SIZE_MAX) || ((va + len - 1) >= TASK_SIZE_MAX); 2298e983ff9SFrederic Weisbecker } 23024f1e32cSFrederic Weisbecker 23124ae0c91SAndy Lutomirski /* 232d390e6deSLai Jiangshan * Checks whether the range [addr, end], overlaps the area [base, base + size). 233d390e6deSLai Jiangshan */ 234d390e6deSLai Jiangshan static inline bool within_area(unsigned long addr, unsigned long end, 235d390e6deSLai Jiangshan unsigned long base, unsigned long size) 236d390e6deSLai Jiangshan { 237d390e6deSLai Jiangshan return end >= base && addr < (base + size); 238d390e6deSLai Jiangshan } 239d390e6deSLai Jiangshan 240d390e6deSLai Jiangshan /* 24197417cb9SLai Jiangshan * Checks whether the range from addr to end, inclusive, overlaps the fixed 24297417cb9SLai Jiangshan * mapped CPU entry area range or other ranges used for CPU entry. 24324ae0c91SAndy Lutomirski */ 24497417cb9SLai Jiangshan static inline bool within_cpu_entry(unsigned long addr, unsigned long end) 24524ae0c91SAndy Lutomirski { 24697417cb9SLai Jiangshan int cpu; 24797417cb9SLai Jiangshan 24897417cb9SLai Jiangshan /* CPU entry erea is always used for CPU entry */ 24997417cb9SLai Jiangshan if (within_area(addr, end, CPU_ENTRY_AREA_BASE, 25097417cb9SLai Jiangshan CPU_ENTRY_AREA_TOTAL_SIZE)) 25197417cb9SLai Jiangshan return true; 25297417cb9SLai Jiangshan 25397417cb9SLai Jiangshan for_each_possible_cpu(cpu) { 25497417cb9SLai Jiangshan /* The original rw GDT is being used after load_direct_gdt() */ 25597417cb9SLai Jiangshan if (within_area(addr, end, (unsigned long)get_cpu_gdt_rw(cpu), 25697417cb9SLai Jiangshan GDT_SIZE)) 25797417cb9SLai Jiangshan return true; 25897417cb9SLai Jiangshan } 25997417cb9SLai Jiangshan 26097417cb9SLai Jiangshan return false; 26124ae0c91SAndy Lutomirski } 26224ae0c91SAndy Lutomirski 263a0baf043SFrederic Weisbecker static int arch_build_bp_info(struct perf_event *bp, 264a0baf043SFrederic Weisbecker const struct perf_event_attr *attr, 265a0baf043SFrederic Weisbecker struct arch_hw_breakpoint *hw) 26624f1e32cSFrederic Weisbecker { 26724ae0c91SAndy Lutomirski unsigned long bp_end; 26824ae0c91SAndy Lutomirski 26924ae0c91SAndy Lutomirski bp_end = attr->bp_addr + attr->bp_len - 1; 27024ae0c91SAndy Lutomirski if (bp_end < attr->bp_addr) 27124ae0c91SAndy Lutomirski return -EINVAL; 27224ae0c91SAndy Lutomirski 27324ae0c91SAndy Lutomirski /* 27497417cb9SLai Jiangshan * Prevent any breakpoint of any type that overlaps the CPU 27597417cb9SLai Jiangshan * entry area and data. This protects the IST stacks and also 27624ae0c91SAndy Lutomirski * reduces the chance that we ever find out what happens if 27724ae0c91SAndy Lutomirski * there's a data breakpoint on the GDT, IDT, or TSS. 27824ae0c91SAndy Lutomirski */ 27997417cb9SLai Jiangshan if (within_cpu_entry(attr->bp_addr, bp_end)) 28024ae0c91SAndy Lutomirski return -EINVAL; 28124ae0c91SAndy Lutomirski 282a0baf043SFrederic Weisbecker hw->address = attr->bp_addr; 283a0baf043SFrederic Weisbecker hw->mask = 0; 28424f1e32cSFrederic Weisbecker 285f7809dafSFrederic Weisbecker /* Type */ 286a0baf043SFrederic Weisbecker switch (attr->bp_type) { 287f7809dafSFrederic Weisbecker case HW_BREAKPOINT_W: 288a0baf043SFrederic Weisbecker hw->type = X86_BREAKPOINT_WRITE; 289f7809dafSFrederic Weisbecker break; 290f7809dafSFrederic Weisbecker case HW_BREAKPOINT_W | HW_BREAKPOINT_R: 291a0baf043SFrederic Weisbecker hw->type = X86_BREAKPOINT_RW; 292f7809dafSFrederic Weisbecker break; 293f7809dafSFrederic Weisbecker case HW_BREAKPOINT_X: 294e5779e8eSAndy Lutomirski /* 295e5779e8eSAndy Lutomirski * We don't allow kernel breakpoints in places that are not 296e5779e8eSAndy Lutomirski * acceptable for kprobes. On non-kprobes kernels, we don't 297e5779e8eSAndy Lutomirski * allow kernel breakpoints at all. 298e5779e8eSAndy Lutomirski */ 299a0baf043SFrederic Weisbecker if (attr->bp_addr >= TASK_SIZE_MAX) { 300a0baf043SFrederic Weisbecker if (within_kprobe_blacklist(attr->bp_addr)) 301e5779e8eSAndy Lutomirski return -EINVAL; 302e5779e8eSAndy Lutomirski } 303e5779e8eSAndy Lutomirski 304a0baf043SFrederic Weisbecker hw->type = X86_BREAKPOINT_EXECUTE; 305f7809dafSFrederic Weisbecker /* 306f7809dafSFrederic Weisbecker * x86 inst breakpoints need to have a specific undefined len. 307f7809dafSFrederic Weisbecker * But we still need to check userspace is not trying to setup 308f7809dafSFrederic Weisbecker * an unsupported length, to get a range breakpoint for example. 309f7809dafSFrederic Weisbecker */ 310a0baf043SFrederic Weisbecker if (attr->bp_len == sizeof(long)) { 311a0baf043SFrederic Weisbecker hw->len = X86_BREAKPOINT_LEN_X; 312f7809dafSFrederic Weisbecker return 0; 313f7809dafSFrederic Weisbecker } 3146fcebf13SGustavo A. R. Silva /* fall through */ 315f7809dafSFrederic Weisbecker default: 316f7809dafSFrederic Weisbecker return -EINVAL; 317f7809dafSFrederic Weisbecker } 318f7809dafSFrederic Weisbecker 31924f1e32cSFrederic Weisbecker /* Len */ 320a0baf043SFrederic Weisbecker switch (attr->bp_len) { 32124f1e32cSFrederic Weisbecker case HW_BREAKPOINT_LEN_1: 322a0baf043SFrederic Weisbecker hw->len = X86_BREAKPOINT_LEN_1; 32324f1e32cSFrederic Weisbecker break; 32424f1e32cSFrederic Weisbecker case HW_BREAKPOINT_LEN_2: 325a0baf043SFrederic Weisbecker hw->len = X86_BREAKPOINT_LEN_2; 32624f1e32cSFrederic Weisbecker break; 32724f1e32cSFrederic Weisbecker case HW_BREAKPOINT_LEN_4: 328a0baf043SFrederic Weisbecker hw->len = X86_BREAKPOINT_LEN_4; 32924f1e32cSFrederic Weisbecker break; 33024f1e32cSFrederic Weisbecker #ifdef CONFIG_X86_64 33124f1e32cSFrederic Weisbecker case HW_BREAKPOINT_LEN_8: 332a0baf043SFrederic Weisbecker hw->len = X86_BREAKPOINT_LEN_8; 33324f1e32cSFrederic Weisbecker break; 33424f1e32cSFrederic Weisbecker #endif 33524f1e32cSFrederic Weisbecker default: 336ab513927SAndy Lutomirski /* AMD range breakpoint */ 337a0baf043SFrederic Weisbecker if (!is_power_of_2(attr->bp_len)) 33824f1e32cSFrederic Weisbecker return -EINVAL; 339a0baf043SFrederic Weisbecker if (attr->bp_addr & (attr->bp_len - 1)) 340ab513927SAndy Lutomirski return -EINVAL; 341362f924bSBorislav Petkov 342362f924bSBorislav Petkov if (!boot_cpu_has(X86_FEATURE_BPEXT)) 343362f924bSBorislav Petkov return -EOPNOTSUPP; 344362f924bSBorislav Petkov 345ab513927SAndy Lutomirski /* 346ab513927SAndy Lutomirski * It's impossible to use a range breakpoint to fake out 347ab513927SAndy Lutomirski * user vs kernel detection because bp_len - 1 can't 348ab513927SAndy Lutomirski * have the high bit set. If we ever allow range instruction 349ab513927SAndy Lutomirski * breakpoints, then we'll have to check for kprobe-blacklisted 350ab513927SAndy Lutomirski * addresses anywhere in the range. 351ab513927SAndy Lutomirski */ 352a0baf043SFrederic Weisbecker hw->mask = attr->bp_len - 1; 353a0baf043SFrederic Weisbecker hw->len = X86_BREAKPOINT_LEN_1; 35424f1e32cSFrederic Weisbecker } 35524f1e32cSFrederic Weisbecker 35624f1e32cSFrederic Weisbecker return 0; 35724f1e32cSFrederic Weisbecker } 358d6d55f0bSJacob Shin 3590067f129SK.Prasad /* 3600067f129SK.Prasad * Validate the arch-specific HW Breakpoint register settings 3610067f129SK.Prasad */ 362a0baf043SFrederic Weisbecker int hw_breakpoint_arch_parse(struct perf_event *bp, 363a0baf043SFrederic Weisbecker const struct perf_event_attr *attr, 364a0baf043SFrederic Weisbecker struct arch_hw_breakpoint *hw) 3650067f129SK.Prasad { 3660067f129SK.Prasad unsigned int align; 36724f1e32cSFrederic Weisbecker int ret; 3680067f129SK.Prasad 36924f1e32cSFrederic Weisbecker 370a0baf043SFrederic Weisbecker ret = arch_build_bp_info(bp, attr, hw); 37124f1e32cSFrederic Weisbecker if (ret) 37224f1e32cSFrederic Weisbecker return ret; 37324f1e32cSFrederic Weisbecker 374a0baf043SFrederic Weisbecker switch (hw->len) { 37524f1e32cSFrederic Weisbecker case X86_BREAKPOINT_LEN_1: 3760067f129SK.Prasad align = 0; 377a0baf043SFrederic Weisbecker if (hw->mask) 378a0baf043SFrederic Weisbecker align = hw->mask; 3790067f129SK.Prasad break; 38024f1e32cSFrederic Weisbecker case X86_BREAKPOINT_LEN_2: 3810067f129SK.Prasad align = 1; 3820067f129SK.Prasad break; 38324f1e32cSFrederic Weisbecker case X86_BREAKPOINT_LEN_4: 3840067f129SK.Prasad align = 3; 3850067f129SK.Prasad break; 3860067f129SK.Prasad #ifdef CONFIG_X86_64 38724f1e32cSFrederic Weisbecker case X86_BREAKPOINT_LEN_8: 3880067f129SK.Prasad align = 7; 3890067f129SK.Prasad break; 3900067f129SK.Prasad #endif 3910067f129SK.Prasad default: 392d6d55f0bSJacob Shin WARN_ON_ONCE(1); 393e898e69dSNathan Chancellor return -EINVAL; 3940067f129SK.Prasad } 3950067f129SK.Prasad 39684d71092SFrederic Weisbecker /* 3970067f129SK.Prasad * Check that the low-order bits of the address are appropriate 3980067f129SK.Prasad * for the alignment implied by len. 3990067f129SK.Prasad */ 400a0baf043SFrederic Weisbecker if (hw->address & align) 4010067f129SK.Prasad return -EINVAL; 4020067f129SK.Prasad 4030067f129SK.Prasad return 0; 4040067f129SK.Prasad } 4050067f129SK.Prasad 40624f1e32cSFrederic Weisbecker /* 4079f6b3c2cSFrederic Weisbecker * Dump the debug register contents to the user. 4089f6b3c2cSFrederic Weisbecker * We can't dump our per cpu values because it 4099f6b3c2cSFrederic Weisbecker * may contain cpu wide breakpoint, something that 4109f6b3c2cSFrederic Weisbecker * doesn't belong to the current task. 4119f6b3c2cSFrederic Weisbecker * 4129f6b3c2cSFrederic Weisbecker * TODO: include non-ptrace user breakpoints (perf) 4139f6b3c2cSFrederic Weisbecker */ 4149f6b3c2cSFrederic Weisbecker void aout_dump_debugregs(struct user *dump) 4159f6b3c2cSFrederic Weisbecker { 4169f6b3c2cSFrederic Weisbecker int i; 4179f6b3c2cSFrederic Weisbecker int dr7 = 0; 4189f6b3c2cSFrederic Weisbecker struct perf_event *bp; 4199f6b3c2cSFrederic Weisbecker struct arch_hw_breakpoint *info; 4209f6b3c2cSFrederic Weisbecker struct thread_struct *thread = ¤t->thread; 4219f6b3c2cSFrederic Weisbecker 4229f6b3c2cSFrederic Weisbecker for (i = 0; i < HBP_NUM; i++) { 4239f6b3c2cSFrederic Weisbecker bp = thread->ptrace_bps[i]; 4249f6b3c2cSFrederic Weisbecker 4259f6b3c2cSFrederic Weisbecker if (bp && !bp->attr.disabled) { 4269f6b3c2cSFrederic Weisbecker dump->u_debugreg[i] = bp->attr.bp_addr; 4279f6b3c2cSFrederic Weisbecker info = counter_arch_bp(bp); 4289f6b3c2cSFrederic Weisbecker dr7 |= encode_dr7(i, info->len, info->type); 4299f6b3c2cSFrederic Weisbecker } else { 4309f6b3c2cSFrederic Weisbecker dump->u_debugreg[i] = 0; 4319f6b3c2cSFrederic Weisbecker } 4329f6b3c2cSFrederic Weisbecker } 4339f6b3c2cSFrederic Weisbecker 4349f6b3c2cSFrederic Weisbecker dump->u_debugreg[4] = 0; 4359f6b3c2cSFrederic Weisbecker dump->u_debugreg[5] = 0; 4369f6b3c2cSFrederic Weisbecker dump->u_debugreg[6] = current->thread.debugreg6; 4379f6b3c2cSFrederic Weisbecker 4389f6b3c2cSFrederic Weisbecker dump->u_debugreg[7] = dr7; 4399f6b3c2cSFrederic Weisbecker } 44068efa37dSIngo Molnar EXPORT_SYMBOL_GPL(aout_dump_debugregs); 4419f6b3c2cSFrederic Weisbecker 4429f6b3c2cSFrederic Weisbecker /* 44324f1e32cSFrederic Weisbecker * Release the user breakpoints used by ptrace 44424f1e32cSFrederic Weisbecker */ 44524f1e32cSFrederic Weisbecker void flush_ptrace_hw_breakpoint(struct task_struct *tsk) 4460067f129SK.Prasad { 4470067f129SK.Prasad int i; 44824f1e32cSFrederic Weisbecker struct thread_struct *t = &tsk->thread; 4490067f129SK.Prasad 45024f1e32cSFrederic Weisbecker for (i = 0; i < HBP_NUM; i++) { 45124f1e32cSFrederic Weisbecker unregister_hw_breakpoint(t->ptrace_bps[i]); 45224f1e32cSFrederic Weisbecker t->ptrace_bps[i] = NULL; 4530067f129SK.Prasad } 454f7da04c9SOleg Nesterov 455f7da04c9SOleg Nesterov t->debugreg6 = 0; 456f7da04c9SOleg Nesterov t->ptrace_dr7 = 0; 45724f1e32cSFrederic Weisbecker } 45824f1e32cSFrederic Weisbecker 45924f1e32cSFrederic Weisbecker void hw_breakpoint_restore(void) 46024f1e32cSFrederic Weisbecker { 4610a3aee0dSTejun Heo set_debugreg(__this_cpu_read(cpu_debugreg[0]), 0); 4620a3aee0dSTejun Heo set_debugreg(__this_cpu_read(cpu_debugreg[1]), 1); 4630a3aee0dSTejun Heo set_debugreg(__this_cpu_read(cpu_debugreg[2]), 2); 4640a3aee0dSTejun Heo set_debugreg(__this_cpu_read(cpu_debugreg[3]), 3); 46524f1e32cSFrederic Weisbecker set_debugreg(current->thread.debugreg6, 6); 4660a3aee0dSTejun Heo set_debugreg(__this_cpu_read(cpu_dr7), 7); 46724f1e32cSFrederic Weisbecker } 46824f1e32cSFrederic Weisbecker EXPORT_SYMBOL_GPL(hw_breakpoint_restore); 4690067f129SK.Prasad 4700067f129SK.Prasad /* 4710067f129SK.Prasad * Handle debug exception notifications. 4720067f129SK.Prasad * 4730067f129SK.Prasad * Return value is either NOTIFY_STOP or NOTIFY_DONE as explained below. 4740067f129SK.Prasad * 4750067f129SK.Prasad * NOTIFY_DONE returned if one of the following conditions is true. 4760067f129SK.Prasad * i) When the causative address is from user-space and the exception 4770067f129SK.Prasad * is a valid one, i.e. not triggered as a result of lazy debug register 4780067f129SK.Prasad * switching 4790067f129SK.Prasad * ii) When there are more bits than trap<n> set in DR6 register (such 4800067f129SK.Prasad * as BD, BS or BT) indicating that more than one debug condition is 4810067f129SK.Prasad * met and requires some more action in do_debug(). 4820067f129SK.Prasad * 4830067f129SK.Prasad * NOTIFY_STOP returned for all other cases 4840067f129SK.Prasad * 4850067f129SK.Prasad */ 4869c54b616SMasami Hiramatsu static int hw_breakpoint_handler(struct die_args *args) 4870067f129SK.Prasad { 4880067f129SK.Prasad int i, cpu, rc = NOTIFY_STOP; 48924f1e32cSFrederic Weisbecker struct perf_event *bp; 4909f58fddeSPeter Zijlstra unsigned long dr6; 49162edab90SK.Prasad unsigned long *dr6_p; 49262edab90SK.Prasad 49362edab90SK.Prasad /* The DR6 value is pointed by args->err */ 49462edab90SK.Prasad dr6_p = (unsigned long *)ERR_PTR(args->err); 49562edab90SK.Prasad dr6 = *dr6_p; 4960067f129SK.Prasad 4976c0aca28SFrederic Weisbecker /* If it's a single step, TRAP bits are random */ 4986c0aca28SFrederic Weisbecker if (dr6 & DR_STEP) 4996c0aca28SFrederic Weisbecker return NOTIFY_DONE; 5006c0aca28SFrederic Weisbecker 5010067f129SK.Prasad /* Do an early return if no trap bits are set in DR6 */ 5020067f129SK.Prasad if ((dr6 & DR_TRAP_BITS) == 0) 5030067f129SK.Prasad return NOTIFY_DONE; 5040067f129SK.Prasad 5050067f129SK.Prasad /* 5060067f129SK.Prasad * Assert that local interrupts are disabled 5070067f129SK.Prasad * Reset the DRn bits in the virtualized register value. 5080067f129SK.Prasad * The ptrace trigger routine will add in whatever is needed. 5090067f129SK.Prasad */ 5100067f129SK.Prasad current->thread.debugreg6 &= ~DR_TRAP_BITS; 5110067f129SK.Prasad cpu = get_cpu(); 5120067f129SK.Prasad 5130067f129SK.Prasad /* Handle all the breakpoints that were triggered */ 5140067f129SK.Prasad for (i = 0; i < HBP_NUM; ++i) { 5150067f129SK.Prasad if (likely(!(dr6 & (DR_TRAP0 << i)))) 5160067f129SK.Prasad continue; 51724f1e32cSFrederic Weisbecker 5180067f129SK.Prasad /* 51924f1e32cSFrederic Weisbecker * The counter may be concurrently released but that can only 52024f1e32cSFrederic Weisbecker * occur from a call_rcu() path. We can then safely fetch 52124f1e32cSFrederic Weisbecker * the breakpoint, use its callback, touch its counter 52224f1e32cSFrederic Weisbecker * while we are in an rcu_read_lock() path. 5230067f129SK.Prasad */ 52424f1e32cSFrederic Weisbecker rcu_read_lock(); 52524f1e32cSFrederic Weisbecker 52624f1e32cSFrederic Weisbecker bp = per_cpu(bp_per_reg[i], cpu); 5270067f129SK.Prasad /* 52862edab90SK.Prasad * Reset the 'i'th TRAP bit in dr6 to denote completion of 52962edab90SK.Prasad * exception handling 53062edab90SK.Prasad */ 53162edab90SK.Prasad (*dr6_p) &= ~(DR_TRAP0 << i); 53262edab90SK.Prasad /* 5330067f129SK.Prasad * bp can be NULL due to lazy debug register switching 53424f1e32cSFrederic Weisbecker * or due to concurrent perf counter removing. 5350067f129SK.Prasad */ 53624f1e32cSFrederic Weisbecker if (!bp) { 53724f1e32cSFrederic Weisbecker rcu_read_unlock(); 53824f1e32cSFrederic Weisbecker break; 53924f1e32cSFrederic Weisbecker } 5400067f129SK.Prasad 541b326e956SFrederic Weisbecker perf_bp_event(bp, args->regs); 54224f1e32cSFrederic Weisbecker 5430c4519e8SFrederic Weisbecker /* 5440c4519e8SFrederic Weisbecker * Set up resume flag to avoid breakpoint recursion when 5450c4519e8SFrederic Weisbecker * returning back to origin. 5460c4519e8SFrederic Weisbecker */ 5470c4519e8SFrederic Weisbecker if (bp->hw.info.type == X86_BREAKPOINT_EXECUTE) 5480c4519e8SFrederic Weisbecker args->regs->flags |= X86_EFLAGS_RF; 5490c4519e8SFrederic Weisbecker 55024f1e32cSFrederic Weisbecker rcu_read_unlock(); 5510067f129SK.Prasad } 552e0e53db6SK.Prasad /* 553e0e53db6SK.Prasad * Further processing in do_debug() is needed for a) user-space 554e0e53db6SK.Prasad * breakpoints (to generate signals) and b) when the system has 555e0e53db6SK.Prasad * taken exception due to multiple causes 556e0e53db6SK.Prasad */ 557e0e53db6SK.Prasad if ((current->thread.debugreg6 & DR_TRAP_BITS) || 558e0e53db6SK.Prasad (dr6 & (~DR_TRAP_BITS))) 5590067f129SK.Prasad rc = NOTIFY_DONE; 5600067f129SK.Prasad 561eadb8a09SIngo Molnar put_cpu(); 56224f1e32cSFrederic Weisbecker 5630067f129SK.Prasad return rc; 5640067f129SK.Prasad } 5650067f129SK.Prasad 5660067f129SK.Prasad /* 5670067f129SK.Prasad * Handle debug exception notifications. 5680067f129SK.Prasad */ 5699c54b616SMasami Hiramatsu int hw_breakpoint_exceptions_notify( 5700067f129SK.Prasad struct notifier_block *unused, unsigned long val, void *data) 5710067f129SK.Prasad { 5720067f129SK.Prasad if (val != DIE_DEBUG) 5730067f129SK.Prasad return NOTIFY_DONE; 5740067f129SK.Prasad 5750067f129SK.Prasad return hw_breakpoint_handler(data); 5760067f129SK.Prasad } 57724f1e32cSFrederic Weisbecker 57824f1e32cSFrederic Weisbecker void hw_breakpoint_pmu_read(struct perf_event *bp) 57924f1e32cSFrederic Weisbecker { 58024f1e32cSFrederic Weisbecker /* TODO */ 58124f1e32cSFrederic Weisbecker } 582