xref: /openbmc/linux/arch/x86/kernel/hw_breakpoint.c (revision ab513927)
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
 *
 * Copyright (C) 2007 Alan Stern
 * Copyright (C) 2009 IBM Corporation
 * Copyright (C) 2009 Frederic Weisbecker <fweisbec@gmail.com>
 *
 * Authors: Alan Stern <stern@rowland.harvard.edu>
 *          K.Prasad <prasad@linux.vnet.ibm.com>
 *          Frederic Weisbecker <fweisbec@gmail.com>
 */
240067f129SK.Prasad 
/*
 * HW_breakpoint: a unified kernel/user-space hardware breakpoint facility,
 * using the CPU's debug registers.
 */
290067f129SK.Prasad 
3024f1e32cSFrederic Weisbecker #include <linux/perf_event.h>
3124f1e32cSFrederic Weisbecker #include <linux/hw_breakpoint.h>
320067f129SK.Prasad #include <linux/irqflags.h>
330067f129SK.Prasad #include <linux/notifier.h>
340067f129SK.Prasad #include <linux/kallsyms.h>
35e5779e8eSAndy Lutomirski #include <linux/kprobes.h>
360067f129SK.Prasad #include <linux/percpu.h>
370067f129SK.Prasad #include <linux/kdebug.h>
380067f129SK.Prasad #include <linux/kernel.h>
390067f129SK.Prasad #include <linux/module.h>
400067f129SK.Prasad #include <linux/sched.h>
410067f129SK.Prasad #include <linux/smp.h>
420067f129SK.Prasad 
430067f129SK.Prasad #include <asm/hw_breakpoint.h>
440067f129SK.Prasad #include <asm/processor.h>
450067f129SK.Prasad #include <asm/debugreg.h>
460067f129SK.Prasad 
4724f1e32cSFrederic Weisbecker /* Per cpu debug control register value */
4828b4e0d8STejun Heo DEFINE_PER_CPU(unsigned long, cpu_dr7);
4928b4e0d8STejun Heo EXPORT_PER_CPU_SYMBOL(cpu_dr7);
5024f1e32cSFrederic Weisbecker 
5124f1e32cSFrederic Weisbecker /* Per cpu debug address registers values */
5224f1e32cSFrederic Weisbecker static DEFINE_PER_CPU(unsigned long, cpu_debugreg[HBP_NUM]);
530067f129SK.Prasad 
540067f129SK.Prasad /*
5524f1e32cSFrederic Weisbecker  * Stores the breakpoints currently in use on each breakpoint address
5624f1e32cSFrederic Weisbecker  * register for each cpus
570067f129SK.Prasad  */
5824f1e32cSFrederic Weisbecker static DEFINE_PER_CPU(struct perf_event *, bp_per_reg[HBP_NUM]);
590067f129SK.Prasad 
600067f129SK.Prasad 
612c31b795SFrederic Weisbecker static inline unsigned long
622c31b795SFrederic Weisbecker __encode_dr7(int drnum, unsigned int len, unsigned int type)
632c31b795SFrederic Weisbecker {
642c31b795SFrederic Weisbecker 	unsigned long bp_info;
652c31b795SFrederic Weisbecker 
662c31b795SFrederic Weisbecker 	bp_info = (len | type) & 0xf;
672c31b795SFrederic Weisbecker 	bp_info <<= (DR_CONTROL_SHIFT + drnum * DR_CONTROL_SIZE);
682c31b795SFrederic Weisbecker 	bp_info |= (DR_GLOBAL_ENABLE << (drnum * DR_ENABLE_SIZE));
692c31b795SFrederic Weisbecker 
702c31b795SFrederic Weisbecker 	return bp_info;
712c31b795SFrederic Weisbecker }
722c31b795SFrederic Weisbecker 
730067f129SK.Prasad /*
740067f129SK.Prasad  * Encode the length, type, Exact, and Enable bits for a particular breakpoint
750067f129SK.Prasad  * as stored in debug register 7.
760067f129SK.Prasad  */
7724f1e32cSFrederic Weisbecker unsigned long encode_dr7(int drnum, unsigned int len, unsigned int type)
780067f129SK.Prasad {
792c31b795SFrederic Weisbecker 	return __encode_dr7(drnum, len, type) | DR_GLOBAL_SLOWDOWN;
800067f129SK.Prasad }
810067f129SK.Prasad 
8224f1e32cSFrederic Weisbecker /*
8324f1e32cSFrederic Weisbecker  * Decode the length and type bits for a particular breakpoint as
8424f1e32cSFrederic Weisbecker  * stored in debug register 7.  Return the "enabled" status.
850067f129SK.Prasad  */
8624f1e32cSFrederic Weisbecker int decode_dr7(unsigned long dr7, int bpnum, unsigned *len, unsigned *type)
8724f1e32cSFrederic Weisbecker {
8824f1e32cSFrederic Weisbecker 	int bp_info = dr7 >> (DR_CONTROL_SHIFT + bpnum * DR_CONTROL_SIZE);
8924f1e32cSFrederic Weisbecker 
9024f1e32cSFrederic Weisbecker 	*len = (bp_info & 0xc) | 0x40;
9124f1e32cSFrederic Weisbecker 	*type = (bp_info & 0x3) | 0x80;
9224f1e32cSFrederic Weisbecker 
9324f1e32cSFrederic Weisbecker 	return (dr7 >> (bpnum * DR_ENABLE_SIZE)) & 0x3;
940067f129SK.Prasad }
950067f129SK.Prasad 
960067f129SK.Prasad /*
9724f1e32cSFrederic Weisbecker  * Install a perf counter breakpoint.
9824f1e32cSFrederic Weisbecker  *
9924f1e32cSFrederic Weisbecker  * We seek a free debug address register and use it for this
10024f1e32cSFrederic Weisbecker  * breakpoint. Eventually we enable it in the debug control register.
10124f1e32cSFrederic Weisbecker  *
10224f1e32cSFrederic Weisbecker  * Atomic: we hold the counter->ctx->lock and we only handle variables
10324f1e32cSFrederic Weisbecker  * and registers local to this cpu.
1040067f129SK.Prasad  */
10524f1e32cSFrederic Weisbecker int arch_install_hw_breakpoint(struct perf_event *bp)
1060067f129SK.Prasad {
10724f1e32cSFrederic Weisbecker 	struct arch_hw_breakpoint *info = counter_arch_bp(bp);
10824f1e32cSFrederic Weisbecker 	unsigned long *dr7;
10924f1e32cSFrederic Weisbecker 	int i;
1100067f129SK.Prasad 
11124f1e32cSFrederic Weisbecker 	for (i = 0; i < HBP_NUM; i++) {
11289cbc767SChristoph Lameter 		struct perf_event **slot = this_cpu_ptr(&bp_per_reg[i]);
11324f1e32cSFrederic Weisbecker 
11424f1e32cSFrederic Weisbecker 		if (!*slot) {
11524f1e32cSFrederic Weisbecker 			*slot = bp;
1160067f129SK.Prasad 			break;
1170067f129SK.Prasad 		}
11824f1e32cSFrederic Weisbecker 	}
1190067f129SK.Prasad 
12024f1e32cSFrederic Weisbecker 	if (WARN_ONCE(i == HBP_NUM, "Can't find any breakpoint slot"))
12124f1e32cSFrederic Weisbecker 		return -EBUSY;
12224f1e32cSFrederic Weisbecker 
12324f1e32cSFrederic Weisbecker 	set_debugreg(info->address, i);
1240a3aee0dSTejun Heo 	__this_cpu_write(cpu_debugreg[i], info->address);
12524f1e32cSFrederic Weisbecker 
12689cbc767SChristoph Lameter 	dr7 = this_cpu_ptr(&cpu_dr7);
12724f1e32cSFrederic Weisbecker 	*dr7 |= encode_dr7(i, info->len, info->type);
12824f1e32cSFrederic Weisbecker 
12924f1e32cSFrederic Weisbecker 	set_debugreg(*dr7, 7);
130d6d55f0bSJacob Shin 	if (info->mask)
131d6d55f0bSJacob Shin 		set_dr_addr_mask(info->mask, i);
13224f1e32cSFrederic Weisbecker 
13324f1e32cSFrederic Weisbecker 	return 0;
1340067f129SK.Prasad }
1350067f129SK.Prasad 
1360067f129SK.Prasad /*
13724f1e32cSFrederic Weisbecker  * Uninstall the breakpoint contained in the given counter.
13824f1e32cSFrederic Weisbecker  *
13924f1e32cSFrederic Weisbecker  * First we search the debug address register it uses and then we disable
14024f1e32cSFrederic Weisbecker  * it.
14124f1e32cSFrederic Weisbecker  *
14224f1e32cSFrederic Weisbecker  * Atomic: we hold the counter->ctx->lock and we only handle variables
14324f1e32cSFrederic Weisbecker  * and registers local to this cpu.
1440067f129SK.Prasad  */
14524f1e32cSFrederic Weisbecker void arch_uninstall_hw_breakpoint(struct perf_event *bp)
1460067f129SK.Prasad {
14724f1e32cSFrederic Weisbecker 	struct arch_hw_breakpoint *info = counter_arch_bp(bp);
14824f1e32cSFrederic Weisbecker 	unsigned long *dr7;
14924f1e32cSFrederic Weisbecker 	int i;
1500067f129SK.Prasad 
15124f1e32cSFrederic Weisbecker 	for (i = 0; i < HBP_NUM; i++) {
15289cbc767SChristoph Lameter 		struct perf_event **slot = this_cpu_ptr(&bp_per_reg[i]);
15324f1e32cSFrederic Weisbecker 
15424f1e32cSFrederic Weisbecker 		if (*slot == bp) {
15524f1e32cSFrederic Weisbecker 			*slot = NULL;
15624f1e32cSFrederic Weisbecker 			break;
15724f1e32cSFrederic Weisbecker 		}
15824f1e32cSFrederic Weisbecker 	}
15924f1e32cSFrederic Weisbecker 
16024f1e32cSFrederic Weisbecker 	if (WARN_ONCE(i == HBP_NUM, "Can't find any breakpoint slot"))
16124f1e32cSFrederic Weisbecker 		return;
16224f1e32cSFrederic Weisbecker 
16389cbc767SChristoph Lameter 	dr7 = this_cpu_ptr(&cpu_dr7);
1642c31b795SFrederic Weisbecker 	*dr7 &= ~__encode_dr7(i, info->len, info->type);
16524f1e32cSFrederic Weisbecker 
16624f1e32cSFrederic Weisbecker 	set_debugreg(*dr7, 7);
167d6d55f0bSJacob Shin 	if (info->mask)
168d6d55f0bSJacob Shin 		set_dr_addr_mask(0, i);
1690067f129SK.Prasad }
1700067f129SK.Prasad 
1710067f129SK.Prasad /*
1720067f129SK.Prasad  * Check for virtual address in kernel space.
1730067f129SK.Prasad  */
174b2812d03SFrederic Weisbecker int arch_check_bp_in_kernelspace(struct perf_event *bp)
1750067f129SK.Prasad {
1760067f129SK.Prasad 	unsigned int len;
177b2812d03SFrederic Weisbecker 	unsigned long va;
178b2812d03SFrederic Weisbecker 	struct arch_hw_breakpoint *info = counter_arch_bp(bp);
1790067f129SK.Prasad 
180b2812d03SFrederic Weisbecker 	va = info->address;
18136748b95SJacob Shin 	len = bp->attr.bp_len;
1820067f129SK.Prasad 
1830067f129SK.Prasad 	return (va >= TASK_SIZE) && ((va + len - 1) >= TASK_SIZE);
1840067f129SK.Prasad }
1850067f129SK.Prasad 
18624f1e32cSFrederic Weisbecker int arch_bp_generic_fields(int x86_len, int x86_type,
18724f1e32cSFrederic Weisbecker 			   int *gen_len, int *gen_type)
18824f1e32cSFrederic Weisbecker {
18989e45aacSFrederic Weisbecker 	/* Type */
19089e45aacSFrederic Weisbecker 	switch (x86_type) {
19189e45aacSFrederic Weisbecker 	case X86_BREAKPOINT_EXECUTE:
19289e45aacSFrederic Weisbecker 		if (x86_len != X86_BREAKPOINT_LEN_X)
19389e45aacSFrederic Weisbecker 			return -EINVAL;
19489e45aacSFrederic Weisbecker 
19589e45aacSFrederic Weisbecker 		*gen_type = HW_BREAKPOINT_X;
19689e45aacSFrederic Weisbecker 		*gen_len = sizeof(long);
19789e45aacSFrederic Weisbecker 		return 0;
19889e45aacSFrederic Weisbecker 	case X86_BREAKPOINT_WRITE:
19989e45aacSFrederic Weisbecker 		*gen_type = HW_BREAKPOINT_W;
20089e45aacSFrederic Weisbecker 		break;
20189e45aacSFrederic Weisbecker 	case X86_BREAKPOINT_RW:
20289e45aacSFrederic Weisbecker 		*gen_type = HW_BREAKPOINT_W | HW_BREAKPOINT_R;
20389e45aacSFrederic Weisbecker 		break;
20489e45aacSFrederic Weisbecker 	default:
20589e45aacSFrederic Weisbecker 		return -EINVAL;
20689e45aacSFrederic Weisbecker 	}
20789e45aacSFrederic Weisbecker 
20824f1e32cSFrederic Weisbecker 	/* Len */
20924f1e32cSFrederic Weisbecker 	switch (x86_len) {
21024f1e32cSFrederic Weisbecker 	case X86_BREAKPOINT_LEN_1:
21124f1e32cSFrederic Weisbecker 		*gen_len = HW_BREAKPOINT_LEN_1;
21224f1e32cSFrederic Weisbecker 		break;
21324f1e32cSFrederic Weisbecker 	case X86_BREAKPOINT_LEN_2:
21424f1e32cSFrederic Weisbecker 		*gen_len = HW_BREAKPOINT_LEN_2;
21524f1e32cSFrederic Weisbecker 		break;
21624f1e32cSFrederic Weisbecker 	case X86_BREAKPOINT_LEN_4:
21724f1e32cSFrederic Weisbecker 		*gen_len = HW_BREAKPOINT_LEN_4;
21824f1e32cSFrederic Weisbecker 		break;
21924f1e32cSFrederic Weisbecker #ifdef CONFIG_X86_64
22024f1e32cSFrederic Weisbecker 	case X86_BREAKPOINT_LEN_8:
22124f1e32cSFrederic Weisbecker 		*gen_len = HW_BREAKPOINT_LEN_8;
22224f1e32cSFrederic Weisbecker 		break;
22324f1e32cSFrederic Weisbecker #endif
22424f1e32cSFrederic Weisbecker 	default:
22524f1e32cSFrederic Weisbecker 		return -EINVAL;
22624f1e32cSFrederic Weisbecker 	}
22724f1e32cSFrederic Weisbecker 
22824f1e32cSFrederic Weisbecker 	return 0;
22924f1e32cSFrederic Weisbecker }
23024f1e32cSFrederic Weisbecker 
23124f1e32cSFrederic Weisbecker 
23224f1e32cSFrederic Weisbecker static int arch_build_bp_info(struct perf_event *bp)
23324f1e32cSFrederic Weisbecker {
23424f1e32cSFrederic Weisbecker 	struct arch_hw_breakpoint *info = counter_arch_bp(bp);
23524f1e32cSFrederic Weisbecker 
23624f1e32cSFrederic Weisbecker 	info->address = bp->attr.bp_addr;
23724f1e32cSFrederic Weisbecker 
238f7809dafSFrederic Weisbecker 	/* Type */
239f7809dafSFrederic Weisbecker 	switch (bp->attr.bp_type) {
240f7809dafSFrederic Weisbecker 	case HW_BREAKPOINT_W:
241f7809dafSFrederic Weisbecker 		info->type = X86_BREAKPOINT_WRITE;
242f7809dafSFrederic Weisbecker 		break;
243f7809dafSFrederic Weisbecker 	case HW_BREAKPOINT_W | HW_BREAKPOINT_R:
244f7809dafSFrederic Weisbecker 		info->type = X86_BREAKPOINT_RW;
245f7809dafSFrederic Weisbecker 		break;
246f7809dafSFrederic Weisbecker 	case HW_BREAKPOINT_X:
247e5779e8eSAndy Lutomirski 		/*
248e5779e8eSAndy Lutomirski 		 * We don't allow kernel breakpoints in places that are not
249e5779e8eSAndy Lutomirski 		 * acceptable for kprobes.  On non-kprobes kernels, we don't
250e5779e8eSAndy Lutomirski 		 * allow kernel breakpoints at all.
251e5779e8eSAndy Lutomirski 		 */
252e5779e8eSAndy Lutomirski 		if (bp->attr.bp_addr >= TASK_SIZE_MAX) {
253e5779e8eSAndy Lutomirski #ifdef CONFIG_KPROBES
254e5779e8eSAndy Lutomirski 			if (within_kprobe_blacklist(bp->attr.bp_addr))
255e5779e8eSAndy Lutomirski 				return -EINVAL;
256e5779e8eSAndy Lutomirski #else
257e5779e8eSAndy Lutomirski 			return -EINVAL;
258e5779e8eSAndy Lutomirski #endif
259e5779e8eSAndy Lutomirski 		}
260e5779e8eSAndy Lutomirski 
261f7809dafSFrederic Weisbecker 		info->type = X86_BREAKPOINT_EXECUTE;
262f7809dafSFrederic Weisbecker 		/*
263f7809dafSFrederic Weisbecker 		 * x86 inst breakpoints need to have a specific undefined len.
264f7809dafSFrederic Weisbecker 		 * But we still need to check userspace is not trying to setup
265f7809dafSFrederic Weisbecker 		 * an unsupported length, to get a range breakpoint for example.
266f7809dafSFrederic Weisbecker 		 */
267f7809dafSFrederic Weisbecker 		if (bp->attr.bp_len == sizeof(long)) {
268f7809dafSFrederic Weisbecker 			info->len = X86_BREAKPOINT_LEN_X;
269f7809dafSFrederic Weisbecker 			return 0;
270f7809dafSFrederic Weisbecker 		}
271f7809dafSFrederic Weisbecker 	default:
272f7809dafSFrederic Weisbecker 		return -EINVAL;
273f7809dafSFrederic Weisbecker 	}
274f7809dafSFrederic Weisbecker 
27524f1e32cSFrederic Weisbecker 	/* Len */
276d6d55f0bSJacob Shin 	info->mask = 0;
277d6d55f0bSJacob Shin 
27824f1e32cSFrederic Weisbecker 	switch (bp->attr.bp_len) {
27924f1e32cSFrederic Weisbecker 	case HW_BREAKPOINT_LEN_1:
28024f1e32cSFrederic Weisbecker 		info->len = X86_BREAKPOINT_LEN_1;
28124f1e32cSFrederic Weisbecker 		break;
28224f1e32cSFrederic Weisbecker 	case HW_BREAKPOINT_LEN_2:
28324f1e32cSFrederic Weisbecker 		info->len = X86_BREAKPOINT_LEN_2;
28424f1e32cSFrederic Weisbecker 		break;
28524f1e32cSFrederic Weisbecker 	case HW_BREAKPOINT_LEN_4:
28624f1e32cSFrederic Weisbecker 		info->len = X86_BREAKPOINT_LEN_4;
28724f1e32cSFrederic Weisbecker 		break;
28824f1e32cSFrederic Weisbecker #ifdef CONFIG_X86_64
28924f1e32cSFrederic Weisbecker 	case HW_BREAKPOINT_LEN_8:
29024f1e32cSFrederic Weisbecker 		info->len = X86_BREAKPOINT_LEN_8;
29124f1e32cSFrederic Weisbecker 		break;
29224f1e32cSFrederic Weisbecker #endif
29324f1e32cSFrederic Weisbecker 	default:
294ab513927SAndy Lutomirski 		/* AMD range breakpoint */
295d6d55f0bSJacob Shin 		if (!is_power_of_2(bp->attr.bp_len))
29624f1e32cSFrederic Weisbecker 			return -EINVAL;
297ab513927SAndy Lutomirski 		if (bp->attr.bp_addr & (bp->attr.bp_len - 1))
298ab513927SAndy Lutomirski 			return -EINVAL;
299ab513927SAndy Lutomirski 		/*
300ab513927SAndy Lutomirski 		 * It's impossible to use a range breakpoint to fake out
301ab513927SAndy Lutomirski 		 * user vs kernel detection because bp_len - 1 can't
302ab513927SAndy Lutomirski 		 * have the high bit set.  If we ever allow range instruction
303ab513927SAndy Lutomirski 		 * breakpoints, then we'll have to check for kprobe-blacklisted
304ab513927SAndy Lutomirski 		 * addresses anywhere in the range.
305ab513927SAndy Lutomirski 		 */
306d6d55f0bSJacob Shin 		if (!cpu_has_bpext)
307d6d55f0bSJacob Shin 			return -EOPNOTSUPP;
308d6d55f0bSJacob Shin 		info->mask = bp->attr.bp_len - 1;
309d6d55f0bSJacob Shin 		info->len = X86_BREAKPOINT_LEN_1;
31024f1e32cSFrederic Weisbecker 	}
31124f1e32cSFrederic Weisbecker 
31224f1e32cSFrederic Weisbecker 	return 0;
31324f1e32cSFrederic Weisbecker }
314d6d55f0bSJacob Shin 
3150067f129SK.Prasad /*
3160067f129SK.Prasad  * Validate the arch-specific HW Breakpoint register settings
3170067f129SK.Prasad  */
318b2812d03SFrederic Weisbecker int arch_validate_hwbkpt_settings(struct perf_event *bp)
3190067f129SK.Prasad {
32024f1e32cSFrederic Weisbecker 	struct arch_hw_breakpoint *info = counter_arch_bp(bp);
3210067f129SK.Prasad 	unsigned int align;
32224f1e32cSFrederic Weisbecker 	int ret;
3230067f129SK.Prasad 
32424f1e32cSFrederic Weisbecker 
32524f1e32cSFrederic Weisbecker 	ret = arch_build_bp_info(bp);
32624f1e32cSFrederic Weisbecker 	if (ret)
32724f1e32cSFrederic Weisbecker 		return ret;
32824f1e32cSFrederic Weisbecker 
32924f1e32cSFrederic Weisbecker 	switch (info->len) {
33024f1e32cSFrederic Weisbecker 	case X86_BREAKPOINT_LEN_1:
3310067f129SK.Prasad 		align = 0;
332d6d55f0bSJacob Shin 		if (info->mask)
333d6d55f0bSJacob Shin 			align = info->mask;
3340067f129SK.Prasad 		break;
33524f1e32cSFrederic Weisbecker 	case X86_BREAKPOINT_LEN_2:
3360067f129SK.Prasad 		align = 1;
3370067f129SK.Prasad 		break;
33824f1e32cSFrederic Weisbecker 	case X86_BREAKPOINT_LEN_4:
3390067f129SK.Prasad 		align = 3;
3400067f129SK.Prasad 		break;
3410067f129SK.Prasad #ifdef CONFIG_X86_64
34224f1e32cSFrederic Weisbecker 	case X86_BREAKPOINT_LEN_8:
3430067f129SK.Prasad 		align = 7;
3440067f129SK.Prasad 		break;
3450067f129SK.Prasad #endif
3460067f129SK.Prasad 	default:
347d6d55f0bSJacob Shin 		WARN_ON_ONCE(1);
3480067f129SK.Prasad 	}
3490067f129SK.Prasad 
35084d71092SFrederic Weisbecker 	/*
3510067f129SK.Prasad 	 * Check that the low-order bits of the address are appropriate
3520067f129SK.Prasad 	 * for the alignment implied by len.
3530067f129SK.Prasad 	 */
35424f1e32cSFrederic Weisbecker 	if (info->address & align)
3550067f129SK.Prasad 		return -EINVAL;
3560067f129SK.Prasad 
3570067f129SK.Prasad 	return 0;
3580067f129SK.Prasad }
3590067f129SK.Prasad 
36024f1e32cSFrederic Weisbecker /*
3619f6b3c2cSFrederic Weisbecker  * Dump the debug register contents to the user.
3629f6b3c2cSFrederic Weisbecker  * We can't dump our per cpu values because it
3639f6b3c2cSFrederic Weisbecker  * may contain cpu wide breakpoint, something that
3649f6b3c2cSFrederic Weisbecker  * doesn't belong to the current task.
3659f6b3c2cSFrederic Weisbecker  *
3669f6b3c2cSFrederic Weisbecker  * TODO: include non-ptrace user breakpoints (perf)
3679f6b3c2cSFrederic Weisbecker  */
3689f6b3c2cSFrederic Weisbecker void aout_dump_debugregs(struct user *dump)
3699f6b3c2cSFrederic Weisbecker {
3709f6b3c2cSFrederic Weisbecker 	int i;
3719f6b3c2cSFrederic Weisbecker 	int dr7 = 0;
3729f6b3c2cSFrederic Weisbecker 	struct perf_event *bp;
3739f6b3c2cSFrederic Weisbecker 	struct arch_hw_breakpoint *info;
3749f6b3c2cSFrederic Weisbecker 	struct thread_struct *thread = &current->thread;
3759f6b3c2cSFrederic Weisbecker 
3769f6b3c2cSFrederic Weisbecker 	for (i = 0; i < HBP_NUM; i++) {
3779f6b3c2cSFrederic Weisbecker 		bp = thread->ptrace_bps[i];
3789f6b3c2cSFrederic Weisbecker 
3799f6b3c2cSFrederic Weisbecker 		if (bp && !bp->attr.disabled) {
3809f6b3c2cSFrederic Weisbecker 			dump->u_debugreg[i] = bp->attr.bp_addr;
3819f6b3c2cSFrederic Weisbecker 			info = counter_arch_bp(bp);
3829f6b3c2cSFrederic Weisbecker 			dr7 |= encode_dr7(i, info->len, info->type);
3839f6b3c2cSFrederic Weisbecker 		} else {
3849f6b3c2cSFrederic Weisbecker 			dump->u_debugreg[i] = 0;
3859f6b3c2cSFrederic Weisbecker 		}
3869f6b3c2cSFrederic Weisbecker 	}
3879f6b3c2cSFrederic Weisbecker 
3889f6b3c2cSFrederic Weisbecker 	dump->u_debugreg[4] = 0;
3899f6b3c2cSFrederic Weisbecker 	dump->u_debugreg[5] = 0;
3909f6b3c2cSFrederic Weisbecker 	dump->u_debugreg[6] = current->thread.debugreg6;
3919f6b3c2cSFrederic Weisbecker 
3929f6b3c2cSFrederic Weisbecker 	dump->u_debugreg[7] = dr7;
3939f6b3c2cSFrederic Weisbecker }
39468efa37dSIngo Molnar EXPORT_SYMBOL_GPL(aout_dump_debugregs);
3959f6b3c2cSFrederic Weisbecker 
3969f6b3c2cSFrederic Weisbecker /*
39724f1e32cSFrederic Weisbecker  * Release the user breakpoints used by ptrace
39824f1e32cSFrederic Weisbecker  */
39924f1e32cSFrederic Weisbecker void flush_ptrace_hw_breakpoint(struct task_struct *tsk)
4000067f129SK.Prasad {
4010067f129SK.Prasad 	int i;
40224f1e32cSFrederic Weisbecker 	struct thread_struct *t = &tsk->thread;
4030067f129SK.Prasad 
40424f1e32cSFrederic Weisbecker 	for (i = 0; i < HBP_NUM; i++) {
40524f1e32cSFrederic Weisbecker 		unregister_hw_breakpoint(t->ptrace_bps[i]);
40624f1e32cSFrederic Weisbecker 		t->ptrace_bps[i] = NULL;
4070067f129SK.Prasad 	}
408f7da04c9SOleg Nesterov 
409f7da04c9SOleg Nesterov 	t->debugreg6 = 0;
410f7da04c9SOleg Nesterov 	t->ptrace_dr7 = 0;
41124f1e32cSFrederic Weisbecker }
41224f1e32cSFrederic Weisbecker 
41324f1e32cSFrederic Weisbecker void hw_breakpoint_restore(void)
41424f1e32cSFrederic Weisbecker {
4150a3aee0dSTejun Heo 	set_debugreg(__this_cpu_read(cpu_debugreg[0]), 0);
4160a3aee0dSTejun Heo 	set_debugreg(__this_cpu_read(cpu_debugreg[1]), 1);
4170a3aee0dSTejun Heo 	set_debugreg(__this_cpu_read(cpu_debugreg[2]), 2);
4180a3aee0dSTejun Heo 	set_debugreg(__this_cpu_read(cpu_debugreg[3]), 3);
41924f1e32cSFrederic Weisbecker 	set_debugreg(current->thread.debugreg6, 6);
4200a3aee0dSTejun Heo 	set_debugreg(__this_cpu_read(cpu_dr7), 7);
42124f1e32cSFrederic Weisbecker }
42224f1e32cSFrederic Weisbecker EXPORT_SYMBOL_GPL(hw_breakpoint_restore);
4230067f129SK.Prasad 
4240067f129SK.Prasad /*
4250067f129SK.Prasad  * Handle debug exception notifications.
4260067f129SK.Prasad  *
4270067f129SK.Prasad  * Return value is either NOTIFY_STOP or NOTIFY_DONE as explained below.
4280067f129SK.Prasad  *
4290067f129SK.Prasad  * NOTIFY_DONE returned if one of the following conditions is true.
4300067f129SK.Prasad  * i) When the causative address is from user-space and the exception
4310067f129SK.Prasad  * is a valid one, i.e. not triggered as a result of lazy debug register
4320067f129SK.Prasad  * switching
4330067f129SK.Prasad  * ii) When there are more bits than trap<n> set in DR6 register (such
4340067f129SK.Prasad  * as BD, BS or BT) indicating that more than one debug condition is
4350067f129SK.Prasad  * met and requires some more action in do_debug().
4360067f129SK.Prasad  *
4370067f129SK.Prasad  * NOTIFY_STOP returned for all other cases
4380067f129SK.Prasad  *
4390067f129SK.Prasad  */
4409c54b616SMasami Hiramatsu static int hw_breakpoint_handler(struct die_args *args)
4410067f129SK.Prasad {
4420067f129SK.Prasad 	int i, cpu, rc = NOTIFY_STOP;
44324f1e32cSFrederic Weisbecker 	struct perf_event *bp;
44462edab90SK.Prasad 	unsigned long dr7, dr6;
44562edab90SK.Prasad 	unsigned long *dr6_p;
44662edab90SK.Prasad 
44762edab90SK.Prasad 	/* The DR6 value is pointed by args->err */
44862edab90SK.Prasad 	dr6_p = (unsigned long *)ERR_PTR(args->err);
44962edab90SK.Prasad 	dr6 = *dr6_p;
4500067f129SK.Prasad 
4516c0aca28SFrederic Weisbecker 	/* If it's a single step, TRAP bits are random */
4526c0aca28SFrederic Weisbecker 	if (dr6 & DR_STEP)
4536c0aca28SFrederic Weisbecker 		return NOTIFY_DONE;
4546c0aca28SFrederic Weisbecker 
4550067f129SK.Prasad 	/* Do an early return if no trap bits are set in DR6 */
4560067f129SK.Prasad 	if ((dr6 & DR_TRAP_BITS) == 0)
4570067f129SK.Prasad 		return NOTIFY_DONE;
4580067f129SK.Prasad 
4590067f129SK.Prasad 	get_debugreg(dr7, 7);
4600067f129SK.Prasad 	/* Disable breakpoints during exception handling */
4610067f129SK.Prasad 	set_debugreg(0UL, 7);
4620067f129SK.Prasad 	/*
4630067f129SK.Prasad 	 * Assert that local interrupts are disabled
4640067f129SK.Prasad 	 * Reset the DRn bits in the virtualized register value.
4650067f129SK.Prasad 	 * The ptrace trigger routine will add in whatever is needed.
4660067f129SK.Prasad 	 */
4670067f129SK.Prasad 	current->thread.debugreg6 &= ~DR_TRAP_BITS;
4680067f129SK.Prasad 	cpu = get_cpu();
4690067f129SK.Prasad 
4700067f129SK.Prasad 	/* Handle all the breakpoints that were triggered */
4710067f129SK.Prasad 	for (i = 0; i < HBP_NUM; ++i) {
4720067f129SK.Prasad 		if (likely(!(dr6 & (DR_TRAP0 << i))))
4730067f129SK.Prasad 			continue;
47424f1e32cSFrederic Weisbecker 
4750067f129SK.Prasad 		/*
47624f1e32cSFrederic Weisbecker 		 * The counter may be concurrently released but that can only
47724f1e32cSFrederic Weisbecker 		 * occur from a call_rcu() path. We can then safely fetch
47824f1e32cSFrederic Weisbecker 		 * the breakpoint, use its callback, touch its counter
47924f1e32cSFrederic Weisbecker 		 * while we are in an rcu_read_lock() path.
4800067f129SK.Prasad 		 */
48124f1e32cSFrederic Weisbecker 		rcu_read_lock();
48224f1e32cSFrederic Weisbecker 
48324f1e32cSFrederic Weisbecker 		bp = per_cpu(bp_per_reg[i], cpu);
4840067f129SK.Prasad 		/*
48562edab90SK.Prasad 		 * Reset the 'i'th TRAP bit in dr6 to denote completion of
48662edab90SK.Prasad 		 * exception handling
48762edab90SK.Prasad 		 */
48862edab90SK.Prasad 		(*dr6_p) &= ~(DR_TRAP0 << i);
48962edab90SK.Prasad 		/*
4900067f129SK.Prasad 		 * bp can be NULL due to lazy debug register switching
49124f1e32cSFrederic Weisbecker 		 * or due to concurrent perf counter removing.
4920067f129SK.Prasad 		 */
49324f1e32cSFrederic Weisbecker 		if (!bp) {
49424f1e32cSFrederic Weisbecker 			rcu_read_unlock();
49524f1e32cSFrederic Weisbecker 			break;
49624f1e32cSFrederic Weisbecker 		}
4970067f129SK.Prasad 
498b326e956SFrederic Weisbecker 		perf_bp_event(bp, args->regs);
49924f1e32cSFrederic Weisbecker 
5000c4519e8SFrederic Weisbecker 		/*
5010c4519e8SFrederic Weisbecker 		 * Set up resume flag to avoid breakpoint recursion when
5020c4519e8SFrederic Weisbecker 		 * returning back to origin.
5030c4519e8SFrederic Weisbecker 		 */
5040c4519e8SFrederic Weisbecker 		if (bp->hw.info.type == X86_BREAKPOINT_EXECUTE)
5050c4519e8SFrederic Weisbecker 			args->regs->flags |= X86_EFLAGS_RF;
5060c4519e8SFrederic Weisbecker 
50724f1e32cSFrederic Weisbecker 		rcu_read_unlock();
5080067f129SK.Prasad 	}
509e0e53db6SK.Prasad 	/*
510e0e53db6SK.Prasad 	 * Further processing in do_debug() is needed for a) user-space
511e0e53db6SK.Prasad 	 * breakpoints (to generate signals) and b) when the system has
512e0e53db6SK.Prasad 	 * taken exception due to multiple causes
513e0e53db6SK.Prasad 	 */
514e0e53db6SK.Prasad 	if ((current->thread.debugreg6 & DR_TRAP_BITS) ||
515e0e53db6SK.Prasad 	    (dr6 & (~DR_TRAP_BITS)))
5160067f129SK.Prasad 		rc = NOTIFY_DONE;
5170067f129SK.Prasad 
5180067f129SK.Prasad 	set_debugreg(dr7, 7);
519eadb8a09SIngo Molnar 	put_cpu();
52024f1e32cSFrederic Weisbecker 
5210067f129SK.Prasad 	return rc;
5220067f129SK.Prasad }
5230067f129SK.Prasad 
5240067f129SK.Prasad /*
5250067f129SK.Prasad  * Handle debug exception notifications.
5260067f129SK.Prasad  */
5279c54b616SMasami Hiramatsu int hw_breakpoint_exceptions_notify(
5280067f129SK.Prasad 		struct notifier_block *unused, unsigned long val, void *data)
5290067f129SK.Prasad {
5300067f129SK.Prasad 	if (val != DIE_DEBUG)
5310067f129SK.Prasad 		return NOTIFY_DONE;
5320067f129SK.Prasad 
5330067f129SK.Prasad 	return hw_breakpoint_handler(data);
5340067f129SK.Prasad }
53524f1e32cSFrederic Weisbecker 
/* Placeholder: intentionally does nothing with @bp for now. */
void hw_breakpoint_pmu_read(struct perf_event *bp)
{
	/* TODO */
}
540