xref: /openbmc/linux/arch/powerpc/kernel/kprobes.c (revision a16be368)
1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3  *  Kernel Probes (KProbes)
4  *
5  * Copyright (C) IBM Corporation, 2002, 2004
6  *
7  * 2002-Oct	Created by Vamsi Krishna S <vamsi_krishna@in.ibm.com> Kernel
8  *		Probes initial implementation ( includes contributions from
9  *		Rusty Russell).
10  * 2004-July	Suparna Bhattacharya <suparna@in.ibm.com> added jumper probes
11  *		interface to access function arguments.
12  * 2004-Nov	Ananth N Mavinakayanahalli <ananth@in.ibm.com> kprobes port
13  *		for PPC64
14  */
15 
16 #include <linux/kprobes.h>
17 #include <linux/ptrace.h>
18 #include <linux/preempt.h>
19 #include <linux/extable.h>
20 #include <linux/kdebug.h>
21 #include <linux/slab.h>
22 #include <asm/code-patching.h>
23 #include <asm/cacheflush.h>
24 #include <asm/sstep.h>
25 #include <asm/sections.h>
26 #include <asm/inst.h>
27 #include <linux/uaccess.h>
28 
29 DEFINE_PER_CPU(struct kprobe *, current_kprobe) = NULL;
30 DEFINE_PER_CPU(struct kprobe_ctlblk, kprobe_ctlblk);
31 
32 struct kretprobe_blackpoint kretprobe_blacklist[] = {{NULL, NULL}};
33 
34 bool arch_within_kprobe_blacklist(unsigned long addr)
35 {
36 	return  (addr >= (unsigned long)__kprobes_text_start &&
37 		 addr < (unsigned long)__kprobes_text_end) ||
38 		(addr >= (unsigned long)_stext &&
39 		 addr < (unsigned long)__head_end);
40 }
41 
42 kprobe_opcode_t *kprobe_lookup_name(const char *name, unsigned int offset)
43 {
44 	kprobe_opcode_t *addr = NULL;
45 
46 #ifdef PPC64_ELF_ABI_v2
47 	/* PPC64 ABIv2 needs local entry point */
48 	addr = (kprobe_opcode_t *)kallsyms_lookup_name(name);
49 	if (addr && !offset) {
50 #ifdef CONFIG_KPROBES_ON_FTRACE
51 		unsigned long faddr;
52 		/*
53 		 * Per livepatch.h, ftrace location is always within the first
54 		 * 16 bytes of a function on powerpc with -mprofile-kernel.
55 		 */
56 		faddr = ftrace_location_range((unsigned long)addr,
57 					      (unsigned long)addr + 16);
58 		if (faddr)
59 			addr = (kprobe_opcode_t *)faddr;
60 		else
61 #endif
62 			addr = (kprobe_opcode_t *)ppc_function_entry(addr);
63 	}
64 #elif defined(PPC64_ELF_ABI_v1)
65 	/*
66 	 * 64bit powerpc ABIv1 uses function descriptors:
67 	 * - Check for the dot variant of the symbol first.
68 	 * - If that fails, try looking up the symbol provided.
69 	 *
70 	 * This ensures we always get to the actual symbol and not
71 	 * the descriptor.
72 	 *
73 	 * Also handle <module:symbol> format.
74 	 */
75 	char dot_name[MODULE_NAME_LEN + 1 + KSYM_NAME_LEN];
76 	bool dot_appended = false;
77 	const char *c;
78 	ssize_t ret = 0;
79 	int len = 0;
80 
81 	if ((c = strnchr(name, MODULE_NAME_LEN, ':')) != NULL) {
82 		c++;
83 		len = c - name;
84 		memcpy(dot_name, name, len);
85 	} else
86 		c = name;
87 
88 	if (*c != '\0' && *c != '.') {
89 		dot_name[len++] = '.';
90 		dot_appended = true;
91 	}
92 	ret = strscpy(dot_name + len, c, KSYM_NAME_LEN);
93 	if (ret > 0)
94 		addr = (kprobe_opcode_t *)kallsyms_lookup_name(dot_name);
95 
96 	/* Fallback to the original non-dot symbol lookup */
97 	if (!addr && dot_appended)
98 		addr = (kprobe_opcode_t *)kallsyms_lookup_name(name);
99 #else
100 	addr = (kprobe_opcode_t *)kallsyms_lookup_name(name);
101 #endif
102 
103 	return addr;
104 }
105 
106 int arch_prepare_kprobe(struct kprobe *p)
107 {
108 	int ret = 0;
109 	struct kprobe *prev;
110 	struct ppc_inst insn = ppc_inst_read((struct ppc_inst *)p->addr);
111 	struct ppc_inst prefix = ppc_inst_read((struct ppc_inst *)(p->addr - 1));
112 
113 	if ((unsigned long)p->addr & 0x03) {
114 		printk("Attempt to register kprobe at an unaligned address\n");
115 		ret = -EINVAL;
116 	} else if (IS_MTMSRD(insn) || IS_RFID(insn) || IS_RFI(insn)) {
117 		printk("Cannot register a kprobe on rfi/rfid or mtmsr[d]\n");
118 		ret = -EINVAL;
119 	} else if (ppc_inst_prefixed(prefix)) {
120 		printk("Cannot register a kprobe on the second word of prefixed instruction\n");
121 		ret = -EINVAL;
122 	}
123 	preempt_disable();
124 	prev = get_kprobe(p->addr - 1);
125 	preempt_enable_no_resched();
126 	if (prev &&
127 	    ppc_inst_prefixed(ppc_inst_read((struct ppc_inst *)prev->ainsn.insn))) {
128 		printk("Cannot register a kprobe on the second word of prefixed instruction\n");
129 		ret = -EINVAL;
130 	}
131 
132 	/* insn must be on a special executable page on ppc64.  This is
133 	 * not explicitly required on ppc32 (right now), but it doesn't hurt */
134 	if (!ret) {
135 		p->ainsn.insn = get_insn_slot();
136 		if (!p->ainsn.insn)
137 			ret = -ENOMEM;
138 	}
139 
140 	if (!ret) {
141 		patch_instruction((struct ppc_inst *)p->ainsn.insn, insn);
142 		p->opcode = ppc_inst_val(insn);
143 	}
144 
145 	p->ainsn.boostable = 0;
146 	return ret;
147 }
148 NOKPROBE_SYMBOL(arch_prepare_kprobe);
149 
150 void arch_arm_kprobe(struct kprobe *p)
151 {
152 	patch_instruction((struct ppc_inst *)p->addr, ppc_inst(BREAKPOINT_INSTRUCTION));
153 }
154 NOKPROBE_SYMBOL(arch_arm_kprobe);
155 
156 void arch_disarm_kprobe(struct kprobe *p)
157 {
158 	patch_instruction((struct ppc_inst *)p->addr, ppc_inst(p->opcode));
159 }
160 NOKPROBE_SYMBOL(arch_disarm_kprobe);
161 
162 void arch_remove_kprobe(struct kprobe *p)
163 {
164 	if (p->ainsn.insn) {
165 		free_insn_slot(p->ainsn.insn, 0);
166 		p->ainsn.insn = NULL;
167 	}
168 }
169 NOKPROBE_SYMBOL(arch_remove_kprobe);
170 
171 static nokprobe_inline void prepare_singlestep(struct kprobe *p, struct pt_regs *regs)
172 {
173 	enable_single_step(regs);
174 
175 	/*
176 	 * On powerpc we should single step on the original
177 	 * instruction even if the probed insn is a trap
178 	 * variant as values in regs could play a part in
179 	 * if the trap is taken or not
180 	 */
181 	regs->nip = (unsigned long)p->ainsn.insn;
182 }
183 
184 static nokprobe_inline void save_previous_kprobe(struct kprobe_ctlblk *kcb)
185 {
186 	kcb->prev_kprobe.kp = kprobe_running();
187 	kcb->prev_kprobe.status = kcb->kprobe_status;
188 	kcb->prev_kprobe.saved_msr = kcb->kprobe_saved_msr;
189 }
190 
191 static nokprobe_inline void restore_previous_kprobe(struct kprobe_ctlblk *kcb)
192 {
193 	__this_cpu_write(current_kprobe, kcb->prev_kprobe.kp);
194 	kcb->kprobe_status = kcb->prev_kprobe.status;
195 	kcb->kprobe_saved_msr = kcb->prev_kprobe.saved_msr;
196 }
197 
198 static nokprobe_inline void set_current_kprobe(struct kprobe *p, struct pt_regs *regs,
199 				struct kprobe_ctlblk *kcb)
200 {
201 	__this_cpu_write(current_kprobe, p);
202 	kcb->kprobe_saved_msr = regs->msr;
203 }
204 
205 bool arch_kprobe_on_func_entry(unsigned long offset)
206 {
207 #ifdef PPC64_ELF_ABI_v2
208 #ifdef CONFIG_KPROBES_ON_FTRACE
209 	return offset <= 16;
210 #else
211 	return offset <= 8;
212 #endif
213 #else
214 	return !offset;
215 #endif
216 }
217 
218 void arch_prepare_kretprobe(struct kretprobe_instance *ri, struct pt_regs *regs)
219 {
220 	ri->ret_addr = (kprobe_opcode_t *)regs->link;
221 
222 	/* Replace the return addr with trampoline addr */
223 	regs->link = (unsigned long)kretprobe_trampoline;
224 }
225 NOKPROBE_SYMBOL(arch_prepare_kretprobe);
226 
227 static int try_to_emulate(struct kprobe *p, struct pt_regs *regs)
228 {
229 	int ret;
230 	struct ppc_inst insn = ppc_inst_read((struct ppc_inst *)p->ainsn.insn);
231 
232 	/* regs->nip is also adjusted if emulate_step returns 1 */
233 	ret = emulate_step(regs, insn);
234 	if (ret > 0) {
235 		/*
236 		 * Once this instruction has been boosted
237 		 * successfully, set the boostable flag
238 		 */
239 		if (unlikely(p->ainsn.boostable == 0))
240 			p->ainsn.boostable = 1;
241 	} else if (ret < 0) {
242 		/*
243 		 * We don't allow kprobes on mtmsr(d)/rfi(d), etc.
244 		 * So, we should never get here... but, its still
245 		 * good to catch them, just in case...
246 		 */
247 		printk("Can't step on instruction %x\n", ppc_inst_val(insn));
248 		BUG();
249 	} else {
250 		/*
251 		 * If we haven't previously emulated this instruction, then it
252 		 * can't be boosted. Note it down so we don't try to do so again.
253 		 *
254 		 * If, however, we had emulated this instruction in the past,
255 		 * then this is just an error with the current run (for
256 		 * instance, exceptions due to a load/store). We return 0 so
257 		 * that this is now single-stepped, but continue to try
258 		 * emulating it in subsequent probe hits.
259 		 */
260 		if (unlikely(p->ainsn.boostable != 1))
261 			p->ainsn.boostable = -1;
262 	}
263 
264 	return ret;
265 }
266 NOKPROBE_SYMBOL(try_to_emulate);
267 
268 int kprobe_handler(struct pt_regs *regs)
269 {
270 	struct kprobe *p;
271 	int ret = 0;
272 	unsigned int *addr = (unsigned int *)regs->nip;
273 	struct kprobe_ctlblk *kcb;
274 
275 	if (user_mode(regs))
276 		return 0;
277 
278 	if (!(regs->msr & MSR_IR) || !(regs->msr & MSR_DR))
279 		return 0;
280 
281 	/*
282 	 * We don't want to be preempted for the entire
283 	 * duration of kprobe processing
284 	 */
285 	preempt_disable();
286 	kcb = get_kprobe_ctlblk();
287 
288 	p = get_kprobe(addr);
289 	if (!p) {
290 		unsigned int instr;
291 
292 		if (probe_kernel_address(addr, instr))
293 			goto no_kprobe;
294 
295 		if (instr != BREAKPOINT_INSTRUCTION) {
296 			/*
297 			 * PowerPC has multiple variants of the "trap"
298 			 * instruction. If the current instruction is a
299 			 * trap variant, it could belong to someone else
300 			 */
301 			if (is_trap(instr))
302 				goto no_kprobe;
303 			/*
304 			 * The breakpoint instruction was removed right
305 			 * after we hit it.  Another cpu has removed
306 			 * either a probepoint or a debugger breakpoint
307 			 * at this address.  In either case, no further
308 			 * handling of this interrupt is appropriate.
309 			 */
310 			ret = 1;
311 		}
312 		/* Not one of ours: let kernel handle it */
313 		goto no_kprobe;
314 	}
315 
316 	/* Check we're not actually recursing */
317 	if (kprobe_running()) {
318 		kprobe_opcode_t insn = *p->ainsn.insn;
319 		if (kcb->kprobe_status == KPROBE_HIT_SS && is_trap(insn)) {
320 			/* Turn off 'trace' bits */
321 			regs->msr &= ~MSR_SINGLESTEP;
322 			regs->msr |= kcb->kprobe_saved_msr;
323 			goto no_kprobe;
324 		}
325 
326 		/*
327 		 * We have reentered the kprobe_handler(), since another probe
328 		 * was hit while within the handler. We here save the original
329 		 * kprobes variables and just single step on the instruction of
330 		 * the new probe without calling any user handlers.
331 		 */
332 		save_previous_kprobe(kcb);
333 		set_current_kprobe(p, regs, kcb);
334 		kprobes_inc_nmissed_count(p);
335 		kcb->kprobe_status = KPROBE_REENTER;
336 		if (p->ainsn.boostable >= 0) {
337 			ret = try_to_emulate(p, regs);
338 
339 			if (ret > 0) {
340 				restore_previous_kprobe(kcb);
341 				preempt_enable_no_resched();
342 				return 1;
343 			}
344 		}
345 		prepare_singlestep(p, regs);
346 		return 1;
347 	}
348 
349 	kcb->kprobe_status = KPROBE_HIT_ACTIVE;
350 	set_current_kprobe(p, regs, kcb);
351 	if (p->pre_handler && p->pre_handler(p, regs)) {
352 		/* handler changed execution path, so skip ss setup */
353 		reset_current_kprobe();
354 		preempt_enable_no_resched();
355 		return 1;
356 	}
357 
358 	if (p->ainsn.boostable >= 0) {
359 		ret = try_to_emulate(p, regs);
360 
361 		if (ret > 0) {
362 			if (p->post_handler)
363 				p->post_handler(p, regs, 0);
364 
365 			kcb->kprobe_status = KPROBE_HIT_SSDONE;
366 			reset_current_kprobe();
367 			preempt_enable_no_resched();
368 			return 1;
369 		}
370 	}
371 	prepare_singlestep(p, regs);
372 	kcb->kprobe_status = KPROBE_HIT_SS;
373 	return 1;
374 
375 no_kprobe:
376 	preempt_enable_no_resched();
377 	return ret;
378 }
379 NOKPROBE_SYMBOL(kprobe_handler);
380 
381 /*
382  * Function return probe trampoline:
383  * 	- init_kprobes() establishes a probepoint here
384  * 	- When the probed function returns, this probe
385  * 		causes the handlers to fire
386  */
387 asm(".global kretprobe_trampoline\n"
388 	".type kretprobe_trampoline, @function\n"
389 	"kretprobe_trampoline:\n"
390 	"nop\n"
391 	"blr\n"
392 	".size kretprobe_trampoline, .-kretprobe_trampoline\n");
393 
394 /*
395  * Called when the probe at kretprobe trampoline is hit
396  */
397 static int trampoline_probe_handler(struct kprobe *p, struct pt_regs *regs)
398 {
399 	struct kretprobe_instance *ri = NULL;
400 	struct hlist_head *head, empty_rp;
401 	struct hlist_node *tmp;
402 	unsigned long flags, orig_ret_address = 0;
403 	unsigned long trampoline_address =(unsigned long)&kretprobe_trampoline;
404 
405 	INIT_HLIST_HEAD(&empty_rp);
406 	kretprobe_hash_lock(current, &head, &flags);
407 
408 	/*
409 	 * It is possible to have multiple instances associated with a given
410 	 * task either because an multiple functions in the call path
411 	 * have a return probe installed on them, and/or more than one return
412 	 * return probe was registered for a target function.
413 	 *
414 	 * We can handle this because:
415 	 *     - instances are always inserted at the head of the list
416 	 *     - when multiple return probes are registered for the same
417 	 *       function, the first instance's ret_addr will point to the
418 	 *       real return address, and all the rest will point to
419 	 *       kretprobe_trampoline
420 	 */
421 	hlist_for_each_entry_safe(ri, tmp, head, hlist) {
422 		if (ri->task != current)
423 			/* another task is sharing our hash bucket */
424 			continue;
425 
426 		if (ri->rp && ri->rp->handler)
427 			ri->rp->handler(ri, regs);
428 
429 		orig_ret_address = (unsigned long)ri->ret_addr;
430 		recycle_rp_inst(ri, &empty_rp);
431 
432 		if (orig_ret_address != trampoline_address)
433 			/*
434 			 * This is the real return address. Any other
435 			 * instances associated with this task are for
436 			 * other calls deeper on the call stack
437 			 */
438 			break;
439 	}
440 
441 	kretprobe_assert(ri, orig_ret_address, trampoline_address);
442 
443 	/*
444 	 * We get here through one of two paths:
445 	 * 1. by taking a trap -> kprobe_handler() -> here
446 	 * 2. by optprobe branch -> optimized_callback() -> opt_pre_handler() -> here
447 	 *
448 	 * When going back through (1), we need regs->nip to be setup properly
449 	 * as it is used to determine the return address from the trap.
450 	 * For (2), since nip is not honoured with optprobes, we instead setup
451 	 * the link register properly so that the subsequent 'blr' in
452 	 * kretprobe_trampoline jumps back to the right instruction.
453 	 *
454 	 * For nip, we should set the address to the previous instruction since
455 	 * we end up emulating it in kprobe_handler(), which increments the nip
456 	 * again.
457 	 */
458 	regs->nip = orig_ret_address - 4;
459 	regs->link = orig_ret_address;
460 
461 	kretprobe_hash_unlock(current, &flags);
462 
463 	hlist_for_each_entry_safe(ri, tmp, &empty_rp, hlist) {
464 		hlist_del(&ri->hlist);
465 		kfree(ri);
466 	}
467 
468 	return 0;
469 }
470 NOKPROBE_SYMBOL(trampoline_probe_handler);
471 
472 /*
473  * Called after single-stepping.  p->addr is the address of the
474  * instruction whose first byte has been replaced by the "breakpoint"
475  * instruction.  To avoid the SMP problems that can occur when we
476  * temporarily put back the original opcode to single-step, we
477  * single-stepped a copy of the instruction.  The address of this
478  * copy is p->ainsn.insn.
479  */
480 int kprobe_post_handler(struct pt_regs *regs)
481 {
482 	int len;
483 	struct kprobe *cur = kprobe_running();
484 	struct kprobe_ctlblk *kcb = get_kprobe_ctlblk();
485 
486 	if (!cur || user_mode(regs))
487 		return 0;
488 
489 	len = ppc_inst_len(ppc_inst_read((struct ppc_inst *)cur->ainsn.insn));
490 	/* make sure we got here for instruction we have a kprobe on */
491 	if (((unsigned long)cur->ainsn.insn + len) != regs->nip)
492 		return 0;
493 
494 	if ((kcb->kprobe_status != KPROBE_REENTER) && cur->post_handler) {
495 		kcb->kprobe_status = KPROBE_HIT_SSDONE;
496 		cur->post_handler(cur, regs, 0);
497 	}
498 
499 	/* Adjust nip to after the single-stepped instruction */
500 	regs->nip = (unsigned long)cur->addr + len;
501 	regs->msr |= kcb->kprobe_saved_msr;
502 
503 	/*Restore back the original saved kprobes variables and continue. */
504 	if (kcb->kprobe_status == KPROBE_REENTER) {
505 		restore_previous_kprobe(kcb);
506 		goto out;
507 	}
508 	reset_current_kprobe();
509 out:
510 	preempt_enable_no_resched();
511 
512 	/*
513 	 * if somebody else is singlestepping across a probe point, msr
514 	 * will have DE/SE set, in which case, continue the remaining processing
515 	 * of do_debug, as if this is not a probe hit.
516 	 */
517 	if (regs->msr & MSR_SINGLESTEP)
518 		return 0;
519 
520 	return 1;
521 }
522 NOKPROBE_SYMBOL(kprobe_post_handler);
523 
524 int kprobe_fault_handler(struct pt_regs *regs, int trapnr)
525 {
526 	struct kprobe *cur = kprobe_running();
527 	struct kprobe_ctlblk *kcb = get_kprobe_ctlblk();
528 	const struct exception_table_entry *entry;
529 
530 	switch(kcb->kprobe_status) {
531 	case KPROBE_HIT_SS:
532 	case KPROBE_REENTER:
533 		/*
534 		 * We are here because the instruction being single
535 		 * stepped caused a page fault. We reset the current
536 		 * kprobe and the nip points back to the probe address
537 		 * and allow the page fault handler to continue as a
538 		 * normal page fault.
539 		 */
540 		regs->nip = (unsigned long)cur->addr;
541 		regs->msr &= ~MSR_SINGLESTEP; /* Turn off 'trace' bits */
542 		regs->msr |= kcb->kprobe_saved_msr;
543 		if (kcb->kprobe_status == KPROBE_REENTER)
544 			restore_previous_kprobe(kcb);
545 		else
546 			reset_current_kprobe();
547 		preempt_enable_no_resched();
548 		break;
549 	case KPROBE_HIT_ACTIVE:
550 	case KPROBE_HIT_SSDONE:
551 		/*
552 		 * We increment the nmissed count for accounting,
553 		 * we can also use npre/npostfault count for accounting
554 		 * these specific fault cases.
555 		 */
556 		kprobes_inc_nmissed_count(cur);
557 
558 		/*
559 		 * We come here because instructions in the pre/post
560 		 * handler caused the page_fault, this could happen
561 		 * if handler tries to access user space by
562 		 * copy_from_user(), get_user() etc. Let the
563 		 * user-specified handler try to fix it first.
564 		 */
565 		if (cur->fault_handler && cur->fault_handler(cur, regs, trapnr))
566 			return 1;
567 
568 		/*
569 		 * In case the user-specified fault handler returned
570 		 * zero, try to fix up.
571 		 */
572 		if ((entry = search_exception_tables(regs->nip)) != NULL) {
573 			regs->nip = extable_fixup(entry);
574 			return 1;
575 		}
576 
577 		/*
578 		 * fixup_exception() could not handle it,
579 		 * Let do_page_fault() fix it.
580 		 */
581 		break;
582 	default:
583 		break;
584 	}
585 	return 0;
586 }
587 NOKPROBE_SYMBOL(kprobe_fault_handler);
588 
589 unsigned long arch_deref_entry_point(void *entry)
590 {
591 #ifdef PPC64_ELF_ABI_v1
592 	if (!kernel_text_address((unsigned long)entry))
593 		return ppc_global_function_entry(entry);
594 	else
595 #endif
596 		return (unsigned long)entry;
597 }
598 NOKPROBE_SYMBOL(arch_deref_entry_point);
599 
600 static struct kprobe trampoline_p = {
601 	.addr = (kprobe_opcode_t *) &kretprobe_trampoline,
602 	.pre_handler = trampoline_probe_handler
603 };
604 
605 int __init arch_init_kprobes(void)
606 {
607 	return register_kprobe(&trampoline_p);
608 }
609 
610 int arch_trampoline_kprobe(struct kprobe *p)
611 {
612 	if (p->addr == (kprobe_opcode_t *)&kretprobe_trampoline)
613 		return 1;
614 
615 	return 0;
616 }
617 NOKPROBE_SYMBOL(arch_trampoline_kprobe);
618