/*
 * Code for replacing ftrace calls with jumps.
 *
 * Copyright (C) 2007-2008 Steven Rostedt <srostedt@redhat.com>
 *
 * Thanks goes to Ingo Molnar, for suggesting the idea.
 * Mathieu Desnoyers, for suggesting postponing the modifications.
 * Arjan van de Ven, for keeping me straight, and explaining to me
 * the dangers of modifying code on the run.
 */

#include <linux/spinlock.h>
#include <linux/hardirq.h>
#include <linux/uaccess.h>
#include <linux/ftrace.h>
#include <linux/percpu.h>
#include <linux/sched.h>
#include <linux/init.h>
#include <linux/list.h>

#include <trace/syscall.h>

#include <asm/cacheflush.h>
#include <asm/ftrace.h>
#include <asm/nops.h>
#include <asm/nmi.h>


#ifdef CONFIG_DYNAMIC_FTRACE

int ftrace_arch_code_modify_prepare(void)
{
	set_kernel_text_rw();
	return 0;
}

int ftrace_arch_code_modify_post_process(void)
{
	set_kernel_text_ro();
	return 0;
}

union ftrace_code_union {
	char code[MCOUNT_INSN_SIZE];
	struct {
		char e8;
		int offset;
	} __attribute__((packed));
};

static int ftrace_calc_offset(long ip, long addr)
{
	return (int)(addr - ip);
}

static unsigned char *ftrace_call_replace(unsigned long ip, unsigned long addr)
{
	static union ftrace_code_union calc;

	calc.e8		= 0xe8;
	calc.offset	= ftrace_calc_offset(ip + MCOUNT_INSN_SIZE, addr);

	/*
	 * No locking needed, this must be called via kstop_machine
	 * which in essence is like running on a uniprocessor machine.
	 */
	return calc.code;
}
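
/*
 * Editor's illustration (not part of the original file): the replacement
 * built by ftrace_call_replace() above is the 5-byte near call
 * "e8 <rel32>", with rel32 taken relative to the end of the instruction.
 * With hypothetical addresses, patching a call site at
 * 0xffffffff81000000 to target a handler at 0xffffffff81000100 gives
 * rel32 = 0x100 - MCOUNT_INSN_SIZE = 0xfb (MCOUNT_INSN_SIZE is 5 on x86).
 */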

/*
 * Modifying code must take extra care. On an SMP machine, if
 * the code being modified is also being executed on another CPU
 * that CPU will have undefined results and possibly take a GPF.
 * We use kstop_machine to stop the other CPUs from executing code.
 * But this does not stop NMIs from happening. We still need
 * to protect against that. We separate out the modification of
 * the code to take care of this.
 *
 * Two buffers are added: an IP buffer and a "code" buffer.
 *
 * 1) Put the instruction pointer into the IP buffer
 *    and the new code into the "code" buffer.
 * 2) Wait for any running NMIs to finish and set a flag that says
 *    we are modifying code; this is done in an atomic operation.
 * 3) Write the code.
 * 4) Clear the flag.
 * 5) Wait for any running NMIs to finish.
 *
 * If an NMI is executed, the first thing it does is to call
 * "ftrace_nmi_enter". This will check if the flag is set to write
 * and if it is, it will write what is in the IP and "code" buffers.
 *
 * The trick is, it does not matter if everyone is writing the same
 * content to the code location. Also, if a CPU is executing code
 * it is OK to write to that code location if the contents being written
 * are the same as what exists.
 */

#define MOD_CODE_WRITE_FLAG (1 << 31)	/* set when NMI should do the write */
static atomic_t nmi_running = ATOMIC_INIT(0);
static int mod_code_status;		/* holds return value of text write */
static void *mod_code_ip;		/* holds the IP to write to */
static void *mod_code_newcode;		/* holds the text to write to the IP */

static unsigned nmi_wait_count;
static atomic_t nmi_update_count = ATOMIC_INIT(0);

int ftrace_arch_read_dyn_info(char *buf, int size)
{
	int r;

	r = snprintf(buf, size, "%u %u",
		     nmi_wait_count,
		     atomic_read(&nmi_update_count));
	return r;
}

static void clear_mod_flag(void)
{
	int old = atomic_read(&nmi_running);

	for (;;) {
		int new = old & ~MOD_CODE_WRITE_FLAG;

		if (old == new)
			break;

		old = atomic_cmpxchg(&nmi_running, old, new);
	}
}
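
/*
 * ftrace_mod_code() below performs the actual text write. It can be
 * reached both from do_ftrace_mod_code() and, while MOD_CODE_WRITE_FLAG
 * is set, from any CPU that takes an NMI, following the protocol
 * described in the comment above.
 */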

static void ftrace_mod_code(void)
{
	/*
	 * Yes, more than one CPU can be writing to mod_code_status
	 * (and the code itself).
	 * But if one were to fail, then they all should, and if one were
	 * to succeed, then they all should.
	 */
	mod_code_status = probe_kernel_write(mod_code_ip, mod_code_newcode,
					     MCOUNT_INSN_SIZE);

	/* if we fail, then kill any new writers */
	if (mod_code_status)
		clear_mod_flag();
}

void ftrace_nmi_enter(void)
{
	if (atomic_inc_return(&nmi_running) & MOD_CODE_WRITE_FLAG) {
		smp_rmb();
		ftrace_mod_code();
		atomic_inc(&nmi_update_count);
	}
	/* Must have previous changes seen before executions */
	smp_mb();
}

void ftrace_nmi_exit(void)
{
	/* Finish all executions before clearing nmi_running */
	smp_mb();
	atomic_dec(&nmi_running);
}

static void wait_for_nmi_and_set_mod_flag(void)
{
	if (!atomic_cmpxchg(&nmi_running, 0, MOD_CODE_WRITE_FLAG))
		return;

	do {
		cpu_relax();
	} while (atomic_cmpxchg(&nmi_running, 0, MOD_CODE_WRITE_FLAG));

	nmi_wait_count++;
}

static void wait_for_nmi(void)
{
	if (!atomic_read(&nmi_running))
		return;

	do {
		cpu_relax();
	} while (atomic_read(&nmi_running));

	nmi_wait_count++;
}

static int
do_ftrace_mod_code(unsigned long ip, void *new_code)
{
	mod_code_ip = (void *)ip;
	mod_code_newcode = new_code;

	/* The buffers need to be visible before we let NMIs write them */
	smp_mb();

	wait_for_nmi_and_set_mod_flag();

	/* Make sure all running NMIs have finished before we write the code */
	smp_mb();

	ftrace_mod_code();

	/* Make sure the write happens before clearing the bit */
	smp_mb();

	clear_mod_flag();
	wait_for_nmi();

	return mod_code_status;
}
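
/*
 * The 5-byte nop selected at boot by ftrace_dyn_arch_init(); this is
 * what a disabled mcount call site is patched to.
 */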

static unsigned char ftrace_nop[MCOUNT_INSN_SIZE];

static unsigned char *ftrace_nop_replace(void)
{
	return ftrace_nop;
}

static int
ftrace_modify_code(unsigned long ip, unsigned char *old_code,
		   unsigned char *new_code)
{
	unsigned char replaced[MCOUNT_INSN_SIZE];

	/*
	 * Note: Due to modules and __init, code can disappear and
	 * change; we need to protect against faulting as well as code
	 * changing. We do this by using the probe_kernel_* functions.
	 *
	 * No real locking needed, this code is run through
	 * kstop_machine, or before SMP starts.
	 */

	/* read the text we want to modify */
	if (probe_kernel_read(replaced, (void *)ip, MCOUNT_INSN_SIZE))
		return -EFAULT;

	/* Make sure it is what we expect it to be */
	if (memcmp(replaced, old_code, MCOUNT_INSN_SIZE) != 0)
		return -EINVAL;

	/* replace the text with the new text */
	if (do_ftrace_mod_code(ip, new_code))
		return -EPERM;

	sync_core();

	return 0;
}

int ftrace_make_nop(struct module *mod,
		    struct dyn_ftrace *rec, unsigned long addr)
{
	unsigned char *new, *old;
	unsigned long ip = rec->ip;

	old = ftrace_call_replace(ip, addr);
	new = ftrace_nop_replace();

	return ftrace_modify_code(rec->ip, old, new);
}

int ftrace_make_call(struct dyn_ftrace *rec, unsigned long addr)
{
	unsigned char *new, *old;
	unsigned long ip = rec->ip;

	old = ftrace_nop_replace();
	new = ftrace_call_replace(ip, addr);

	return ftrace_modify_code(rec->ip, old, new);
}

int ftrace_update_ftrace_func(ftrace_func_t func)
{
	unsigned long ip = (unsigned long)(&ftrace_call);
	unsigned char old[MCOUNT_INSN_SIZE], *new;
	int ret;

	memcpy(old, &ftrace_call, MCOUNT_INSN_SIZE);
	new = ftrace_call_replace(ip, (unsigned long)func);
	ret = ftrace_modify_code(ip, old, new);

	return ret;
}
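
/*
 * Boot-time setup: probe which 5-byte nop this CPU can execute without
 * faulting and record it in ftrace_nop for later use by
 * ftrace_nop_replace().
 */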

int __init ftrace_dyn_arch_init(void *data)
{
	extern const unsigned char ftrace_test_p6nop[];
	extern const unsigned char ftrace_test_nop5[];
	extern const unsigned char ftrace_test_jmp[];
	int faulted = 0;

	/*
	 * There is no good nop for all x86 archs.
	 * We will default to using the P6_NOP5, but first we
	 * will test to make sure that the nop will actually
	 * work on this CPU. If it faults, we will then
	 * fall back to a less efficient 5-byte nop. If that fails
	 * we then just use a jmp as our nop. This isn't the most
	 * efficient nop, but we cannot use a multi-part nop,
	 * since we would then risk being preempted in the middle
	 * of that nop, and if we then enabled tracing, it might
	 * cause a system crash.
	 *
	 * TODO: check the cpuid to determine the best nop.
	 */
	asm volatile (
		"ftrace_test_jmp:"
		"jmp ftrace_test_p6nop\n"
		"nop\n"
		"nop\n"
		"nop\n"  /* 2 byte jmp + 3 bytes */
		"ftrace_test_p6nop:"
		P6_NOP5
		"jmp 1f\n"
		"ftrace_test_nop5:"
		".byte 0x66,0x66,0x66,0x66,0x90\n"
		"1:"
		".section .fixup, \"ax\"\n"
		"2:	movl $1, %0\n"
		"	jmp ftrace_test_nop5\n"
		"3:	movl $2, %0\n"
		"	jmp 1b\n"
		".previous\n"
		_ASM_EXTABLE(ftrace_test_p6nop, 2b)
		_ASM_EXTABLE(ftrace_test_nop5, 3b)
		: "=r"(faulted) : "0" (faulted));

	switch (faulted) {
	case 0:
		pr_info("ftrace: converting mcount calls to 0f 1f 44 00 00\n");
		memcpy(ftrace_nop, ftrace_test_p6nop, MCOUNT_INSN_SIZE);
		break;
	case 1:
		pr_info("ftrace: converting mcount calls to 66 66 66 66 90\n");
		memcpy(ftrace_nop, ftrace_test_nop5, MCOUNT_INSN_SIZE);
		break;
	case 2:
		pr_info("ftrace: converting mcount calls to jmp . + 5\n");
		memcpy(ftrace_nop, ftrace_test_jmp, MCOUNT_INSN_SIZE);
		break;
	}

	/* The return code is returned via data */
	*(unsigned long *)data = 0;

	return 0;
}
#endif /* CONFIG_DYNAMIC_FTRACE */
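
/*
 * Function graph tracing hooks the return path as well: the
 * ftrace_graph_call site is toggled between ftrace_stub and
 * ftrace_graph_caller below, and prepare_ftrace_return() diverts
 * return addresses through return_to_handler.
 */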

#ifdef CONFIG_FUNCTION_GRAPH_TRACER

#ifdef CONFIG_DYNAMIC_FTRACE
extern void ftrace_graph_call(void);

static int ftrace_mod_jmp(unsigned long ip,
			  int old_offset, int new_offset)
{
	unsigned char code[MCOUNT_INSN_SIZE];

	if (probe_kernel_read(code, (void *)ip, MCOUNT_INSN_SIZE))
		return -EFAULT;

	if (code[0] != 0xe9 || old_offset != *(int *)(&code[1]))
		return -EINVAL;

	*(int *)(&code[1]) = new_offset;

	if (do_ftrace_mod_code(ip, &code))
		return -EPERM;

	return 0;
}

int ftrace_enable_ftrace_graph_caller(void)
{
	unsigned long ip = (unsigned long)(&ftrace_graph_call);
	int old_offset, new_offset;

	old_offset = (unsigned long)(&ftrace_stub) - (ip + MCOUNT_INSN_SIZE);
	new_offset = (unsigned long)(&ftrace_graph_caller) - (ip + MCOUNT_INSN_SIZE);

	return ftrace_mod_jmp(ip, old_offset, new_offset);
}

int ftrace_disable_ftrace_graph_caller(void)
{
	unsigned long ip = (unsigned long)(&ftrace_graph_call);
	int old_offset, new_offset;

	old_offset = (unsigned long)(&ftrace_graph_caller) - (ip + MCOUNT_INSN_SIZE);
	new_offset = (unsigned long)(&ftrace_stub) - (ip + MCOUNT_INSN_SIZE);

	return ftrace_mod_jmp(ip, old_offset, new_offset);
}

#endif /* CONFIG_DYNAMIC_FTRACE */
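
/*
 * prepare_ftrace_return() below receives, in @parent, the address of
 * the slot holding the traced function's return address, and in
 * @self_addr the traced function's own address. It swaps the return
 * address for return_to_handler so the function's exit can be traced.
 */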

/*
 * Hook the return address and push it in the stack of return addrs
 * in current thread info.
 */
void prepare_ftrace_return(unsigned long *parent, unsigned long self_addr)
{
	unsigned long old;
	int faulted;
	struct ftrace_graph_ent trace;
	unsigned long return_hooker = (unsigned long)
				&return_to_handler;

	/* NMIs are currently unsupported */
	if (unlikely(in_nmi()))
		return;

	if (unlikely(atomic_read(&current->tracing_graph_pause)))
		return;

	/*
	 * Protect against a fault, even if it shouldn't
	 * happen. This tool is too intrusive to
	 * ignore such a protection.
	 */
	asm volatile(
		"1: " _ASM_MOV " (%[parent]), %[old]\n"
		"2: " _ASM_MOV " %[return_hooker], (%[parent])\n"
		"   movl $0, %[faulted]\n"
		"3:\n"

		".section .fixup, \"ax\"\n"
		"4: movl $1, %[faulted]\n"
		"   jmp 3b\n"
		".previous\n"

		_ASM_EXTABLE(1b, 4b)
		_ASM_EXTABLE(2b, 4b)

		: [old] "=&r" (old), [faulted] "=r" (faulted)
		: [parent] "r" (parent), [return_hooker] "r" (return_hooker)
		: "memory"
	);

	if (unlikely(faulted)) {
		ftrace_graph_stop();
		WARN_ON(1);
		return;
	}

	if (ftrace_push_return_trace(old, self_addr, &trace.depth) == -EBUSY) {
		*parent = old;
		return;
	}

	trace.func = self_addr;

	/* Only trace if the calling function expects to */
	if (!ftrace_graph_entry(&trace)) {
		current->curr_ret_stack--;
		*parent = old;
	}
}
#endif /* CONFIG_FUNCTION_GRAPH_TRACER */
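
/*
 * Syscall tracing support: build a table mapping syscall numbers to
 * their syscall_metadata entries by matching sys_call_table entries
 * against the metadata section emitted at build time.
 */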

#ifdef CONFIG_FTRACE_SYSCALLS

extern unsigned long __start_syscalls_metadata[];
extern unsigned long __stop_syscalls_metadata[];
extern unsigned long *sys_call_table;

static struct syscall_metadata **syscalls_metadata;

static struct syscall_metadata *find_syscall_meta(unsigned long *syscall)
{
	struct syscall_metadata *start;
	struct syscall_metadata *stop;
	char str[KSYM_SYMBOL_LEN];

	start = (struct syscall_metadata *)__start_syscalls_metadata;
	stop = (struct syscall_metadata *)__stop_syscalls_metadata;
	kallsyms_lookup((unsigned long) syscall, NULL, NULL, NULL, str);

	for ( ; start < stop; start++) {
		if (start->name && !strcmp(start->name, str))
			return start;
	}
	return NULL;
}

struct syscall_metadata *syscall_nr_to_meta(int nr)
{
	if (!syscalls_metadata || nr >= FTRACE_SYSCALL_MAX || nr < 0)
		return NULL;

	return syscalls_metadata[nr];
}

void arch_init_ftrace_syscalls(void)
{
	int i;
	struct syscall_metadata *meta;
	unsigned long **psys_syscall_table = &sys_call_table;
	static atomic_t refs;

	if (atomic_inc_return(&refs) != 1)
		goto end;

	syscalls_metadata = kzalloc(sizeof(*syscalls_metadata) *
					FTRACE_SYSCALL_MAX, GFP_KERNEL);
	if (!syscalls_metadata) {
		WARN_ON(1);
		return;
	}

	for (i = 0; i < FTRACE_SYSCALL_MAX; i++) {
		meta = find_syscall_meta(psys_syscall_table[i]);
		syscalls_metadata[i] = meta;
	}
	return;

	/* Paranoid: avoid overflow */
end:
	atomic_dec(&refs);
}
#endif