13d083395SSteven Rostedt /* 23d083395SSteven Rostedt * Code for replacing ftrace calls with jumps. 33d083395SSteven Rostedt * 43d083395SSteven Rostedt * Copyright (C) 2007-2008 Steven Rostedt <srostedt@redhat.com> 53d083395SSteven Rostedt * 63d083395SSteven Rostedt * Thanks goes to Ingo Molnar, for suggesting the idea. 73d083395SSteven Rostedt * Mathieu Desnoyers, for suggesting postponing the modifications. 83d083395SSteven Rostedt * Arjan van de Ven, for keeping me straight, and explaining to me 93d083395SSteven Rostedt * the dangers of modifying code on the run. 103d083395SSteven Rostedt */ 113d083395SSteven Rostedt 123d083395SSteven Rostedt #include <linux/spinlock.h> 133d083395SSteven Rostedt #include <linux/hardirq.h> 146f93fc07SSteven Rostedt #include <linux/uaccess.h> 153d083395SSteven Rostedt #include <linux/ftrace.h> 163d083395SSteven Rostedt #include <linux/percpu.h> 1719b3e967SIngo Molnar #include <linux/sched.h> 183d083395SSteven Rostedt #include <linux/init.h> 193d083395SSteven Rostedt #include <linux/list.h> 203d083395SSteven Rostedt 2147788c58SFrederic Weisbecker #include <trace/syscall.h> 2247788c58SFrederic Weisbecker 2316239630SSteven Rostedt #include <asm/cacheflush.h> 24395a59d0SAbhishek Sagar #include <asm/ftrace.h> 25732f3ca7SSteven Rostedt #include <asm/nops.h> 26caf4b323SFrederic Weisbecker #include <asm/nmi.h> 27dfa60abaSSteven Rostedt 283d083395SSteven Rostedt 29caf4b323SFrederic Weisbecker #ifdef CONFIG_DYNAMIC_FTRACE 303d083395SSteven Rostedt 3116239630SSteven Rostedt int ftrace_arch_code_modify_prepare(void) 3216239630SSteven Rostedt { 3316239630SSteven Rostedt set_kernel_text_rw(); 3416239630SSteven Rostedt return 0; 3516239630SSteven Rostedt } 3616239630SSteven Rostedt 3716239630SSteven Rostedt int ftrace_arch_code_modify_post_process(void) 3816239630SSteven Rostedt { 3916239630SSteven Rostedt set_kernel_text_ro(); 4016239630SSteven Rostedt return 0; 4116239630SSteven Rostedt } 4216239630SSteven Rostedt 433d083395SSteven Rostedt union ftrace_code_union { 44395a59d0SAbhishek Sagar char code[MCOUNT_INSN_SIZE]; 453d083395SSteven Rostedt struct { 463d083395SSteven Rostedt char e8; 473d083395SSteven Rostedt int offset; 483d083395SSteven Rostedt } __attribute__((packed)); 493d083395SSteven Rostedt }; 503d083395SSteven Rostedt 5115adc048SSteven Rostedt static int ftrace_calc_offset(long ip, long addr) 523c1720f0SSteven Rostedt { 533c1720f0SSteven Rostedt return (int)(addr - ip); 543d083395SSteven Rostedt } 553d083395SSteven Rostedt 5631e88909SSteven Rostedt static unsigned char *ftrace_call_replace(unsigned long ip, unsigned long addr) 573c1720f0SSteven Rostedt { 583c1720f0SSteven Rostedt static union ftrace_code_union calc; 593c1720f0SSteven Rostedt 603c1720f0SSteven Rostedt calc.e8 = 0xe8; 61395a59d0SAbhishek Sagar calc.offset = ftrace_calc_offset(ip + MCOUNT_INSN_SIZE, addr); 623c1720f0SSteven Rostedt 633c1720f0SSteven Rostedt /* 643c1720f0SSteven Rostedt * No locking needed, this must be called via kstop_machine 653c1720f0SSteven Rostedt * which in essence is like running on a uniprocessor machine. 663c1720f0SSteven Rostedt */ 673c1720f0SSteven Rostedt return calc.code; 683c1720f0SSteven Rostedt } 693c1720f0SSteven Rostedt 7017666f02SSteven Rostedt /* 7117666f02SSteven Rostedt * Modifying code must take extra care. On an SMP machine, if 7217666f02SSteven Rostedt * the code being modified is also being executed on another CPU 7317666f02SSteven Rostedt * that CPU will have undefined results and possibly take a GPF. 7417666f02SSteven Rostedt * We use kstop_machine to stop other CPUS from exectuing code. 7517666f02SSteven Rostedt * But this does not stop NMIs from happening. We still need 7617666f02SSteven Rostedt * to protect against that. We separate out the modification of 7717666f02SSteven Rostedt * the code to take care of this. 7817666f02SSteven Rostedt * 7917666f02SSteven Rostedt * Two buffers are added: An IP buffer and a "code" buffer. 8017666f02SSteven Rostedt * 81a26a2a27SSteven Rostedt * 1) Put the instruction pointer into the IP buffer 8217666f02SSteven Rostedt * and the new code into the "code" buffer. 83e9d9df44SLai Jiangshan * 2) Wait for any running NMIs to finish and set a flag that says 84e9d9df44SLai Jiangshan * we are modifying code, it is done in an atomic operation. 85e9d9df44SLai Jiangshan * 3) Write the code 86e9d9df44SLai Jiangshan * 4) clear the flag. 87e9d9df44SLai Jiangshan * 5) Wait for any running NMIs to finish. 8817666f02SSteven Rostedt * 8917666f02SSteven Rostedt * If an NMI is executed, the first thing it does is to call 9017666f02SSteven Rostedt * "ftrace_nmi_enter". This will check if the flag is set to write 9117666f02SSteven Rostedt * and if it is, it will write what is in the IP and "code" buffers. 9217666f02SSteven Rostedt * 9317666f02SSteven Rostedt * The trick is, it does not matter if everyone is writing the same 9417666f02SSteven Rostedt * content to the code location. Also, if a CPU is executing code 9517666f02SSteven Rostedt * it is OK to write to that code location if the contents being written 9617666f02SSteven Rostedt * are the same as what exists. 9717666f02SSteven Rostedt */ 9817666f02SSteven Rostedt 99e9d9df44SLai Jiangshan #define MOD_CODE_WRITE_FLAG (1 << 31) /* set when NMI should do the write */ 1004e6ea144SSteven Rostedt static atomic_t nmi_running = ATOMIC_INIT(0); 101a26a2a27SSteven Rostedt static int mod_code_status; /* holds return value of text write */ 102a26a2a27SSteven Rostedt static void *mod_code_ip; /* holds the IP to write to */ 103a26a2a27SSteven Rostedt static void *mod_code_newcode; /* holds the text to write to the IP */ 10417666f02SSteven Rostedt 105a26a2a27SSteven Rostedt static unsigned nmi_wait_count; 106a26a2a27SSteven Rostedt static atomic_t nmi_update_count = ATOMIC_INIT(0); 107b807c3d0SSteven Rostedt 108b807c3d0SSteven Rostedt int ftrace_arch_read_dyn_info(char *buf, int size) 109b807c3d0SSteven Rostedt { 110b807c3d0SSteven Rostedt int r; 111b807c3d0SSteven Rostedt 112b807c3d0SSteven Rostedt r = snprintf(buf, size, "%u %u", 113b807c3d0SSteven Rostedt nmi_wait_count, 114b807c3d0SSteven Rostedt atomic_read(&nmi_update_count)); 115b807c3d0SSteven Rostedt return r; 116b807c3d0SSteven Rostedt } 117b807c3d0SSteven Rostedt 118e9d9df44SLai Jiangshan static void clear_mod_flag(void) 119e9d9df44SLai Jiangshan { 120e9d9df44SLai Jiangshan int old = atomic_read(&nmi_running); 121e9d9df44SLai Jiangshan 122e9d9df44SLai Jiangshan for (;;) { 123e9d9df44SLai Jiangshan int new = old & ~MOD_CODE_WRITE_FLAG; 124e9d9df44SLai Jiangshan 125e9d9df44SLai Jiangshan if (old == new) 126e9d9df44SLai Jiangshan break; 127e9d9df44SLai Jiangshan 128e9d9df44SLai Jiangshan old = atomic_cmpxchg(&nmi_running, old, new); 129e9d9df44SLai Jiangshan } 130e9d9df44SLai Jiangshan } 131e9d9df44SLai Jiangshan 13217666f02SSteven Rostedt static void ftrace_mod_code(void) 13317666f02SSteven Rostedt { 13417666f02SSteven Rostedt /* 13517666f02SSteven Rostedt * Yes, more than one CPU process can be writing to mod_code_status. 13617666f02SSteven Rostedt * (and the code itself) 13717666f02SSteven Rostedt * But if one were to fail, then they all should, and if one were 13817666f02SSteven Rostedt * to succeed, then they all should. 13917666f02SSteven Rostedt */ 14017666f02SSteven Rostedt mod_code_status = probe_kernel_write(mod_code_ip, mod_code_newcode, 14117666f02SSteven Rostedt MCOUNT_INSN_SIZE); 14290c7ac49SSteven Rostedt 14390c7ac49SSteven Rostedt /* if we fail, then kill any new writers */ 14490c7ac49SSteven Rostedt if (mod_code_status) 145e9d9df44SLai Jiangshan clear_mod_flag(); 14617666f02SSteven Rostedt } 14717666f02SSteven Rostedt 148a81bd80aSSteven Rostedt void ftrace_nmi_enter(void) 14917666f02SSteven Rostedt { 150e9d9df44SLai Jiangshan if (atomic_inc_return(&nmi_running) & MOD_CODE_WRITE_FLAG) { 151e9d9df44SLai Jiangshan smp_rmb(); 15217666f02SSteven Rostedt ftrace_mod_code(); 153b807c3d0SSteven Rostedt atomic_inc(&nmi_update_count); 154b807c3d0SSteven Rostedt } 155e9d9df44SLai Jiangshan /* Must have previous changes seen before executions */ 156e9d9df44SLai Jiangshan smp_mb(); 15717666f02SSteven Rostedt } 15817666f02SSteven Rostedt 159a81bd80aSSteven Rostedt void ftrace_nmi_exit(void) 16017666f02SSteven Rostedt { 1614e6ea144SSteven Rostedt /* Finish all executions before clearing nmi_running */ 162e9d9df44SLai Jiangshan smp_mb(); 1634e6ea144SSteven Rostedt atomic_dec(&nmi_running); 16417666f02SSteven Rostedt } 16517666f02SSteven Rostedt 166e9d9df44SLai Jiangshan static void wait_for_nmi_and_set_mod_flag(void) 167e9d9df44SLai Jiangshan { 168e9d9df44SLai Jiangshan if (!atomic_cmpxchg(&nmi_running, 0, MOD_CODE_WRITE_FLAG)) 169e9d9df44SLai Jiangshan return; 170e9d9df44SLai Jiangshan 171e9d9df44SLai Jiangshan do { 172e9d9df44SLai Jiangshan cpu_relax(); 173e9d9df44SLai Jiangshan } while (atomic_cmpxchg(&nmi_running, 0, MOD_CODE_WRITE_FLAG)); 174e9d9df44SLai Jiangshan 175e9d9df44SLai Jiangshan nmi_wait_count++; 176e9d9df44SLai Jiangshan } 177e9d9df44SLai Jiangshan 17817666f02SSteven Rostedt static void wait_for_nmi(void) 17917666f02SSteven Rostedt { 1804e6ea144SSteven Rostedt if (!atomic_read(&nmi_running)) 18189025282SCyrill Gorcunov return; 182b807c3d0SSteven Rostedt 18389025282SCyrill Gorcunov do { 18417666f02SSteven Rostedt cpu_relax(); 1854e6ea144SSteven Rostedt } while (atomic_read(&nmi_running)); 18617666f02SSteven Rostedt 187b807c3d0SSteven Rostedt nmi_wait_count++; 188b807c3d0SSteven Rostedt } 189b807c3d0SSteven Rostedt 190*55ca3cc1SSuresh Siddha static inline int 191*55ca3cc1SSuresh Siddha within(unsigned long addr, unsigned long start, unsigned long end) 192*55ca3cc1SSuresh Siddha { 193*55ca3cc1SSuresh Siddha return addr >= start && addr < end; 194*55ca3cc1SSuresh Siddha } 195*55ca3cc1SSuresh Siddha 19617666f02SSteven Rostedt static int 19717666f02SSteven Rostedt do_ftrace_mod_code(unsigned long ip, void *new_code) 19817666f02SSteven Rostedt { 199*55ca3cc1SSuresh Siddha /* 200*55ca3cc1SSuresh Siddha * On x86_64, kernel text mappings are mapped read-only with 201*55ca3cc1SSuresh Siddha * CONFIG_DEBUG_RODATA. So we use the kernel identity mapping instead 202*55ca3cc1SSuresh Siddha * of the kernel text mapping to modify the kernel text. 203*55ca3cc1SSuresh Siddha * 204*55ca3cc1SSuresh Siddha * For 32bit kernels, these mappings are same and we can use 205*55ca3cc1SSuresh Siddha * kernel identity mapping to modify code. 206*55ca3cc1SSuresh Siddha */ 207*55ca3cc1SSuresh Siddha if (within(ip, (unsigned long)_text, (unsigned long)_etext)) 208*55ca3cc1SSuresh Siddha ip = (unsigned long)__va(__pa(ip)); 209*55ca3cc1SSuresh Siddha 21017666f02SSteven Rostedt mod_code_ip = (void *)ip; 21117666f02SSteven Rostedt mod_code_newcode = new_code; 21217666f02SSteven Rostedt 21317666f02SSteven Rostedt /* The buffers need to be visible before we let NMIs write them */ 21417666f02SSteven Rostedt smp_mb(); 21517666f02SSteven Rostedt 216e9d9df44SLai Jiangshan wait_for_nmi_and_set_mod_flag(); 21717666f02SSteven Rostedt 21817666f02SSteven Rostedt /* Make sure all running NMIs have finished before we write the code */ 21917666f02SSteven Rostedt smp_mb(); 22017666f02SSteven Rostedt 22117666f02SSteven Rostedt ftrace_mod_code(); 22217666f02SSteven Rostedt 22317666f02SSteven Rostedt /* Make sure the write happens before clearing the bit */ 22417666f02SSteven Rostedt smp_mb(); 22517666f02SSteven Rostedt 226e9d9df44SLai Jiangshan clear_mod_flag(); 22717666f02SSteven Rostedt wait_for_nmi(); 22817666f02SSteven Rostedt 22917666f02SSteven Rostedt return mod_code_status; 23017666f02SSteven Rostedt } 23117666f02SSteven Rostedt 23217666f02SSteven Rostedt 233caf4b323SFrederic Weisbecker 234caf4b323SFrederic Weisbecker 235caf4b323SFrederic Weisbecker static unsigned char ftrace_nop[MCOUNT_INSN_SIZE]; 236caf4b323SFrederic Weisbecker 23731e88909SSteven Rostedt static unsigned char *ftrace_nop_replace(void) 238caf4b323SFrederic Weisbecker { 239caf4b323SFrederic Weisbecker return ftrace_nop; 240caf4b323SFrederic Weisbecker } 241caf4b323SFrederic Weisbecker 24231e88909SSteven Rostedt static int 2433d083395SSteven Rostedt ftrace_modify_code(unsigned long ip, unsigned char *old_code, 2443d083395SSteven Rostedt unsigned char *new_code) 2453d083395SSteven Rostedt { 2466f93fc07SSteven Rostedt unsigned char replaced[MCOUNT_INSN_SIZE]; 2473d083395SSteven Rostedt 2483d083395SSteven Rostedt /* 2493d083395SSteven Rostedt * Note: Due to modules and __init, code can 2503d083395SSteven Rostedt * disappear and change, we need to protect against faulting 25176aefee5SSteven Rostedt * as well as code changing. We do this by using the 252ab9a0918SSteven Rostedt * probe_kernel_* functions. 2533d083395SSteven Rostedt * 2543d083395SSteven Rostedt * No real locking needed, this code is run through 2556f93fc07SSteven Rostedt * kstop_machine, or before SMP starts. 2563d083395SSteven Rostedt */ 25776aefee5SSteven Rostedt 25876aefee5SSteven Rostedt /* read the text we want to modify */ 259ab9a0918SSteven Rostedt if (probe_kernel_read(replaced, (void *)ip, MCOUNT_INSN_SIZE)) 260593eb8a2SSteven Rostedt return -EFAULT; 2616f93fc07SSteven Rostedt 26276aefee5SSteven Rostedt /* Make sure it is what we expect it to be */ 2636f93fc07SSteven Rostedt if (memcmp(replaced, old_code, MCOUNT_INSN_SIZE) != 0) 264593eb8a2SSteven Rostedt return -EINVAL; 2656f93fc07SSteven Rostedt 26676aefee5SSteven Rostedt /* replace the text with the new text */ 26717666f02SSteven Rostedt if (do_ftrace_mod_code(ip, new_code)) 268593eb8a2SSteven Rostedt return -EPERM; 2696f93fc07SSteven Rostedt 2703d083395SSteven Rostedt sync_core(); 2713d083395SSteven Rostedt 2726f93fc07SSteven Rostedt return 0; 2733d083395SSteven Rostedt } 2743d083395SSteven Rostedt 27531e88909SSteven Rostedt int ftrace_make_nop(struct module *mod, 27631e88909SSteven Rostedt struct dyn_ftrace *rec, unsigned long addr) 27731e88909SSteven Rostedt { 27831e88909SSteven Rostedt unsigned char *new, *old; 27931e88909SSteven Rostedt unsigned long ip = rec->ip; 28031e88909SSteven Rostedt 28131e88909SSteven Rostedt old = ftrace_call_replace(ip, addr); 28231e88909SSteven Rostedt new = ftrace_nop_replace(); 28331e88909SSteven Rostedt 28431e88909SSteven Rostedt return ftrace_modify_code(rec->ip, old, new); 28531e88909SSteven Rostedt } 28631e88909SSteven Rostedt 28731e88909SSteven Rostedt int ftrace_make_call(struct dyn_ftrace *rec, unsigned long addr) 28831e88909SSteven Rostedt { 28931e88909SSteven Rostedt unsigned char *new, *old; 29031e88909SSteven Rostedt unsigned long ip = rec->ip; 29131e88909SSteven Rostedt 29231e88909SSteven Rostedt old = ftrace_nop_replace(); 29331e88909SSteven Rostedt new = ftrace_call_replace(ip, addr); 29431e88909SSteven Rostedt 29531e88909SSteven Rostedt return ftrace_modify_code(rec->ip, old, new); 29631e88909SSteven Rostedt } 29731e88909SSteven Rostedt 29815adc048SSteven Rostedt int ftrace_update_ftrace_func(ftrace_func_t func) 299d61f82d0SSteven Rostedt { 300d61f82d0SSteven Rostedt unsigned long ip = (unsigned long)(&ftrace_call); 301395a59d0SAbhishek Sagar unsigned char old[MCOUNT_INSN_SIZE], *new; 302d61f82d0SSteven Rostedt int ret; 303d61f82d0SSteven Rostedt 304395a59d0SAbhishek Sagar memcpy(old, &ftrace_call, MCOUNT_INSN_SIZE); 305d61f82d0SSteven Rostedt new = ftrace_call_replace(ip, (unsigned long)func); 306d61f82d0SSteven Rostedt ret = ftrace_modify_code(ip, old, new); 307d61f82d0SSteven Rostedt 308d61f82d0SSteven Rostedt return ret; 309d61f82d0SSteven Rostedt } 310d61f82d0SSteven Rostedt 311d61f82d0SSteven Rostedt int __init ftrace_dyn_arch_init(void *data) 3123d083395SSteven Rostedt { 313732f3ca7SSteven Rostedt extern const unsigned char ftrace_test_p6nop[]; 314732f3ca7SSteven Rostedt extern const unsigned char ftrace_test_nop5[]; 315732f3ca7SSteven Rostedt extern const unsigned char ftrace_test_jmp[]; 316732f3ca7SSteven Rostedt int faulted = 0; 3173d083395SSteven Rostedt 318732f3ca7SSteven Rostedt /* 319732f3ca7SSteven Rostedt * There is no good nop for all x86 archs. 320732f3ca7SSteven Rostedt * We will default to using the P6_NOP5, but first we 321732f3ca7SSteven Rostedt * will test to make sure that the nop will actually 322732f3ca7SSteven Rostedt * work on this CPU. If it faults, we will then 323732f3ca7SSteven Rostedt * go to a lesser efficient 5 byte nop. If that fails 324732f3ca7SSteven Rostedt * we then just use a jmp as our nop. This isn't the most 325732f3ca7SSteven Rostedt * efficient nop, but we can not use a multi part nop 326732f3ca7SSteven Rostedt * since we would then risk being preempted in the middle 327732f3ca7SSteven Rostedt * of that nop, and if we enabled tracing then, it might 328732f3ca7SSteven Rostedt * cause a system crash. 329732f3ca7SSteven Rostedt * 330732f3ca7SSteven Rostedt * TODO: check the cpuid to determine the best nop. 331732f3ca7SSteven Rostedt */ 332732f3ca7SSteven Rostedt asm volatile ( 333732f3ca7SSteven Rostedt "ftrace_test_jmp:" 334732f3ca7SSteven Rostedt "jmp ftrace_test_p6nop\n" 3358b27386aSAnders Kaseorg "nop\n" 3368b27386aSAnders Kaseorg "nop\n" 3378b27386aSAnders Kaseorg "nop\n" /* 2 byte jmp + 3 bytes */ 338732f3ca7SSteven Rostedt "ftrace_test_p6nop:" 339732f3ca7SSteven Rostedt P6_NOP5 340732f3ca7SSteven Rostedt "jmp 1f\n" 341732f3ca7SSteven Rostedt "ftrace_test_nop5:" 342732f3ca7SSteven Rostedt ".byte 0x66,0x66,0x66,0x66,0x90\n" 343732f3ca7SSteven Rostedt "1:" 344732f3ca7SSteven Rostedt ".section .fixup, \"ax\"\n" 345732f3ca7SSteven Rostedt "2: movl $1, %0\n" 346732f3ca7SSteven Rostedt " jmp ftrace_test_nop5\n" 347732f3ca7SSteven Rostedt "3: movl $2, %0\n" 348732f3ca7SSteven Rostedt " jmp 1b\n" 349732f3ca7SSteven Rostedt ".previous\n" 350732f3ca7SSteven Rostedt _ASM_EXTABLE(ftrace_test_p6nop, 2b) 351732f3ca7SSteven Rostedt _ASM_EXTABLE(ftrace_test_nop5, 3b) 352732f3ca7SSteven Rostedt : "=r"(faulted) : "0" (faulted)); 353d61f82d0SSteven Rostedt 354732f3ca7SSteven Rostedt switch (faulted) { 355732f3ca7SSteven Rostedt case 0: 356732f3ca7SSteven Rostedt pr_info("ftrace: converting mcount calls to 0f 1f 44 00 00\n"); 3578115f3f0SSteven Rostedt memcpy(ftrace_nop, ftrace_test_p6nop, MCOUNT_INSN_SIZE); 358732f3ca7SSteven Rostedt break; 359732f3ca7SSteven Rostedt case 1: 360732f3ca7SSteven Rostedt pr_info("ftrace: converting mcount calls to 66 66 66 66 90\n"); 3618115f3f0SSteven Rostedt memcpy(ftrace_nop, ftrace_test_nop5, MCOUNT_INSN_SIZE); 362732f3ca7SSteven Rostedt break; 363732f3ca7SSteven Rostedt case 2: 3648b27386aSAnders Kaseorg pr_info("ftrace: converting mcount calls to jmp . + 5\n"); 3658115f3f0SSteven Rostedt memcpy(ftrace_nop, ftrace_test_jmp, MCOUNT_INSN_SIZE); 366732f3ca7SSteven Rostedt break; 367732f3ca7SSteven Rostedt } 368d61f82d0SSteven Rostedt 369732f3ca7SSteven Rostedt /* The return code is retured via data */ 370732f3ca7SSteven Rostedt *(unsigned long *)data = 0; 371dfa60abaSSteven Rostedt 3723d083395SSteven Rostedt return 0; 3733d083395SSteven Rostedt } 374caf4b323SFrederic Weisbecker #endif 375e7d3737eSFrederic Weisbecker 376fb52607aSFrederic Weisbecker #ifdef CONFIG_FUNCTION_GRAPH_TRACER 377e7d3737eSFrederic Weisbecker 3785a45cfe1SSteven Rostedt #ifdef CONFIG_DYNAMIC_FTRACE 3795a45cfe1SSteven Rostedt extern void ftrace_graph_call(void); 3805a45cfe1SSteven Rostedt 3815a45cfe1SSteven Rostedt static int ftrace_mod_jmp(unsigned long ip, 3825a45cfe1SSteven Rostedt int old_offset, int new_offset) 3835a45cfe1SSteven Rostedt { 3845a45cfe1SSteven Rostedt unsigned char code[MCOUNT_INSN_SIZE]; 3855a45cfe1SSteven Rostedt 3865a45cfe1SSteven Rostedt if (probe_kernel_read(code, (void *)ip, MCOUNT_INSN_SIZE)) 3875a45cfe1SSteven Rostedt return -EFAULT; 3885a45cfe1SSteven Rostedt 3895a45cfe1SSteven Rostedt if (code[0] != 0xe9 || old_offset != *(int *)(&code[1])) 3905a45cfe1SSteven Rostedt return -EINVAL; 3915a45cfe1SSteven Rostedt 3925a45cfe1SSteven Rostedt *(int *)(&code[1]) = new_offset; 3935a45cfe1SSteven Rostedt 3945a45cfe1SSteven Rostedt if (do_ftrace_mod_code(ip, &code)) 3955a45cfe1SSteven Rostedt return -EPERM; 3965a45cfe1SSteven Rostedt 3975a45cfe1SSteven Rostedt return 0; 3985a45cfe1SSteven Rostedt } 3995a45cfe1SSteven Rostedt 4005a45cfe1SSteven Rostedt int ftrace_enable_ftrace_graph_caller(void) 4015a45cfe1SSteven Rostedt { 4025a45cfe1SSteven Rostedt unsigned long ip = (unsigned long)(&ftrace_graph_call); 4035a45cfe1SSteven Rostedt int old_offset, new_offset; 4045a45cfe1SSteven Rostedt 4055a45cfe1SSteven Rostedt old_offset = (unsigned long)(&ftrace_stub) - (ip + MCOUNT_INSN_SIZE); 4065a45cfe1SSteven Rostedt new_offset = (unsigned long)(&ftrace_graph_caller) - (ip + MCOUNT_INSN_SIZE); 4075a45cfe1SSteven Rostedt 4085a45cfe1SSteven Rostedt return ftrace_mod_jmp(ip, old_offset, new_offset); 4095a45cfe1SSteven Rostedt } 4105a45cfe1SSteven Rostedt 4115a45cfe1SSteven Rostedt int ftrace_disable_ftrace_graph_caller(void) 4125a45cfe1SSteven Rostedt { 4135a45cfe1SSteven Rostedt unsigned long ip = (unsigned long)(&ftrace_graph_call); 4145a45cfe1SSteven Rostedt int old_offset, new_offset; 4155a45cfe1SSteven Rostedt 4165a45cfe1SSteven Rostedt old_offset = (unsigned long)(&ftrace_graph_caller) - (ip + MCOUNT_INSN_SIZE); 4175a45cfe1SSteven Rostedt new_offset = (unsigned long)(&ftrace_stub) - (ip + MCOUNT_INSN_SIZE); 4185a45cfe1SSteven Rostedt 4195a45cfe1SSteven Rostedt return ftrace_mod_jmp(ip, old_offset, new_offset); 4205a45cfe1SSteven Rostedt } 4215a45cfe1SSteven Rostedt 422e7d3737eSFrederic Weisbecker #endif /* !CONFIG_DYNAMIC_FTRACE */ 423e7d3737eSFrederic Weisbecker 424e7d3737eSFrederic Weisbecker /* 425e7d3737eSFrederic Weisbecker * Hook the return address and push it in the stack of return addrs 426e7d3737eSFrederic Weisbecker * in current thread info. 427e7d3737eSFrederic Weisbecker */ 42871e308a2SSteven Rostedt void prepare_ftrace_return(unsigned long *parent, unsigned long self_addr, 42971e308a2SSteven Rostedt unsigned long frame_pointer) 430e7d3737eSFrederic Weisbecker { 431e7d3737eSFrederic Weisbecker unsigned long old; 432e7d3737eSFrederic Weisbecker int faulted; 433287b6e68SFrederic Weisbecker struct ftrace_graph_ent trace; 434e7d3737eSFrederic Weisbecker unsigned long return_hooker = (unsigned long) 435e7d3737eSFrederic Weisbecker &return_to_handler; 436e7d3737eSFrederic Weisbecker 437380c4b14SFrederic Weisbecker if (unlikely(atomic_read(¤t->tracing_graph_pause))) 438e7d3737eSFrederic Weisbecker return; 439e7d3737eSFrederic Weisbecker 440e7d3737eSFrederic Weisbecker /* 441e7d3737eSFrederic Weisbecker * Protect against fault, even if it shouldn't 442e7d3737eSFrederic Weisbecker * happen. This tool is too much intrusive to 443e7d3737eSFrederic Weisbecker * ignore such a protection. 444e7d3737eSFrederic Weisbecker */ 445e7d3737eSFrederic Weisbecker asm volatile( 44696665788SSteven Rostedt "1: " _ASM_MOV " (%[parent]), %[old]\n" 44796665788SSteven Rostedt "2: " _ASM_MOV " %[return_hooker], (%[parent])\n" 448e7d3737eSFrederic Weisbecker " movl $0, %[faulted]\n" 449e3944bfaSSteven Rostedt "3:\n" 450e7d3737eSFrederic Weisbecker 451e7d3737eSFrederic Weisbecker ".section .fixup, \"ax\"\n" 452e3944bfaSSteven Rostedt "4: movl $1, %[faulted]\n" 453e3944bfaSSteven Rostedt " jmp 3b\n" 454e7d3737eSFrederic Weisbecker ".previous\n" 455e7d3737eSFrederic Weisbecker 456e3944bfaSSteven Rostedt _ASM_EXTABLE(1b, 4b) 457e3944bfaSSteven Rostedt _ASM_EXTABLE(2b, 4b) 458e7d3737eSFrederic Weisbecker 459aa512a27SSteven Rostedt : [old] "=&r" (old), [faulted] "=r" (faulted) 46096665788SSteven Rostedt : [parent] "r" (parent), [return_hooker] "r" (return_hooker) 461e7d3737eSFrederic Weisbecker : "memory" 462e7d3737eSFrederic Weisbecker ); 463e7d3737eSFrederic Weisbecker 46414a866c5SSteven Rostedt if (unlikely(faulted)) { 46514a866c5SSteven Rostedt ftrace_graph_stop(); 46614a866c5SSteven Rostedt WARN_ON(1); 467e7d3737eSFrederic Weisbecker return; 468e7d3737eSFrederic Weisbecker } 469e7d3737eSFrederic Weisbecker 47071e308a2SSteven Rostedt if (ftrace_push_return_trace(old, self_addr, &trace.depth, 47171e308a2SSteven Rostedt frame_pointer) == -EBUSY) { 472e7d3737eSFrederic Weisbecker *parent = old; 473287b6e68SFrederic Weisbecker return; 474287b6e68SFrederic Weisbecker } 475287b6e68SFrederic Weisbecker 476287b6e68SFrederic Weisbecker trace.func = self_addr; 477287b6e68SFrederic Weisbecker 478e49dc19cSSteven Rostedt /* Only trace if the calling function expects to */ 479e49dc19cSSteven Rostedt if (!ftrace_graph_entry(&trace)) { 480e49dc19cSSteven Rostedt current->curr_ret_stack--; 481e49dc19cSSteven Rostedt *parent = old; 482e49dc19cSSteven Rostedt } 483e7d3737eSFrederic Weisbecker } 484fb52607aSFrederic Weisbecker #endif /* CONFIG_FUNCTION_GRAPH_TRACER */ 485f58ba100SFrederic Weisbecker 486f58ba100SFrederic Weisbecker #ifdef CONFIG_FTRACE_SYSCALLS 487f58ba100SFrederic Weisbecker 488f58ba100SFrederic Weisbecker extern unsigned long __start_syscalls_metadata[]; 489f58ba100SFrederic Weisbecker extern unsigned long __stop_syscalls_metadata[]; 490f58ba100SFrederic Weisbecker extern unsigned long *sys_call_table; 491f58ba100SFrederic Weisbecker 492f58ba100SFrederic Weisbecker static struct syscall_metadata **syscalls_metadata; 493f58ba100SFrederic Weisbecker 494f58ba100SFrederic Weisbecker static struct syscall_metadata *find_syscall_meta(unsigned long *syscall) 495f58ba100SFrederic Weisbecker { 496f58ba100SFrederic Weisbecker struct syscall_metadata *start; 497f58ba100SFrederic Weisbecker struct syscall_metadata *stop; 498f58ba100SFrederic Weisbecker char str[KSYM_SYMBOL_LEN]; 499f58ba100SFrederic Weisbecker 500f58ba100SFrederic Weisbecker 501f58ba100SFrederic Weisbecker start = (struct syscall_metadata *)__start_syscalls_metadata; 502f58ba100SFrederic Weisbecker stop = (struct syscall_metadata *)__stop_syscalls_metadata; 503f58ba100SFrederic Weisbecker kallsyms_lookup((unsigned long) syscall, NULL, NULL, NULL, str); 504f58ba100SFrederic Weisbecker 505f58ba100SFrederic Weisbecker for ( ; start < stop; start++) { 506f58ba100SFrederic Weisbecker if (start->name && !strcmp(start->name, str)) 507f58ba100SFrederic Weisbecker return start; 508f58ba100SFrederic Weisbecker } 509f58ba100SFrederic Weisbecker return NULL; 510f58ba100SFrederic Weisbecker } 511f58ba100SFrederic Weisbecker 512f58ba100SFrederic Weisbecker struct syscall_metadata *syscall_nr_to_meta(int nr) 513f58ba100SFrederic Weisbecker { 51457421dbbSJason Baron if (!syscalls_metadata || nr >= NR_syscalls || nr < 0) 515f58ba100SFrederic Weisbecker return NULL; 516f58ba100SFrederic Weisbecker 517f58ba100SFrederic Weisbecker return syscalls_metadata[nr]; 518f58ba100SFrederic Weisbecker } 519f58ba100SFrederic Weisbecker 520eeac19a7SJason Baron int syscall_name_to_nr(char *name) 521eeac19a7SJason Baron { 522eeac19a7SJason Baron int i; 523eeac19a7SJason Baron 524eeac19a7SJason Baron if (!syscalls_metadata) 525eeac19a7SJason Baron return -1; 526eeac19a7SJason Baron 52757421dbbSJason Baron for (i = 0; i < NR_syscalls; i++) { 528eeac19a7SJason Baron if (syscalls_metadata[i]) { 529eeac19a7SJason Baron if (!strcmp(syscalls_metadata[i]->name, name)) 530eeac19a7SJason Baron return i; 531eeac19a7SJason Baron } 532eeac19a7SJason Baron } 533eeac19a7SJason Baron return -1; 534eeac19a7SJason Baron } 535eeac19a7SJason Baron 53664c12e04SJason Baron void set_syscall_enter_id(int num, int id) 53764c12e04SJason Baron { 53864c12e04SJason Baron syscalls_metadata[num]->enter_id = id; 53964c12e04SJason Baron } 54064c12e04SJason Baron 54164c12e04SJason Baron void set_syscall_exit_id(int num, int id) 54264c12e04SJason Baron { 54364c12e04SJason Baron syscalls_metadata[num]->exit_id = id; 54464c12e04SJason Baron } 54564c12e04SJason Baron 546066e0378SJason Baron static int __init arch_init_ftrace_syscalls(void) 547f58ba100SFrederic Weisbecker { 548f58ba100SFrederic Weisbecker int i; 549f58ba100SFrederic Weisbecker struct syscall_metadata *meta; 550f58ba100SFrederic Weisbecker unsigned long **psys_syscall_table = &sys_call_table; 551f58ba100SFrederic Weisbecker 552f58ba100SFrederic Weisbecker syscalls_metadata = kzalloc(sizeof(*syscalls_metadata) * 55357421dbbSJason Baron NR_syscalls, GFP_KERNEL); 554f58ba100SFrederic Weisbecker if (!syscalls_metadata) { 555f58ba100SFrederic Weisbecker WARN_ON(1); 556066e0378SJason Baron return -ENOMEM; 557f58ba100SFrederic Weisbecker } 558f58ba100SFrederic Weisbecker 55957421dbbSJason Baron for (i = 0; i < NR_syscalls; i++) { 560f58ba100SFrederic Weisbecker meta = find_syscall_meta(psys_syscall_table[i]); 561f58ba100SFrederic Weisbecker syscalls_metadata[i] = meta; 562f58ba100SFrederic Weisbecker } 563066e0378SJason Baron return 0; 564f58ba100SFrederic Weisbecker } 565066e0378SJason Baron arch_initcall(arch_init_ftrace_syscalls); 566f58ba100SFrederic Weisbecker #endif 567