2 * Code for replacing ftrace calls with jumps.
6 * Thanks goes out to P.A. Semi, Inc for supplying me with a PPC64 box.
8 * Added function graph tracer code, taken from x86 that was written
9 * by Frederic Weisbecker, and ported to PPC by Steven Rostedt.
13 #define pr_fmt(fmt) "ftrace-powerpc: " fmt
15 #include <linux/spinlock.h>
16 #include <linux/hardirq.h>
17 #include <linux/uaccess.h>
18 #include <linux/module.h>
19 #include <linux/ftrace.h>
20 #include <linux/percpu.h>
21 #include <linux/init.h>
22 #include <linux/list.h>
24 #include <asm/cacheflush.h>
25 #include <asm/code-patching.h>
26 #include <asm/ftrace.h>
27 #include <asm/syscall.h>
30 #ifdef CONFIG_DYNAMIC_FTRACE
32 ftrace_call_replace(unsigned long ip, unsigned long addr, int link)
36 addr = ppc_function_entry((void *)addr);
38 /* if (link) set op to 'bl' else 'b' */
39 op = create_branch((unsigned int *)ip, addr, link ? 1 : 0);
45 ftrace_modify_code(unsigned long ip, unsigned int old, unsigned int new)
47 unsigned int replaced;
50 * Note: Due to modules and __init, code can
51 * disappear and change, we need to protect against faulting
52 * as well as code changing. We do this by using the
53 * probe_kernel_* functions.
55 * No real locking needed, this code is run through
56 * kstop_machine, or before SMP starts.
59 /* read the text we want to modify */
60 if (probe_kernel_read(&replaced, (void *)ip, MCOUNT_INSN_SIZE))
63 /* Make sure it is what we expect it to be */
64 if (replaced != old) {
65 pr_err("%p: replaced (%#x) != old (%#x)",
66 (void *)ip, replaced, old);
70 /* replace the text with the new text */
71 if (patch_instruction((unsigned int *)ip, new))
78 * Helper functions that are the same for both PPC64 and PPC32.
80 static int test_24bit_addr(unsigned long ip, unsigned long addr)
82 addr = ppc_function_entry((void *)addr);
84 /* use the create_branch to verify that this offset can be branched */
85 return create_branch((unsigned int *)ip, addr, 0);
90 static int is_bl_op(unsigned int op)
92 return (op & 0xfc000003) == 0x48000001;
95 static unsigned long find_bl_target(unsigned long ip, unsigned int op)
99 offset = (op & 0x03fffffc);
101 if (offset & 0x02000000)
102 offset |= 0xfe000000;
104 return ip + (long)offset;
109 __ftrace_make_nop(struct module *mod,
110 struct dyn_ftrace *rec, unsigned long addr)
112 unsigned long entry, ptr, tramp;
113 unsigned long ip = rec->ip;
114 unsigned int op, pop;
116 /* read where this goes */
117 if (probe_kernel_read(&op, (void *)ip, sizeof(int))) {
118 pr_err("Fetching opcode failed.\n");
122 /* Make sure that that this is still a 24bit jump */
124 pr_err("Not expected bl: opcode is %x\n", op);
128 /* lets find where the pointer goes */
129 tramp = find_bl_target(ip, op);
131 pr_devel("ip:%lx jumps to %lx", ip, tramp);
133 if (module_trampoline_target(mod, tramp, &ptr)) {
134 pr_err("Failed to get trampoline target\n");
138 pr_devel("trampoline target %lx", ptr);
140 entry = ppc_global_function_entry((void *)addr);
141 /* This should match what was called */
143 pr_err("addr %lx does not match expected %lx\n", ptr, entry);
148 * Our original call site looks like:
153 * Milton Miller pointed out that we can not simply nop the branch.
154 * If a task was preempted when calling a trace function, the nops
155 * will remove the way to restore the TOC in r2 and the r2 TOC will
158 * Use a b +8 to jump over the load.
161 pop = PPC_INST_BRANCH | 8; /* b +8 */
164 * Check what is in the next instruction. We can see ld r2,40(r1), but
165 * on first pass after boot we will see mflr r0.
167 if (probe_kernel_read(&op, (void *)(ip+4), MCOUNT_INSN_SIZE)) {
168 pr_err("Fetching op failed.\n");
172 if (op != PPC_INST_LD_TOC) {
175 if (probe_kernel_read(&inst, (void *)(ip - 4), 4)) {
176 pr_err("Fetching instruction at %lx failed.\n", ip - 4);
180 /* We expect either a mlfr r0, or a std r0, LRSAVE(r1) */
181 if (inst != PPC_INST_MFLR && inst != PPC_INST_STD_LR) {
182 pr_err("Unexpected instructions around bl _mcount\n"
183 "when enabling dynamic ftrace!\t"
184 "(%08x,bl,%08x)\n", inst, op);
188 /* When using -mkernel_profile there is no load to jump over */
192 if (patch_instruction((unsigned int *)ip, pop)) {
193 pr_err("Patching NOP failed.\n");
202 __ftrace_make_nop(struct module *mod,
203 struct dyn_ftrace *rec, unsigned long addr)
207 unsigned long ip = rec->ip;
210 if (probe_kernel_read(&op, (void *)ip, MCOUNT_INSN_SIZE))
213 /* Make sure that that this is still a 24bit jump */
215 pr_err("Not expected bl: opcode is %x\n", op);
219 /* lets find where the pointer goes */
220 tramp = find_bl_target(ip, op);
223 * On PPC32 the trampoline looks like:
224 * 0x3d, 0x80, 0x00, 0x00 lis r12,sym@ha
225 * 0x39, 0x8c, 0x00, 0x00 addi r12,r12,sym@l
226 * 0x7d, 0x89, 0x03, 0xa6 mtctr r12
227 * 0x4e, 0x80, 0x04, 0x20 bctr
230 pr_devel("ip:%lx jumps to %lx", ip, tramp);
232 /* Find where the trampoline jumps to */
233 if (probe_kernel_read(jmp, (void *)tramp, sizeof(jmp))) {
234 pr_err("Failed to read %lx\n", tramp);
238 pr_devel(" %08x %08x ", jmp[0], jmp[1]);
240 /* verify that this is what we expect it to be */
241 if (((jmp[0] & 0xffff0000) != 0x3d800000) ||
242 ((jmp[1] & 0xffff0000) != 0x398c0000) ||
243 (jmp[2] != 0x7d8903a6) ||
244 (jmp[3] != 0x4e800420)) {
245 pr_err("Not a trampoline\n");
249 tramp = (jmp[1] & 0xffff) |
250 ((jmp[0] & 0xffff) << 16);
254 pr_devel(" %lx ", tramp);
257 pr_err("Trampoline location %08lx does not match addr\n",
264 if (patch_instruction((unsigned int *)ip, op))
270 #endif /* CONFIG_MODULES */
272 int ftrace_make_nop(struct module *mod,
273 struct dyn_ftrace *rec, unsigned long addr)
275 unsigned long ip = rec->ip;
276 unsigned int old, new;
279 * If the calling address is more that 24 bits away,
280 * then we had to use a trampoline to make the call.
281 * Otherwise just update the call site.
283 if (test_24bit_addr(ip, addr)) {
285 old = ftrace_call_replace(ip, addr, 1);
287 return ftrace_modify_code(ip, old, new);
290 #ifdef CONFIG_MODULES
292 * Out of range jumps are called from modules.
293 * We should either already have a pointer to the module
294 * or it has been passed in.
296 if (!rec->arch.mod) {
298 pr_err("No module loaded addr=%lx\n", addr);
303 if (mod != rec->arch.mod) {
304 pr_err("Record mod %p not equal to passed in mod %p\n",
308 /* nothing to do if mod == rec->arch.mod */
312 return __ftrace_make_nop(mod, rec, addr);
314 /* We should not get here without modules */
316 #endif /* CONFIG_MODULES */
319 #ifdef CONFIG_MODULES
322 * Examine the existing instructions for __ftrace_make_call.
323 * They should effectively be a NOP, and follow formal constraints,
324 * depending on the ABI. Return false if they don't.
326 #ifndef CC_USING_MPROFILE_KERNEL
328 expected_nop_sequence(void *ip, unsigned int op0, unsigned int op1)
336 * The load offset is different depending on the ABI. For simplicity
337 * just mask it out when doing the compare.
339 if ((op0 != 0x48000008) || ((op1 & 0xffff0000) != 0xe8410000))
345 expected_nop_sequence(void *ip, unsigned int op0, unsigned int op1)
347 /* look for patched "NOP" on ppc64 with -mprofile-kernel */
348 if (op0 != PPC_INST_NOP)
355 __ftrace_make_call(struct dyn_ftrace *rec, unsigned long addr)
358 void *ip = (void *)rec->ip;
360 /* read where this goes */
361 if (probe_kernel_read(op, ip, sizeof(op)))
364 if (!expected_nop_sequence(ip, op[0], op[1])) {
365 pr_err("Unexpected call sequence at %p: %x %x\n",
370 /* If we never set up a trampoline to ftrace_caller, then bail */
371 if (!rec->arch.mod->arch.tramp) {
372 pr_err("No ftrace trampoline\n");
376 /* Ensure branch is within 24 bits */
377 if (!create_branch(ip, rec->arch.mod->arch.tramp, BRANCH_SET_LINK)) {
378 pr_err("Branch out of range\n");
382 if (patch_branch(ip, rec->arch.mod->arch.tramp, BRANCH_SET_LINK)) {
383 pr_err("REL24 out of range!\n");
390 #ifdef CONFIG_DYNAMIC_FTRACE_WITH_REGS
391 int ftrace_modify_call(struct dyn_ftrace *rec, unsigned long old_addr,
394 return ftrace_make_call(rec, addr);
398 #else /* !CONFIG_PPC64: */
400 __ftrace_make_call(struct dyn_ftrace *rec, unsigned long addr)
403 unsigned long ip = rec->ip;
405 /* read where this goes */
406 if (probe_kernel_read(&op, (void *)ip, MCOUNT_INSN_SIZE))
409 /* It should be pointing to a nop */
410 if (op != PPC_INST_NOP) {
411 pr_err("Expected NOP but have %x\n", op);
415 /* If we never set up a trampoline to ftrace_caller, then bail */
416 if (!rec->arch.mod->arch.tramp) {
417 pr_err("No ftrace trampoline\n");
421 /* create the branch to the trampoline */
422 op = create_branch((unsigned int *)ip,
423 rec->arch.mod->arch.tramp, BRANCH_SET_LINK);
425 pr_err("REL24 out of range!\n");
429 pr_devel("write to %lx\n", rec->ip);
431 if (patch_instruction((unsigned int *)ip, op))
436 #endif /* CONFIG_PPC64 */
437 #endif /* CONFIG_MODULES */
439 int ftrace_make_call(struct dyn_ftrace *rec, unsigned long addr)
441 unsigned long ip = rec->ip;
442 unsigned int old, new;
445 * If the calling address is more that 24 bits away,
446 * then we had to use a trampoline to make the call.
447 * Otherwise just update the call site.
449 if (test_24bit_addr(ip, addr)) {
452 new = ftrace_call_replace(ip, addr, 1);
453 return ftrace_modify_code(ip, old, new);
456 #ifdef CONFIG_MODULES
458 * Out of range jumps are called from modules.
459 * Being that we are converting from nop, it had better
460 * already have a module defined.
462 if (!rec->arch.mod) {
463 pr_err("No module loaded\n");
467 return __ftrace_make_call(rec, addr);
469 /* We should not get here without modules */
471 #endif /* CONFIG_MODULES */
474 int ftrace_update_ftrace_func(ftrace_func_t func)
476 unsigned long ip = (unsigned long)(&ftrace_call);
477 unsigned int old, new;
480 old = *(unsigned int *)&ftrace_call;
481 new = ftrace_call_replace(ip, (unsigned long)func, 1);
482 ret = ftrace_modify_code(ip, old, new);
487 static int __ftrace_replace_code(struct dyn_ftrace *rec, int enable)
489 unsigned long ftrace_addr = (unsigned long)FTRACE_ADDR;
492 ret = ftrace_update_record(rec, enable);
495 case FTRACE_UPDATE_IGNORE:
497 case FTRACE_UPDATE_MAKE_CALL:
498 return ftrace_make_call(rec, ftrace_addr);
499 case FTRACE_UPDATE_MAKE_NOP:
500 return ftrace_make_nop(NULL, rec, ftrace_addr);
506 void ftrace_replace_code(int enable)
508 struct ftrace_rec_iter *iter;
509 struct dyn_ftrace *rec;
512 for (iter = ftrace_rec_iter_start(); iter;
513 iter = ftrace_rec_iter_next(iter)) {
514 rec = ftrace_rec_iter_record(iter);
515 ret = __ftrace_replace_code(rec, enable);
517 ftrace_bug(ret, rec);
524 * Use the default ftrace_modify_all_code, but without
527 void arch_ftrace_update_code(int command)
529 ftrace_modify_all_code(command);
532 int __init ftrace_dyn_arch_init(void)
536 #endif /* CONFIG_DYNAMIC_FTRACE */
538 #ifdef CONFIG_FUNCTION_GRAPH_TRACER
540 #ifdef CONFIG_DYNAMIC_FTRACE
541 extern void ftrace_graph_call(void);
542 extern void ftrace_graph_stub(void);
544 int ftrace_enable_ftrace_graph_caller(void)
546 unsigned long ip = (unsigned long)(&ftrace_graph_call);
547 unsigned long addr = (unsigned long)(&ftrace_graph_caller);
548 unsigned long stub = (unsigned long)(&ftrace_graph_stub);
549 unsigned int old, new;
551 old = ftrace_call_replace(ip, stub, 0);
552 new = ftrace_call_replace(ip, addr, 0);
554 return ftrace_modify_code(ip, old, new);
557 int ftrace_disable_ftrace_graph_caller(void)
559 unsigned long ip = (unsigned long)(&ftrace_graph_call);
560 unsigned long addr = (unsigned long)(&ftrace_graph_caller);
561 unsigned long stub = (unsigned long)(&ftrace_graph_stub);
562 unsigned int old, new;
564 old = ftrace_call_replace(ip, addr, 0);
565 new = ftrace_call_replace(ip, stub, 0);
567 return ftrace_modify_code(ip, old, new);
569 #endif /* CONFIG_DYNAMIC_FTRACE */
572 * Hook the return address and push it in the stack of return addrs
573 * in current thread info. Return the address we want to divert to.
575 unsigned long prepare_ftrace_return(unsigned long parent, unsigned long ip)
577 struct ftrace_graph_ent trace;
578 unsigned long return_hooker;
580 if (unlikely(ftrace_graph_is_dead()))
583 if (unlikely(atomic_read(¤t->tracing_graph_pause)))
586 return_hooker = ppc_function_entry(return_to_handler);
589 trace.depth = current->curr_ret_stack + 1;
591 /* Only trace if the calling function expects to */
592 if (!ftrace_graph_entry(&trace))
595 if (ftrace_push_return_trace(parent, ip, &trace.depth, 0) == -EBUSY)
598 parent = return_hooker;
602 #endif /* CONFIG_FUNCTION_GRAPH_TRACER */
604 #if defined(CONFIG_FTRACE_SYSCALLS) && defined(CONFIG_PPC64)
605 unsigned long __init arch_syscall_addr(int nr)
607 return sys_call_table[nr*2];
609 #endif /* CONFIG_FTRACE_SYSCALLS && CONFIG_PPC64 */