// SPDX-License-Identifier: GPL-2.0-only
/*
 * arch/arm64/kernel/ftrace.c
 *
 * Copyright (C) 2013 Linaro Limited
 * Author: AKASHI Takahiro <takahiro.akashi@linaro.org>
 */

#include <linux/ftrace.h>
#include <linux/module.h>
#include <linux/swab.h>
#include <linux/uaccess.h>

#include <asm/cacheflush.h>
#include <asm/debug-monitors.h>
#include <asm/ftrace.h>
#include <asm/insn.h>
#include <asm/text-patching.h>

#ifdef CONFIG_DYNAMIC_FTRACE_WITH_ARGS
struct fregs_offset {
	const char *name;
	int offset;
};

#define FREGS_OFFSET(n, field)						\
{									\
	.name = n,							\
	.offset = offsetof(struct __arch_ftrace_regs, field),		\
}

static const struct fregs_offset fregs_offsets[] = {
	FREGS_OFFSET("x0", regs[0]),
	FREGS_OFFSET("x1", regs[1]),
	FREGS_OFFSET("x2", regs[2]),
	FREGS_OFFSET("x3", regs[3]),
	FREGS_OFFSET("x4", regs[4]),
	FREGS_OFFSET("x5", regs[5]),
	FREGS_OFFSET("x6", regs[6]),
	FREGS_OFFSET("x7", regs[7]),
	FREGS_OFFSET("x8", regs[8]),

	FREGS_OFFSET("x29", fp),
	FREGS_OFFSET("x30", lr),
	FREGS_OFFSET("lr", lr),

	FREGS_OFFSET("sp", sp),
	FREGS_OFFSET("pc", pc),
};

int ftrace_regs_query_register_offset(const char *name)
{
	for (int i = 0; i < ARRAY_SIZE(fregs_offsets); i++) {
		const struct fregs_offset *roff = &fregs_offsets[i];
		if (!strcmp(roff->name, name))
			return roff->offset;
	}

	return -EINVAL;
}
#endif

unsigned long ftrace_call_adjust(unsigned long addr)
{
	/*
	 * When using mcount, addr is the address of the mcount call
	 * instruction, and no adjustment is necessary.
	 */
	if (!IS_ENABLED(CONFIG_DYNAMIC_FTRACE_WITH_ARGS))
		return addr;

	/*
	 * When using patchable-function-entry without pre-function NOPs, addr
	 * is the address of the first NOP after the function entry point.
	 *
	 * The compiler has either generated:
	 *
	 * addr+00: func: NOP	// To be patched to MOV X9, LR
	 * addr+04:       NOP	// To be patched to BL <caller>
	 *
	 * Or:
	 *
	 * addr-04:       BTI C
	 * addr+00: func: NOP	// To be patched to MOV X9, LR
	 * addr+04:       NOP	// To be patched to BL <caller>
	 *
	 * We must adjust addr to the address of the NOP which will be patched
	 * to `BL <caller>`, which is at `addr + 4` bytes in either case.
	 */
	if (!IS_ENABLED(CONFIG_DYNAMIC_FTRACE_WITH_CALL_OPS))
		return addr + AARCH64_INSN_SIZE;

	/*
	 * When using patchable-function-entry with pre-function NOPs, addr is
	 * the address of the first pre-function NOP.
	 *
	 * Starting from an 8-byte aligned base, the compiler has either
	 * generated:
	 *
	 * addr+00:       NOP	// Literal (first 32 bits)
	 * addr+04:       NOP	// Literal (last 32 bits)
	 * addr+08: func: NOP	// To be patched to MOV X9, LR
	 * addr+12:       NOP	// To be patched to BL <caller>
	 *
	 * Or:
	 *
	 * addr+00:       NOP	// Literal (first 32 bits)
	 * addr+04:       NOP	// Literal (last 32 bits)
	 * addr+08: func: BTI C
	 * addr+12:       NOP	// To be patched to MOV X9, LR
	 * addr+16:       NOP	// To be patched to BL <caller>
	 *
	 * We must adjust addr to the address of the NOP which will be patched
	 * to `BL <caller>`, which is at either addr+12 or addr+16 depending on
	 * whether there is a BTI.
	 */

	if (!IS_ALIGNED(addr, sizeof(unsigned long))) {
		WARN_RATELIMIT(1, "Misaligned patch-site %pS\n",
			       (void *)(addr + 8));
		return 0;
	}

	/* Skip the NOPs placed before the function entry point */
	addr += 2 * AARCH64_INSN_SIZE;

	/* Skip any BTI */
	if (IS_ENABLED(CONFIG_ARM64_BTI_KERNEL)) {
		u32 insn = le32_to_cpu(*(__le32 *)addr);

		if (aarch64_insn_is_bti(insn)) {
			addr += AARCH64_INSN_SIZE;
		} else if (insn != aarch64_insn_gen_nop()) {
			WARN_RATELIMIT(1, "unexpected insn in patch-site %pS: 0x%08x\n",
				       (void *)addr, insn);
		}
	}

	/* Skip the first NOP after function entry */
	addr += AARCH64_INSN_SIZE;

	return addr;
}
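
/*
 * Worked example (illustrative sketch, derived from the layouts above): with
 * CONFIG_DYNAMIC_FTRACE_WITH_CALL_OPS=y and CONFIG_ARM64_BTI_KERNEL=y, an
 * 8-byte aligned patch-site address is adjusted in three steps:
 *
 *	addr		// start of the two literal NOPs
 *	addr + 8	// after skipping the 8-byte literal
 *	addr + 12	// after skipping the BTI C
 *	addr + 16	// after skipping the MOV X9, LR slot; this is the
 *			// `BL <caller>` slot that is returned
 */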

/* Convert fentry_ip to the symbol address without kallsyms */
unsigned long arch_ftrace_get_symaddr(unsigned long fentry_ip)
{
	u32 insn;

	/*
	 * When using patchable-function-entry without pre-function NOPs, the
	 * ftrace entry is the address of the first NOP after the function
	 * entry point.
	 *
	 * The compiler has either generated:
	 *
	 * func+00: func: NOP	// To be patched to MOV X9, LR
	 * func+04:       NOP	// To be patched to BL <caller>
	 *
	 * Or:
	 *
	 * func-04:       BTI C
	 * func+00: func: NOP	// To be patched to MOV X9, LR
	 * func+04:       NOP	// To be patched to BL <caller>
	 *
	 * fentry_ip is the address of the `BL <caller>` slot, which is at
	 * `func + 4` bytes in either case.
	 */
	if (!IS_ENABLED(CONFIG_DYNAMIC_FTRACE_WITH_CALL_OPS))
		return fentry_ip - AARCH64_INSN_SIZE;

	/*
	 * When using patchable-function-entry with pre-function NOPs, any BTI
	 * sits at the function entry point itself, so the layout differs:
	 *
	 * func+00: func: NOP	// To be patched to MOV X9, LR
	 * func+04:       NOP	// To be patched to BL <caller>
	 *
	 * Or:
	 *
	 * func+00: func: BTI C
	 * func+04:       NOP	// To be patched to MOV X9, LR
	 * func+08:       NOP	// To be patched to BL <caller>
	 *
	 * fentry_ip is the address of the `BL <caller>` slot, which is at
	 * either `func + 4` or `func + 8` depending on whether there is a
	 * BTI.
	 */

	/* If there is no BTI, the func address is one instruction before fentry_ip. */
	if (!IS_ENABLED(CONFIG_ARM64_BTI_KERNEL))
		return fentry_ip - AARCH64_INSN_SIZE;

	/* We want to be extra safe in case entry ip is on the page edge,
	 * but otherwise we need to avoid get_kernel_nofault()'s overhead.
	 */
	if ((fentry_ip & ~PAGE_MASK) < AARCH64_INSN_SIZE * 2) {
		if (get_kernel_nofault(insn, (u32 *)(fentry_ip - AARCH64_INSN_SIZE * 2)))
			return 0;
	} else {
		insn = *(u32 *)(fentry_ip - AARCH64_INSN_SIZE * 2);
	}

	if (aarch64_insn_is_bti(le32_to_cpu((__le32)insn)))
		return fentry_ip - AARCH64_INSN_SIZE * 2;

	return fentry_ip - AARCH64_INSN_SIZE;
}

/*
 * Replace a single instruction, which may be a branch or NOP.
 * If @validate == true, the instruction being replaced is checked against
 * 'old'.
 */
static int ftrace_modify_code(unsigned long pc, u32 old, u32 new,
			      bool validate)
{
	u32 replaced;

	/*
	 * Note:
	 * We are paranoid about modifying text, as if a bug were to happen, it
	 * could cause us to read or write to someplace that could cause harm.
	 * Carefully read and modify the code with aarch64_insn_*() which uses
	 * probe_kernel_*(), and make sure what we read is what we expected it
	 * to be before modifying it.
	 */
	if (validate) {
		if (aarch64_insn_read((void *)pc, &replaced))
			return -EFAULT;

		if (replaced != old)
			return -EINVAL;
	}
	if (aarch64_insn_patch_text_nosync((void *)pc, new))
		return -EPERM;

	return 0;
}
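
/*
 * A typical call sequence, as used by ftrace_make_call() below (sketch):
 *
 *	old = aarch64_insn_gen_nop();
 *	new = aarch64_insn_gen_branch_imm(pc, addr, AARCH64_INSN_BRANCH_LINK);
 *	ret = ftrace_modify_code(pc, old, new, true);
 *
 * Validation is only skipped where the existing instruction cannot be known
 * in advance, as in ftrace_update_ftrace_func().
 */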

/*
 * Replace tracer function in ftrace_caller()
 */
int ftrace_update_ftrace_func(ftrace_func_t func)
{
	unsigned long pc;
	u32 new;

	/*
	 * When using CALL_OPS, the function to call is associated with the
	 * call site, and we don't have a global function pointer to update.
	 */
	if (IS_ENABLED(CONFIG_DYNAMIC_FTRACE_WITH_CALL_OPS))
		return 0;

	pc = (unsigned long)ftrace_call;
	new = aarch64_insn_gen_branch_imm(pc, (unsigned long)func,
					  AARCH64_INSN_BRANCH_LINK);

	return ftrace_modify_code(pc, 0, new, false);
}

static struct plt_entry *get_ftrace_plt(struct module *mod, unsigned long addr)
{
#ifdef CONFIG_MODULES
	struct plt_entry *plt = NULL;

	if (within_module_mem_type(addr, mod, MOD_INIT_TEXT))
		plt = mod->arch.init_ftrace_trampolines;
	else if (within_module_mem_type(addr, mod, MOD_TEXT))
		plt = mod->arch.ftrace_trampolines;
	else
		return NULL;

	return &plt[FTRACE_PLT_IDX];
#else
	return NULL;
#endif
}

static bool reachable_by_bl(unsigned long addr, unsigned long pc)
{
	long offset = (long)addr - (long)pc;

	return offset >= -SZ_128M && offset < SZ_128M;
}

/*
 * Find the address the callsite must branch to in order to reach '*addr'.
 *
 * Due to the limited range of 'BL' instructions, modules may be placed too far
 * away to branch directly and must use a PLT.
 *
 * Returns true when '*addr' contains a reachable target address, or has been
 * modified to contain a PLT address. Returns false otherwise.
 */
static bool ftrace_find_callable_addr(struct dyn_ftrace *rec,
				      struct module *mod,
				      unsigned long *addr)
{
	unsigned long pc = rec->ip;
	struct plt_entry *plt;

	/*
	 * If a custom trampoline is unreachable, rely on the ftrace_caller
	 * trampoline which knows how to indirectly reach that trampoline
	 * through ops->direct_call.
	 */
	if (*addr != FTRACE_ADDR && !reachable_by_bl(*addr, pc))
		*addr = FTRACE_ADDR;

	/*
	 * When the target is within range of the 'BL' instruction, use 'addr'
	 * as-is and branch to that directly.
	 */
	if (reachable_by_bl(*addr, pc))
		return true;

	/*
	 * When the target is outside of the range of a 'BL' instruction, we
	 * must use a PLT to reach it. We can only place PLTs for modules, and
	 * only when module PLT support is built-in.
	 */
	if (!IS_ENABLED(CONFIG_MODULES))
		return false;

	/*
	 * 'mod' is only set at module load time, but if we end up
	 * dealing with an out-of-range condition, we can assume it
	 * is due to a module being loaded far away from the kernel.
	 *
	 * NOTE: __module_text_address() must be called within an RCU read
	 * section, but we can rely on ftrace_lock to ensure that 'mod'
	 * retains its validity throughout the remainder of this code.
	 */
	if (!mod) {
		guard(rcu)();
		mod = __module_text_address(pc);
	}

	if (WARN_ON(!mod))
		return false;

	plt = get_ftrace_plt(mod, pc);
	if (!plt) {
		pr_err("ftrace: no module PLT for %ps\n", (void *)*addr);
		return false;
	}

	*addr = (unsigned long)plt;
	return true;
}

#ifdef CONFIG_DYNAMIC_FTRACE_WITH_CALL_OPS
static const struct ftrace_ops *arm64_rec_get_ops(struct dyn_ftrace *rec)
{
	const struct ftrace_ops *ops = NULL;

	if (rec->flags & FTRACE_FL_CALL_OPS_EN) {
		ops = ftrace_find_unique_ops(rec);
		WARN_ON_ONCE(!ops);
	}

	if (!ops)
		ops = &ftrace_list_ops;

	return ops;
}
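
/*
 * The ops pointer lives in the 8-byte literal built from the two pre-function
 * NOPs. rec->ip points at the `BL <caller>` slot, which is 12 bytes (no BTI)
 * or 16 bytes (BTI) past the literal, so ALIGN_DOWN(rec->ip - 12, 8) recovers
 * the literal's address in either case (see the layouts in
 * ftrace_call_adjust()).
 */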
static int ftrace_rec_set_ops(const struct dyn_ftrace *rec,
			      const struct ftrace_ops *ops)
{
	unsigned long literal = ALIGN_DOWN(rec->ip - 12, 8);

	return aarch64_insn_write_literal_u64((void *)literal,
					      (unsigned long)ops);
}

static int ftrace_rec_set_nop_ops(struct dyn_ftrace *rec)
{
	return ftrace_rec_set_ops(rec, &ftrace_nop_ops);
}

static int ftrace_rec_update_ops(struct dyn_ftrace *rec)
{
	return ftrace_rec_set_ops(rec, arm64_rec_get_ops(rec));
}
#else
static int ftrace_rec_set_nop_ops(struct dyn_ftrace *rec) { return 0; }
static int ftrace_rec_update_ops(struct dyn_ftrace *rec) { return 0; }
#endif

/*
 * Turn on the call to ftrace_caller() in the instrumented function
 */
int ftrace_make_call(struct dyn_ftrace *rec, unsigned long addr)
{
	unsigned long pc = rec->ip;
	u32 old, new;
	int ret;

	ret = ftrace_rec_update_ops(rec);
	if (ret)
		return ret;

	if (!ftrace_find_callable_addr(rec, NULL, &addr))
		return -EINVAL;

	old = aarch64_insn_gen_nop();
	new = aarch64_insn_gen_branch_imm(pc, addr, AARCH64_INSN_BRANCH_LINK);

	return ftrace_modify_code(pc, old, new, true);
}

#ifdef CONFIG_DYNAMIC_FTRACE_WITH_CALL_OPS
int ftrace_modify_call(struct dyn_ftrace *rec, unsigned long old_addr,
		       unsigned long addr)
{
	unsigned long pc = rec->ip;
	u32 old, new;
	int ret;

	ret = ftrace_rec_update_ops(rec);
	if (ret)
		return ret;

	if (!ftrace_find_callable_addr(rec, NULL, &old_addr))
		return -EINVAL;
	if (!ftrace_find_callable_addr(rec, NULL, &addr))
		return -EINVAL;

	old = aarch64_insn_gen_branch_imm(pc, old_addr,
					  AARCH64_INSN_BRANCH_LINK);
	new = aarch64_insn_gen_branch_imm(pc, addr, AARCH64_INSN_BRANCH_LINK);

	return ftrace_modify_code(pc, old, new, true);
}
#endif
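
/*
 * Note: ftrace_make_call() and ftrace_modify_call() both update the ops
 * literal before patching the branch, so by the time a `BL <caller>` becomes
 * live, ftrace_caller can already load a valid ops pointer for the callsite.
 */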

#ifdef CONFIG_DYNAMIC_FTRACE_WITH_ARGS
/*
 * The compiler has inserted two NOPs before the regular function prologue.
 * All instrumented functions follow the AAPCS, so x0-x8 and x19-x30 are live,
 * and x9-x18 are free for our use.
 *
 * At runtime we want to be able to swing a single NOP <-> BL to enable or
 * disable the ftrace call. The BL requires us to save the original LR value,
 * so here we insert a <MOV X9, LR> over the first NOP so the instructions
 * before the regular prologue are:
 *
 * | Compiled | Disabled   | Enabled    |
 * +----------+------------+------------+
 * | NOP      | MOV X9, LR | MOV X9, LR |
 * | NOP      | NOP        | BL <entry> |
 *
 * The LR value will be recovered by ftrace_caller, and restored into LR
 * before returning to the regular function prologue. When a function is not
 * being traced, the MOV is not harmful given x9 is not live per the AAPCS.
 *
 * Note: ftrace_process_locs() has pre-adjusted rec->ip to be the address of
 * the BL.
 */
int ftrace_init_nop(struct module *mod, struct dyn_ftrace *rec)
{
	unsigned long pc = rec->ip - AARCH64_INSN_SIZE;
	u32 old, new;
	int ret;

	ret = ftrace_rec_set_nop_ops(rec);
	if (ret)
		return ret;

	old = aarch64_insn_gen_nop();
	new = aarch64_insn_gen_move_reg(AARCH64_INSN_REG_9,
					AARCH64_INSN_REG_LR,
					AARCH64_INSN_VARIANT_64BIT);
	return ftrace_modify_code(pc, old, new, true);
}
#endif

/*
 * Turn off the call to ftrace_caller() in the instrumented function
 */
int ftrace_make_nop(struct module *mod, struct dyn_ftrace *rec,
		    unsigned long addr)
{
	unsigned long pc = rec->ip;
	u32 old = 0, new;
	int ret;

	new = aarch64_insn_gen_nop();

	ret = ftrace_rec_set_nop_ops(rec);
	if (ret)
		return ret;

	/*
	 * When using mcount, callsites in modules may have been initialized to
	 * call an arbitrary module PLT (which redirects to the _mcount stub)
	 * rather than the ftrace PLT we'll use at runtime (which redirects to
	 * the ftrace trampoline). We can ignore the old PLT when initializing
	 * the callsite.
	 *
	 * Note: 'mod' is only set at module load time.
	 */
	if (!IS_ENABLED(CONFIG_DYNAMIC_FTRACE_WITH_ARGS) && mod)
		return aarch64_insn_patch_text_nosync((void *)pc, new);

	if (!ftrace_find_callable_addr(rec, mod, &addr))
		return -EINVAL;

	old = aarch64_insn_gen_branch_imm(pc, addr, AARCH64_INSN_BRANCH_LINK);

	return ftrace_modify_code(pc, old, new, true);
}

void arch_ftrace_update_code(int command)
{
	command |= FTRACE_MAY_SLEEP;
	ftrace_modify_all_code(command);
}

#ifdef CONFIG_FUNCTION_GRAPH_TRACER
/*
 * The function_graph tracer expects ftrace_return_to_handler() to be called
 * on the way back to the parent. For this purpose, this function is called
 * in _mcount() or ftrace_caller() to replace the return address (*parent) on
 * the call stack with return_to_handler.
 */
void prepare_ftrace_return(unsigned long self_addr, unsigned long *parent,
			   unsigned long frame_pointer)
{
	unsigned long return_hooker = (unsigned long)&return_to_handler;
	unsigned long old;

	if (unlikely(atomic_read(&current->tracing_graph_pause)))
		return;

	/*
	 * Note:
	 * No protection against faulting at *parent, which may be seen
	 * on other archs. It's unlikely on AArch64.
	 */
	old = *parent;

	if (!function_graph_enter(old, self_addr, frame_pointer,
				  (void *)frame_pointer)) {
		*parent = return_hooker;
	}
}

#ifdef CONFIG_DYNAMIC_FTRACE_WITH_ARGS
void ftrace_graph_func(unsigned long ip, unsigned long parent_ip,
		       struct ftrace_ops *op, struct ftrace_regs *fregs)
{
	unsigned long return_hooker = (unsigned long)&return_to_handler;
	unsigned long frame_pointer = arch_ftrace_regs(fregs)->fp;
	unsigned long *parent = &arch_ftrace_regs(fregs)->lr;
	unsigned long old;

	if (unlikely(atomic_read(&current->tracing_graph_pause)))
		return;

	old = *parent;

	if (!function_graph_enter_regs(old, ip, frame_pointer,
				       (void *)frame_pointer, fregs)) {
		*parent = return_hooker;
	}
}
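
/*
 * With DYNAMIC_FTRACE_WITH_ARGS, graph tracing needs no text patching of its
 * own: ftrace_graph_func() above simply rewrites the LR slot in the
 * ftrace_regs saved by ftrace_caller. Otherwise, the ftrace_graph_call site
 * in ftrace_caller() is patched between a NOP and a branch to
 * ftrace_graph_caller(), as below.
 */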
#else
/*
 * Turn on/off the call to ftrace_graph_caller() in ftrace_caller()
 * depending on @enable.
 */
static int ftrace_modify_graph_caller(bool enable)
{
	unsigned long pc = (unsigned long)&ftrace_graph_call;
	u32 branch, nop;

	branch = aarch64_insn_gen_branch_imm(pc,
					     (unsigned long)ftrace_graph_caller,
					     AARCH64_INSN_BRANCH_NOLINK);
	nop = aarch64_insn_gen_nop();

	if (enable)
		return ftrace_modify_code(pc, nop, branch, true);
	else
		return ftrace_modify_code(pc, branch, nop, true);
}

int ftrace_enable_ftrace_graph_caller(void)
{
	return ftrace_modify_graph_caller(true);
}

int ftrace_disable_ftrace_graph_caller(void)
{
	return ftrace_modify_graph_caller(false);
}
#endif /* CONFIG_DYNAMIC_FTRACE_WITH_ARGS */
#endif /* CONFIG_FUNCTION_GRAPH_TRACER */