1 // SPDX-License-Identifier: GPL-2.0-or-later 2 /* Kernel module help for PPC64. 3 Copyright (C) 2001, 2003 Rusty Russell IBM Corporation. 4 5 */ 6 7 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 8 9 #include <linux/module.h> 10 #include <linux/elf.h> 11 #include <linux/moduleloader.h> 12 #include <linux/err.h> 13 #include <linux/vmalloc.h> 14 #include <linux/ftrace.h> 15 #include <linux/bug.h> 16 #include <linux/uaccess.h> 17 #include <linux/kernel.h> 18 #include <asm/module.h> 19 #include <asm/firmware.h> 20 #include <asm/code-patching.h> 21 #include <linux/sort.h> 22 #include <asm/setup.h> 23 #include <asm/sections.h> 24 #include <asm/inst.h> 25 26 /* FIXME: We don't do .init separately. To do this, we'd need to have 27 a separate r2 value in the init and core section, and stub between 28 them, too. 29 30 Using a magic allocator which places modules within 32MB solves 31 this, and makes other things simpler. Anton? 32 --RR. */ 33 34 bool module_elf_check_arch(Elf_Ehdr *hdr) 35 { 36 unsigned long abi_level = hdr->e_flags & 0x3; 37 38 if (IS_ENABLED(CONFIG_PPC64_ELF_ABI_V2)) 39 return abi_level == 2; 40 else 41 return abi_level < 2; 42 } 43 44 #ifdef CONFIG_PPC64_ELF_ABI_V2 45 46 static func_desc_t func_desc(unsigned long addr) 47 { 48 func_desc_t desc = { 49 .addr = addr, 50 }; 51 52 return desc; 53 } 54 55 /* PowerPC64 specific values for the Elf64_Sym st_other field. */ 56 #define STO_PPC64_LOCAL_BIT 5 57 #define STO_PPC64_LOCAL_MASK (7 << STO_PPC64_LOCAL_BIT) 58 #define PPC64_LOCAL_ENTRY_OFFSET(other) \ 59 (((1 << (((other) & STO_PPC64_LOCAL_MASK) >> STO_PPC64_LOCAL_BIT)) >> 2) << 2) 60 61 static unsigned int local_entry_offset(const Elf64_Sym *sym) 62 { 63 /* sym->st_other indicates offset to local entry point 64 * (otherwise it will assume r12 is the address of the start 65 * of function and try to derive r2 from it). */ 66 return PPC64_LOCAL_ENTRY_OFFSET(sym->st_other); 67 } 68 #else 69 70 static func_desc_t func_desc(unsigned long addr) 71 { 72 return *(struct func_desc *)addr; 73 } 74 static unsigned int local_entry_offset(const Elf64_Sym *sym) 75 { 76 return 0; 77 } 78 79 void *dereference_module_function_descriptor(struct module *mod, void *ptr) 80 { 81 if (ptr < (void *)mod->arch.start_opd || 82 ptr >= (void *)mod->arch.end_opd) 83 return ptr; 84 85 return dereference_function_descriptor(ptr); 86 } 87 #endif 88 89 static unsigned long func_addr(unsigned long addr) 90 { 91 return func_desc(addr).addr; 92 } 93 94 static unsigned long stub_func_addr(func_desc_t func) 95 { 96 return func.addr; 97 } 98 99 #define STUB_MAGIC 0x73747562 /* stub */ 100 101 /* Like PPC32, we need little trampolines to do > 24-bit jumps (into 102 the kernel itself). But on PPC64, these need to be used for every 103 jump, actually, to reset r2 (TOC+0x8000). */ 104 struct ppc64_stub_entry { 105 /* 106 * 28 byte jump instruction sequence (7 instructions) that can 107 * hold ppc64_stub_insns or stub_insns. Must be 8-byte aligned 108 * with PCREL kernels that use prefix instructions in the stub. 109 */ 110 u32 jump[7]; 111 /* Used by ftrace to identify stubs */ 112 u32 magic; 113 /* Data for the above code */ 114 func_desc_t funcdata; 115 } __aligned(8); 116 117 struct ppc64_got_entry { 118 u64 addr; 119 }; 120 121 /* 122 * PPC64 uses 24 bit jumps, but we need to jump into other modules or 123 * the kernel which may be further. So we jump to a stub. 124 * 125 * Target address and TOC are loaded from function descriptor in the 126 * ppc64_stub_entry. 127 * 128 * r12 is used to generate the target address, which is required for the 129 * ELFv2 global entry point calling convention. 130 * 131 * TOC handling: 132 * - PCREL does not have a TOC. 133 * - ELFv2 non-PCREL just has to save r2, the callee is responsible for 134 * setting its own TOC pointer at the global entry address. 135 * - ELFv1 must load the new TOC pointer from the function descriptor. 136 */ 137 static u32 ppc64_stub_insns[] = { 138 #ifdef CONFIG_PPC_KERNEL_PCREL 139 /* pld r12,addr */ 140 PPC_PREFIX_8LS | __PPC_PRFX_R(1), 141 PPC_INST_PLD | ___PPC_RT(_R12), 142 #else 143 PPC_RAW_ADDIS(_R11, _R2, 0), 144 PPC_RAW_ADDI(_R11, _R11, 0), 145 /* Save current r2 value in magic place on the stack. */ 146 PPC_RAW_STD(_R2, _R1, R2_STACK_OFFSET), 147 PPC_RAW_LD(_R12, _R11, 32), 148 #ifdef CONFIG_PPC64_ELF_ABI_V1 149 /* Set up new r2 from function descriptor */ 150 PPC_RAW_LD(_R2, _R11, 40), 151 #endif 152 #endif 153 PPC_RAW_MTCTR(_R12), 154 PPC_RAW_BCTR(), 155 }; 156 157 /* 158 * Count how many different r_type relocations (different symbol, 159 * different addend). 160 */ 161 static unsigned int count_relocs(const Elf64_Rela *rela, unsigned int num, 162 unsigned long r_type) 163 { 164 unsigned int i, r_info, r_addend, _count_relocs; 165 166 /* FIXME: Only count external ones --RR */ 167 _count_relocs = 0; 168 r_info = 0; 169 r_addend = 0; 170 for (i = 0; i < num; i++) 171 /* Only count r_type relocs, others don't need stubs */ 172 if (ELF64_R_TYPE(rela[i].r_info) == r_type && 173 (r_info != ELF64_R_SYM(rela[i].r_info) || 174 r_addend != rela[i].r_addend)) { 175 _count_relocs++; 176 r_info = ELF64_R_SYM(rela[i].r_info); 177 r_addend = rela[i].r_addend; 178 } 179 180 return _count_relocs; 181 } 182 183 static int relacmp(const void *_x, const void *_y) 184 { 185 const Elf64_Rela *x, *y; 186 187 y = (Elf64_Rela *)_x; 188 x = (Elf64_Rela *)_y; 189 190 /* Compare the entire r_info (as opposed to ELF64_R_SYM(r_info) only) to 191 * make the comparison cheaper/faster. It won't affect the sorting or 192 * the counting algorithms' performance 193 */ 194 if (x->r_info < y->r_info) 195 return -1; 196 else if (x->r_info > y->r_info) 197 return 1; 198 else if (x->r_addend < y->r_addend) 199 return -1; 200 else if (x->r_addend > y->r_addend) 201 return 1; 202 else 203 return 0; 204 } 205 206 /* Get size of potential trampolines required. */ 207 static unsigned long get_stubs_size(const Elf64_Ehdr *hdr, 208 const Elf64_Shdr *sechdrs) 209 { 210 /* One extra reloc so it's always 0-addr terminated */ 211 unsigned long relocs = 1; 212 unsigned i; 213 214 /* Every relocated section... */ 215 for (i = 1; i < hdr->e_shnum; i++) { 216 if (sechdrs[i].sh_type == SHT_RELA) { 217 pr_debug("Found relocations in section %u\n", i); 218 pr_debug("Ptr: %p. Number: %Lu\n", 219 (void *)sechdrs[i].sh_addr, 220 sechdrs[i].sh_size / sizeof(Elf64_Rela)); 221 222 /* Sort the relocation information based on a symbol and 223 * addend key. This is a stable O(n*log n) complexity 224 * algorithm but it will reduce the complexity of 225 * count_relocs() to linear complexity O(n) 226 */ 227 sort((void *)sechdrs[i].sh_addr, 228 sechdrs[i].sh_size / sizeof(Elf64_Rela), 229 sizeof(Elf64_Rela), relacmp, NULL); 230 231 relocs += count_relocs((void *)sechdrs[i].sh_addr, 232 sechdrs[i].sh_size 233 / sizeof(Elf64_Rela), 234 R_PPC_REL24); 235 #ifdef CONFIG_PPC_KERNEL_PCREL 236 relocs += count_relocs((void *)sechdrs[i].sh_addr, 237 sechdrs[i].sh_size 238 / sizeof(Elf64_Rela), 239 R_PPC64_REL24_NOTOC); 240 #endif 241 } 242 } 243 244 #ifdef CONFIG_DYNAMIC_FTRACE 245 /* make the trampoline to the ftrace_caller */ 246 relocs++; 247 #ifdef CONFIG_DYNAMIC_FTRACE_WITH_REGS 248 /* an additional one for ftrace_regs_caller */ 249 relocs++; 250 #endif 251 #endif 252 253 pr_debug("Looks like a total of %lu stubs, max\n", relocs); 254 return relocs * sizeof(struct ppc64_stub_entry); 255 } 256 257 #ifdef CONFIG_PPC_KERNEL_PCREL 258 static int count_pcpu_relocs(const Elf64_Shdr *sechdrs, 259 const Elf64_Rela *rela, unsigned int num, 260 unsigned int symindex, unsigned int pcpu) 261 { 262 unsigned int i, r_info, r_addend, _count_relocs; 263 264 _count_relocs = 0; 265 r_info = 0; 266 r_addend = 0; 267 268 for (i = 0; i < num; i++) { 269 Elf64_Sym *sym; 270 271 /* This is the symbol it is referring to */ 272 sym = (Elf64_Sym *)sechdrs[symindex].sh_addr 273 + ELF64_R_SYM(rela[i].r_info); 274 275 if (sym->st_shndx == pcpu && 276 (r_info != ELF64_R_SYM(rela[i].r_info) || 277 r_addend != rela[i].r_addend)) { 278 _count_relocs++; 279 r_info = ELF64_R_SYM(rela[i].r_info); 280 r_addend = rela[i].r_addend; 281 } 282 } 283 284 return _count_relocs; 285 } 286 287 /* Get size of potential GOT required. */ 288 static unsigned long get_got_size(const Elf64_Ehdr *hdr, 289 const Elf64_Shdr *sechdrs, 290 struct module *me) 291 { 292 /* One extra reloc so it's always 0-addr terminated */ 293 unsigned long relocs = 1; 294 unsigned int i, symindex = 0; 295 296 for (i = 1; i < hdr->e_shnum; i++) { 297 if (sechdrs[i].sh_type == SHT_SYMTAB) { 298 symindex = i; 299 break; 300 } 301 } 302 WARN_ON_ONCE(!symindex); 303 304 /* Every relocated section... */ 305 for (i = 1; i < hdr->e_shnum; i++) { 306 if (sechdrs[i].sh_type == SHT_RELA) { 307 pr_debug("Found relocations in section %u\n", i); 308 pr_debug("Ptr: %p. Number: %llu\n", (void *)sechdrs[i].sh_addr, 309 sechdrs[i].sh_size / sizeof(Elf64_Rela)); 310 311 /* 312 * Sort the relocation information based on a symbol and 313 * addend key. This is a stable O(n*log n) complexity 314 * algorithm but it will reduce the complexity of 315 * count_relocs() to linear complexity O(n) 316 */ 317 sort((void *)sechdrs[i].sh_addr, 318 sechdrs[i].sh_size / sizeof(Elf64_Rela), 319 sizeof(Elf64_Rela), relacmp, NULL); 320 321 relocs += count_relocs((void *)sechdrs[i].sh_addr, 322 sechdrs[i].sh_size 323 / sizeof(Elf64_Rela), 324 R_PPC64_GOT_PCREL34); 325 326 /* 327 * Percpu data access typically gets linked with 328 * REL34 relocations, but the percpu section gets 329 * moved at load time and requires that to be 330 * converted to GOT linkage. 331 */ 332 if (IS_ENABLED(CONFIG_SMP) && symindex) 333 relocs += count_pcpu_relocs(sechdrs, 334 (void *)sechdrs[i].sh_addr, 335 sechdrs[i].sh_size 336 / sizeof(Elf64_Rela), 337 symindex, me->arch.pcpu_section); 338 } 339 } 340 341 pr_debug("Looks like a total of %lu GOT entries, max\n", relocs); 342 return relocs * sizeof(struct ppc64_got_entry); 343 } 344 #else /* CONFIG_PPC_KERNEL_PCREL */ 345 346 /* Still needed for ELFv2, for .TOC. */ 347 static void dedotify_versions(struct modversion_info *vers, 348 unsigned long size) 349 { 350 struct modversion_info *end; 351 352 for (end = (void *)vers + size; vers < end; vers++) 353 if (vers->name[0] == '.') { 354 memmove(vers->name, vers->name+1, strlen(vers->name)); 355 } 356 } 357 358 /* 359 * Undefined symbols which refer to .funcname, hack to funcname. Make .TOC. 360 * seem to be defined (value set later). 361 */ 362 static void dedotify(Elf64_Sym *syms, unsigned int numsyms, char *strtab) 363 { 364 unsigned int i; 365 366 for (i = 1; i < numsyms; i++) { 367 if (syms[i].st_shndx == SHN_UNDEF) { 368 char *name = strtab + syms[i].st_name; 369 if (name[0] == '.') { 370 if (strcmp(name+1, "TOC.") == 0) 371 syms[i].st_shndx = SHN_ABS; 372 syms[i].st_name++; 373 } 374 } 375 } 376 } 377 378 static Elf64_Sym *find_dot_toc(Elf64_Shdr *sechdrs, 379 const char *strtab, 380 unsigned int symindex) 381 { 382 unsigned int i, numsyms; 383 Elf64_Sym *syms; 384 385 syms = (Elf64_Sym *)sechdrs[symindex].sh_addr; 386 numsyms = sechdrs[symindex].sh_size / sizeof(Elf64_Sym); 387 388 for (i = 1; i < numsyms; i++) { 389 if (syms[i].st_shndx == SHN_ABS 390 && strcmp(strtab + syms[i].st_name, "TOC.") == 0) 391 return &syms[i]; 392 } 393 return NULL; 394 } 395 #endif /* CONFIG_PPC_KERNEL_PCREL */ 396 397 bool module_init_section(const char *name) 398 { 399 /* We don't handle .init for the moment: always return false. */ 400 return false; 401 } 402 403 int module_frob_arch_sections(Elf64_Ehdr *hdr, 404 Elf64_Shdr *sechdrs, 405 char *secstrings, 406 struct module *me) 407 { 408 unsigned int i; 409 410 /* Find .toc and .stubs sections, symtab and strtab */ 411 for (i = 1; i < hdr->e_shnum; i++) { 412 if (strcmp(secstrings + sechdrs[i].sh_name, ".stubs") == 0) 413 me->arch.stubs_section = i; 414 #ifdef CONFIG_PPC_KERNEL_PCREL 415 else if (strcmp(secstrings + sechdrs[i].sh_name, ".data..percpu") == 0) 416 me->arch.pcpu_section = i; 417 else if (strcmp(secstrings + sechdrs[i].sh_name, ".mygot") == 0) { 418 me->arch.got_section = i; 419 if (sechdrs[i].sh_addralign < 8) 420 sechdrs[i].sh_addralign = 8; 421 } 422 #else 423 else if (strcmp(secstrings + sechdrs[i].sh_name, ".toc") == 0) { 424 me->arch.toc_section = i; 425 if (sechdrs[i].sh_addralign < 8) 426 sechdrs[i].sh_addralign = 8; 427 } 428 else if (strcmp(secstrings+sechdrs[i].sh_name,"__versions")==0) 429 dedotify_versions((void *)hdr + sechdrs[i].sh_offset, 430 sechdrs[i].sh_size); 431 432 if (sechdrs[i].sh_type == SHT_SYMTAB) 433 dedotify((void *)hdr + sechdrs[i].sh_offset, 434 sechdrs[i].sh_size / sizeof(Elf64_Sym), 435 (void *)hdr 436 + sechdrs[sechdrs[i].sh_link].sh_offset); 437 #endif 438 } 439 440 if (!me->arch.stubs_section) { 441 pr_err("%s: doesn't contain .stubs.\n", me->name); 442 return -ENOEXEC; 443 } 444 445 #ifdef CONFIG_PPC_KERNEL_PCREL 446 if (!me->arch.got_section) { 447 pr_err("%s: doesn't contain .mygot.\n", me->name); 448 return -ENOEXEC; 449 } 450 451 /* Override the got size */ 452 sechdrs[me->arch.got_section].sh_size = get_got_size(hdr, sechdrs, me); 453 #else 454 /* If we don't have a .toc, just use .stubs. We need to set r2 455 to some reasonable value in case the module calls out to 456 other functions via a stub, or if a function pointer escapes 457 the module by some means. */ 458 if (!me->arch.toc_section) 459 me->arch.toc_section = me->arch.stubs_section; 460 #endif 461 462 /* Override the stubs size */ 463 sechdrs[me->arch.stubs_section].sh_size = get_stubs_size(hdr, sechdrs); 464 465 return 0; 466 } 467 468 #if defined(CONFIG_MPROFILE_KERNEL) || defined(CONFIG_ARCH_USING_PATCHABLE_FUNCTION_ENTRY) 469 470 static u32 stub_insns[] = { 471 #ifdef CONFIG_PPC_KERNEL_PCREL 472 PPC_RAW_LD(_R12, _R13, offsetof(struct paca_struct, kernelbase)), 473 PPC_RAW_NOP(), /* align the prefix insn */ 474 /* paddi r12,r12,addr */ 475 PPC_PREFIX_MLS | __PPC_PRFX_R(0), 476 PPC_INST_PADDI | ___PPC_RT(_R12) | ___PPC_RA(_R12), 477 PPC_RAW_MTCTR(_R12), 478 PPC_RAW_BCTR(), 479 #else 480 PPC_RAW_LD(_R12, _R13, offsetof(struct paca_struct, kernel_toc)), 481 PPC_RAW_ADDIS(_R12, _R12, 0), 482 PPC_RAW_ADDI(_R12, _R12, 0), 483 PPC_RAW_MTCTR(_R12), 484 PPC_RAW_BCTR(), 485 #endif 486 }; 487 488 /* 489 * For mprofile-kernel we use a special stub for ftrace_caller() because we 490 * can't rely on r2 containing this module's TOC when we enter the stub. 491 * 492 * That can happen if the function calling us didn't need to use the toc. In 493 * that case it won't have setup r2, and the r2 value will be either the 494 * kernel's toc, or possibly another modules toc. 495 * 496 * To deal with that this stub uses the kernel toc, which is always accessible 497 * via the paca (in r13). The target (ftrace_caller()) is responsible for 498 * saving and restoring the toc before returning. 499 */ 500 static inline int create_ftrace_stub(struct ppc64_stub_entry *entry, 501 unsigned long addr, 502 struct module *me) 503 { 504 long reladdr; 505 506 if ((unsigned long)entry->jump % 8 != 0) { 507 pr_err("%s: Address of stub entry is not 8-byte aligned\n", me->name); 508 return 0; 509 } 510 511 BUILD_BUG_ON(sizeof(stub_insns) > sizeof(entry->jump)); 512 memcpy(entry->jump, stub_insns, sizeof(stub_insns)); 513 514 if (IS_ENABLED(CONFIG_PPC_KERNEL_PCREL)) { 515 /* Stub uses address relative to kernel base (from the paca) */ 516 reladdr = addr - local_paca->kernelbase; 517 if (reladdr > 0x1FFFFFFFFL || reladdr < -0x200000000L) { 518 pr_err("%s: Address of %ps out of range of 34-bit relative address.\n", 519 me->name, (void *)addr); 520 return 0; 521 } 522 523 entry->jump[2] |= IMM_H18(reladdr); 524 entry->jump[3] |= IMM_L(reladdr); 525 } else { 526 /* Stub uses address relative to kernel toc (from the paca) */ 527 reladdr = addr - kernel_toc_addr(); 528 if (reladdr > 0x7FFFFFFF || reladdr < -(0x80000000L)) { 529 pr_err("%s: Address of %ps out of range of kernel_toc.\n", 530 me->name, (void *)addr); 531 return 0; 532 } 533 534 entry->jump[1] |= PPC_HA(reladdr); 535 entry->jump[2] |= PPC_LO(reladdr); 536 } 537 538 /* Even though we don't use funcdata in the stub, it's needed elsewhere. */ 539 entry->funcdata = func_desc(addr); 540 entry->magic = STUB_MAGIC; 541 542 return 1; 543 } 544 545 static bool is_mprofile_ftrace_call(const char *name) 546 { 547 if (!strcmp("_mcount", name)) 548 return true; 549 #ifdef CONFIG_DYNAMIC_FTRACE 550 if (!strcmp("ftrace_caller", name)) 551 return true; 552 #ifdef CONFIG_DYNAMIC_FTRACE_WITH_REGS 553 if (!strcmp("ftrace_regs_caller", name)) 554 return true; 555 #endif 556 #endif 557 558 return false; 559 } 560 #else 561 static inline int create_ftrace_stub(struct ppc64_stub_entry *entry, 562 unsigned long addr, 563 struct module *me) 564 { 565 return 0; 566 } 567 568 static bool is_mprofile_ftrace_call(const char *name) 569 { 570 return false; 571 } 572 #endif 573 574 /* 575 * r2 is the TOC pointer: it actually points 0x8000 into the TOC (this gives the 576 * value maximum span in an instruction which uses a signed offset). Round down 577 * to a 256 byte boundary for the odd case where we are setting up r2 without a 578 * .toc section. 579 */ 580 static inline unsigned long my_r2(const Elf64_Shdr *sechdrs, struct module *me) 581 { 582 #ifndef CONFIG_PPC_KERNEL_PCREL 583 return (sechdrs[me->arch.toc_section].sh_addr & ~0xfful) + 0x8000; 584 #else 585 return -1; 586 #endif 587 } 588 589 /* Patch stub to reference function and correct r2 value. */ 590 static inline int create_stub(const Elf64_Shdr *sechdrs, 591 struct ppc64_stub_entry *entry, 592 unsigned long addr, 593 struct module *me, 594 const char *name) 595 { 596 long reladdr; 597 func_desc_t desc; 598 int i; 599 600 if (is_mprofile_ftrace_call(name)) 601 return create_ftrace_stub(entry, addr, me); 602 603 if ((unsigned long)entry->jump % 8 != 0) { 604 pr_err("%s: Address of stub entry is not 8-byte aligned\n", me->name); 605 return 0; 606 } 607 608 BUILD_BUG_ON(sizeof(ppc64_stub_insns) > sizeof(entry->jump)); 609 for (i = 0; i < ARRAY_SIZE(ppc64_stub_insns); i++) { 610 if (patch_instruction(&entry->jump[i], 611 ppc_inst(ppc64_stub_insns[i]))) 612 return 0; 613 } 614 615 if (IS_ENABLED(CONFIG_PPC_KERNEL_PCREL)) { 616 /* Stub uses address relative to itself! */ 617 reladdr = 0 + offsetof(struct ppc64_stub_entry, funcdata); 618 BUILD_BUG_ON(reladdr != 32); 619 if (reladdr > 0x1FFFFFFFFL || reladdr < -0x200000000L) { 620 pr_err("%s: Address of %p out of range of 34-bit relative address.\n", 621 me->name, (void *)reladdr); 622 return 0; 623 } 624 pr_debug("Stub %p get data from reladdr %li\n", entry, reladdr); 625 626 /* May not even need this if we're relative to 0 */ 627 if (patch_instruction(&entry->jump[0], 628 ppc_inst_prefix(entry->jump[0] | IMM_H18(reladdr), 629 entry->jump[1] | IMM_L(reladdr)))) 630 return 0; 631 632 } else { 633 /* Stub uses address relative to r2. */ 634 reladdr = (unsigned long)entry - my_r2(sechdrs, me); 635 if (reladdr > 0x7FFFFFFF || reladdr < -(0x80000000L)) { 636 pr_err("%s: Address %p of stub out of range of %p.\n", 637 me->name, (void *)reladdr, (void *)my_r2); 638 return 0; 639 } 640 pr_debug("Stub %p get data from reladdr %li\n", entry, reladdr); 641 642 if (patch_instruction(&entry->jump[0], 643 ppc_inst(entry->jump[0] | PPC_HA(reladdr)))) 644 return 0; 645 646 if (patch_instruction(&entry->jump[1], 647 ppc_inst(entry->jump[1] | PPC_LO(reladdr)))) 648 return 0; 649 } 650 651 // func_desc_t is 8 bytes if ABIv2, else 16 bytes 652 desc = func_desc(addr); 653 for (i = 0; i < sizeof(func_desc_t) / sizeof(u32); i++) { 654 if (patch_u32(((u32 *)&entry->funcdata) + i, ((u32 *)&desc)[i])) 655 return 0; 656 } 657 658 if (patch_u32(&entry->magic, STUB_MAGIC)) 659 return 0; 660 661 return 1; 662 } 663 664 /* Create stub to jump to function described in this OPD/ptr: we need the 665 stub to set up the TOC ptr (r2) for the function. */ 666 static unsigned long stub_for_addr(const Elf64_Shdr *sechdrs, 667 unsigned long addr, 668 struct module *me, 669 const char *name) 670 { 671 struct ppc64_stub_entry *stubs; 672 unsigned int i, num_stubs; 673 674 num_stubs = sechdrs[me->arch.stubs_section].sh_size / sizeof(*stubs); 675 676 /* Find this stub, or if that fails, the next avail. entry */ 677 stubs = (void *)sechdrs[me->arch.stubs_section].sh_addr; 678 for (i = 0; stub_func_addr(stubs[i].funcdata); i++) { 679 if (WARN_ON(i >= num_stubs)) 680 return 0; 681 682 if (stub_func_addr(stubs[i].funcdata) == func_addr(addr)) 683 return (unsigned long)&stubs[i]; 684 } 685 686 if (!create_stub(sechdrs, &stubs[i], addr, me, name)) 687 return 0; 688 689 return (unsigned long)&stubs[i]; 690 } 691 692 #ifdef CONFIG_PPC_KERNEL_PCREL 693 /* Create GOT to load the location described in this ptr */ 694 static unsigned long got_for_addr(const Elf64_Shdr *sechdrs, 695 unsigned long addr, 696 struct module *me, 697 const char *name) 698 { 699 struct ppc64_got_entry *got; 700 unsigned int i, num_got; 701 702 if (!IS_ENABLED(CONFIG_PPC_KERNEL_PCREL)) 703 return addr; 704 705 num_got = sechdrs[me->arch.got_section].sh_size / sizeof(*got); 706 707 /* Find this stub, or if that fails, the next avail. entry */ 708 got = (void *)sechdrs[me->arch.got_section].sh_addr; 709 for (i = 0; got[i].addr; i++) { 710 if (WARN_ON(i >= num_got)) 711 return 0; 712 713 if (got[i].addr == addr) 714 return (unsigned long)&got[i]; 715 } 716 717 got[i].addr = addr; 718 719 return (unsigned long)&got[i]; 720 } 721 #endif 722 723 /* We expect a noop next: if it is, replace it with instruction to 724 restore r2. */ 725 static int restore_r2(const char *name, u32 *instruction, struct module *me) 726 { 727 u32 *prev_insn = instruction - 1; 728 u32 insn_val = *instruction; 729 730 if (IS_ENABLED(CONFIG_PPC_KERNEL_PCREL)) 731 return 0; 732 733 if (is_mprofile_ftrace_call(name)) 734 return 0; 735 736 /* 737 * Make sure the branch isn't a sibling call. Sibling calls aren't 738 * "link" branches and they don't return, so they don't need the r2 739 * restore afterwards. 740 */ 741 if (!instr_is_relative_link_branch(ppc_inst(*prev_insn))) 742 return 0; 743 744 /* 745 * For livepatch, the restore r2 instruction might have already been 746 * written previously, if the referenced symbol is in a previously 747 * unloaded module which is now being loaded again. In that case, skip 748 * the warning and the instruction write. 749 */ 750 if (insn_val == PPC_INST_LD_TOC) 751 return 0; 752 753 if (insn_val != PPC_RAW_NOP()) { 754 pr_err("%s: Expected nop after call, got %08x at %pS\n", 755 me->name, insn_val, instruction); 756 return -ENOEXEC; 757 } 758 759 /* ld r2,R2_STACK_OFFSET(r1) */ 760 return patch_instruction(instruction, ppc_inst(PPC_INST_LD_TOC)); 761 } 762 763 int apply_relocate_add(Elf64_Shdr *sechdrs, 764 const char *strtab, 765 unsigned int symindex, 766 unsigned int relsec, 767 struct module *me) 768 { 769 unsigned int i; 770 Elf64_Rela *rela = (void *)sechdrs[relsec].sh_addr; 771 Elf64_Sym *sym; 772 unsigned long *location; 773 unsigned long value; 774 775 pr_debug("Applying ADD relocate section %u to %u\n", relsec, 776 sechdrs[relsec].sh_info); 777 778 #ifndef CONFIG_PPC_KERNEL_PCREL 779 /* First time we're called, we can fix up .TOC. */ 780 if (!me->arch.toc_fixed) { 781 sym = find_dot_toc(sechdrs, strtab, symindex); 782 /* It's theoretically possible that a module doesn't want a 783 * .TOC. so don't fail it just for that. */ 784 if (sym) 785 sym->st_value = my_r2(sechdrs, me); 786 me->arch.toc_fixed = true; 787 } 788 #endif 789 for (i = 0; i < sechdrs[relsec].sh_size / sizeof(*rela); i++) { 790 /* This is where to make the change */ 791 location = (void *)sechdrs[sechdrs[relsec].sh_info].sh_addr 792 + rela[i].r_offset; 793 /* This is the symbol it is referring to */ 794 sym = (Elf64_Sym *)sechdrs[symindex].sh_addr 795 + ELF64_R_SYM(rela[i].r_info); 796 797 pr_debug("RELOC at %p: %li-type as %s (0x%lx) + %li\n", 798 location, (long)ELF64_R_TYPE(rela[i].r_info), 799 strtab + sym->st_name, (unsigned long)sym->st_value, 800 (long)rela[i].r_addend); 801 802 /* `Everything is relative'. */ 803 value = sym->st_value + rela[i].r_addend; 804 805 switch (ELF64_R_TYPE(rela[i].r_info)) { 806 case R_PPC64_ADDR32: 807 /* Simply set it */ 808 *(u32 *)location = value; 809 break; 810 811 case R_PPC64_ADDR64: 812 /* Simply set it */ 813 *(unsigned long *)location = value; 814 break; 815 816 #ifndef CONFIG_PPC_KERNEL_PCREL 817 case R_PPC64_TOC: 818 *(unsigned long *)location = my_r2(sechdrs, me); 819 break; 820 821 case R_PPC64_TOC16: 822 /* Subtract TOC pointer */ 823 value -= my_r2(sechdrs, me); 824 if (value + 0x8000 > 0xffff) { 825 pr_err("%s: bad TOC16 relocation (0x%lx)\n", 826 me->name, value); 827 return -ENOEXEC; 828 } 829 *((uint16_t *) location) 830 = (*((uint16_t *) location) & ~0xffff) 831 | (value & 0xffff); 832 break; 833 834 case R_PPC64_TOC16_LO: 835 /* Subtract TOC pointer */ 836 value -= my_r2(sechdrs, me); 837 *((uint16_t *) location) 838 = (*((uint16_t *) location) & ~0xffff) 839 | (value & 0xffff); 840 break; 841 842 case R_PPC64_TOC16_DS: 843 /* Subtract TOC pointer */ 844 value -= my_r2(sechdrs, me); 845 if ((value & 3) != 0 || value + 0x8000 > 0xffff) { 846 pr_err("%s: bad TOC16_DS relocation (0x%lx)\n", 847 me->name, value); 848 return -ENOEXEC; 849 } 850 *((uint16_t *) location) 851 = (*((uint16_t *) location) & ~0xfffc) 852 | (value & 0xfffc); 853 break; 854 855 case R_PPC64_TOC16_LO_DS: 856 /* Subtract TOC pointer */ 857 value -= my_r2(sechdrs, me); 858 if ((value & 3) != 0) { 859 pr_err("%s: bad TOC16_LO_DS relocation (0x%lx)\n", 860 me->name, value); 861 return -ENOEXEC; 862 } 863 *((uint16_t *) location) 864 = (*((uint16_t *) location) & ~0xfffc) 865 | (value & 0xfffc); 866 break; 867 868 case R_PPC64_TOC16_HA: 869 /* Subtract TOC pointer */ 870 value -= my_r2(sechdrs, me); 871 value = ((value + 0x8000) >> 16); 872 *((uint16_t *) location) 873 = (*((uint16_t *) location) & ~0xffff) 874 | (value & 0xffff); 875 break; 876 #endif 877 878 case R_PPC_REL24: 879 #ifdef CONFIG_PPC_KERNEL_PCREL 880 /* PCREL still generates REL24 for mcount */ 881 case R_PPC64_REL24_NOTOC: 882 #endif 883 /* FIXME: Handle weak symbols here --RR */ 884 if (sym->st_shndx == SHN_UNDEF || 885 sym->st_shndx == SHN_LIVEPATCH) { 886 /* External: go via stub */ 887 value = stub_for_addr(sechdrs, value, me, 888 strtab + sym->st_name); 889 if (!value) 890 return -ENOENT; 891 if (restore_r2(strtab + sym->st_name, 892 (u32 *)location + 1, me)) 893 return -ENOEXEC; 894 } else 895 value += local_entry_offset(sym); 896 897 /* Convert value to relative */ 898 value -= (unsigned long)location; 899 if (value + 0x2000000 > 0x3ffffff || (value & 3) != 0){ 900 pr_err("%s: REL24 %li out of range!\n", 901 me->name, (long int)value); 902 return -ENOEXEC; 903 } 904 905 /* Only replace bits 2 through 26 */ 906 value = (*(uint32_t *)location & ~PPC_LI_MASK) | PPC_LI(value); 907 908 if (patch_instruction((u32 *)location, ppc_inst(value))) 909 return -EFAULT; 910 911 break; 912 913 case R_PPC64_REL64: 914 /* 64 bits relative (used by features fixups) */ 915 *location = value - (unsigned long)location; 916 break; 917 918 case R_PPC64_REL32: 919 /* 32 bits relative (used by relative exception tables) */ 920 /* Convert value to relative */ 921 value -= (unsigned long)location; 922 if (value + 0x80000000 > 0xffffffff) { 923 pr_err("%s: REL32 %li out of range!\n", 924 me->name, (long int)value); 925 return -ENOEXEC; 926 } 927 *(u32 *)location = value; 928 break; 929 930 #ifdef CONFIG_PPC_KERNEL_PCREL 931 case R_PPC64_PCREL34: { 932 unsigned long absvalue = value; 933 934 /* Convert value to relative */ 935 value -= (unsigned long)location; 936 937 if (value + 0x200000000 > 0x3ffffffff) { 938 if (sym->st_shndx != me->arch.pcpu_section) { 939 pr_err("%s: REL34 %li out of range!\n", 940 me->name, (long)value); 941 return -ENOEXEC; 942 } 943 944 /* 945 * per-cpu section is special cased because 946 * it is moved during loading, so has to be 947 * converted to use GOT. 948 */ 949 value = got_for_addr(sechdrs, absvalue, me, 950 strtab + sym->st_name); 951 if (!value) 952 return -ENOENT; 953 value -= (unsigned long)location; 954 955 /* Turn pla into pld */ 956 if (patch_instruction((u32 *)location, 957 ppc_inst_prefix((*(u32 *)location & ~0x02000000), 958 (*((u32 *)location + 1) & ~0xf8000000) | 0xe4000000))) 959 return -EFAULT; 960 } 961 962 if (patch_instruction((u32 *)location, 963 ppc_inst_prefix((*(u32 *)location & ~0x3ffff) | IMM_H18(value), 964 (*((u32 *)location + 1) & ~0xffff) | IMM_L(value)))) 965 return -EFAULT; 966 967 break; 968 } 969 970 #else 971 case R_PPC64_TOCSAVE: 972 /* 973 * Marker reloc indicates we don't have to save r2. 974 * That would only save us one instruction, so ignore 975 * it. 976 */ 977 break; 978 #endif 979 980 case R_PPC64_ENTRY: 981 if (IS_ENABLED(CONFIG_PPC_KERNEL_PCREL)) 982 break; 983 984 /* 985 * Optimize ELFv2 large code model entry point if 986 * the TOC is within 2GB range of current location. 987 */ 988 value = my_r2(sechdrs, me) - (unsigned long)location; 989 if (value + 0x80008000 > 0xffffffff) 990 break; 991 /* 992 * Check for the large code model prolog sequence: 993 * ld r2, ...(r12) 994 * add r2, r2, r12 995 */ 996 if ((((uint32_t *)location)[0] & ~0xfffc) != PPC_RAW_LD(_R2, _R12, 0)) 997 break; 998 if (((uint32_t *)location)[1] != PPC_RAW_ADD(_R2, _R2, _R12)) 999 break; 1000 /* 1001 * If found, replace it with: 1002 * addis r2, r12, (.TOC.-func)@ha 1003 * addi r2, r2, (.TOC.-func)@l 1004 */ 1005 ((uint32_t *)location)[0] = PPC_RAW_ADDIS(_R2, _R12, PPC_HA(value)); 1006 ((uint32_t *)location)[1] = PPC_RAW_ADDI(_R2, _R2, PPC_LO(value)); 1007 break; 1008 1009 case R_PPC64_REL16_HA: 1010 /* Subtract location pointer */ 1011 value -= (unsigned long)location; 1012 value = ((value + 0x8000) >> 16); 1013 *((uint16_t *) location) 1014 = (*((uint16_t *) location) & ~0xffff) 1015 | (value & 0xffff); 1016 break; 1017 1018 case R_PPC64_REL16_LO: 1019 /* Subtract location pointer */ 1020 value -= (unsigned long)location; 1021 *((uint16_t *) location) 1022 = (*((uint16_t *) location) & ~0xffff) 1023 | (value & 0xffff); 1024 break; 1025 1026 #ifdef CONFIG_PPC_KERNEL_PCREL 1027 case R_PPC64_GOT_PCREL34: 1028 value = got_for_addr(sechdrs, value, me, 1029 strtab + sym->st_name); 1030 if (!value) 1031 return -ENOENT; 1032 value -= (unsigned long)location; 1033 ((uint32_t *)location)[0] = (((uint32_t *)location)[0] & ~0x3ffff) | 1034 ((value >> 16) & 0x3ffff); 1035 ((uint32_t *)location)[1] = (((uint32_t *)location)[1] & ~0xffff) | 1036 (value & 0xffff); 1037 break; 1038 #endif 1039 1040 default: 1041 pr_err("%s: Unknown ADD relocation: %lu\n", 1042 me->name, 1043 (unsigned long)ELF64_R_TYPE(rela[i].r_info)); 1044 return -ENOEXEC; 1045 } 1046 } 1047 1048 return 0; 1049 } 1050 1051 #ifdef CONFIG_DYNAMIC_FTRACE 1052 int module_trampoline_target(struct module *mod, unsigned long addr, 1053 unsigned long *target) 1054 { 1055 struct ppc64_stub_entry *stub; 1056 func_desc_t funcdata; 1057 u32 magic; 1058 1059 if (!within_module_core(addr, mod)) { 1060 pr_err("%s: stub %lx not in module %s\n", __func__, addr, mod->name); 1061 return -EFAULT; 1062 } 1063 1064 stub = (struct ppc64_stub_entry *)addr; 1065 1066 if (copy_from_kernel_nofault(&magic, &stub->magic, 1067 sizeof(magic))) { 1068 pr_err("%s: fault reading magic for stub %lx for %s\n", __func__, addr, mod->name); 1069 return -EFAULT; 1070 } 1071 1072 if (magic != STUB_MAGIC) { 1073 pr_err("%s: bad magic for stub %lx for %s\n", __func__, addr, mod->name); 1074 return -EFAULT; 1075 } 1076 1077 if (copy_from_kernel_nofault(&funcdata, &stub->funcdata, 1078 sizeof(funcdata))) { 1079 pr_err("%s: fault reading funcdata for stub %lx for %s\n", __func__, addr, mod->name); 1080 return -EFAULT; 1081 } 1082 1083 *target = stub_func_addr(funcdata); 1084 1085 return 0; 1086 } 1087 1088 int module_finalize_ftrace(struct module *mod, const Elf_Shdr *sechdrs) 1089 { 1090 mod->arch.tramp = stub_for_addr(sechdrs, 1091 (unsigned long)ftrace_caller, 1092 mod, 1093 "ftrace_caller"); 1094 #ifdef CONFIG_DYNAMIC_FTRACE_WITH_REGS 1095 mod->arch.tramp_regs = stub_for_addr(sechdrs, 1096 (unsigned long)ftrace_regs_caller, 1097 mod, 1098 "ftrace_regs_caller"); 1099 if (!mod->arch.tramp_regs) 1100 return -ENOENT; 1101 #endif 1102 1103 if (!mod->arch.tramp) 1104 return -ENOENT; 1105 1106 return 0; 1107 } 1108 #endif 1109