1e1743d02SSøren Schmidt /*- 221a3ee0eSDavid E. O'Brien * Copyright (c) 2000 David O'Brien 3e1743d02SSøren Schmidt * Copyright (c) 1995-1996 Søren Schmidt 4e1743d02SSøren Schmidt * Copyright (c) 1996 Peter Wemm 5e1743d02SSøren Schmidt * All rights reserved. 6e1743d02SSøren Schmidt * 7e1743d02SSøren Schmidt * Redistribution and use in source and binary forms, with or without 8e1743d02SSøren Schmidt * modification, are permitted provided that the following conditions 9e1743d02SSøren Schmidt * are met: 10e1743d02SSøren Schmidt * 1. Redistributions of source code must retain the above copyright 11e1743d02SSøren Schmidt * notice, this list of conditions and the following disclaimer 12e1743d02SSøren Schmidt * in this position and unchanged. 13e1743d02SSøren Schmidt * 2. Redistributions in binary form must reproduce the above copyright 14e1743d02SSøren Schmidt * notice, this list of conditions and the following disclaimer in the 15e1743d02SSøren Schmidt * documentation and/or other materials provided with the distribution. 16e1743d02SSøren Schmidt * 3. The name of the author may not be used to endorse or promote products 1721dc7d4fSJens Schweikhardt * derived from this software without specific prior written permission 18e1743d02SSøren Schmidt * 19e1743d02SSøren Schmidt * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 20e1743d02SSøren Schmidt * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 21e1743d02SSøren Schmidt * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 
22e1743d02SSøren Schmidt * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 23e1743d02SSøren Schmidt * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 24e1743d02SSøren Schmidt * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 25e1743d02SSøren Schmidt * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 26e1743d02SSøren Schmidt * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 27e1743d02SSøren Schmidt * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 28e1743d02SSøren Schmidt * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 29e1743d02SSøren Schmidt */ 30e1743d02SSøren Schmidt 31677b542eSDavid E. O'Brien #include <sys/cdefs.h> 32677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 33677b542eSDavid E. O'Brien 3462919d78SPeter Wemm #include "opt_compat.h" 3562919d78SPeter Wemm 36e1743d02SSøren Schmidt #include <sys/param.h> 37e1743d02SSøren Schmidt #include <sys/exec.h> 388c64af4fSJohn Polstra #include <sys/fcntl.h> 39e1743d02SSøren Schmidt #include <sys/imgact.h> 40e1743d02SSøren Schmidt #include <sys/imgact_elf.h> 41e1743d02SSøren Schmidt #include <sys/kernel.h> 42f34fa851SJohn Baldwin #include <sys/lock.h> 43e1743d02SSøren Schmidt #include <sys/malloc.h> 4468ff2a43SChristian S.J. 
Peron #include <sys/mount.h> 4535e0e5b3SJohn Baldwin #include <sys/mutex.h> 468c64af4fSJohn Polstra #include <sys/mman.h> 47a794e791SBruce Evans #include <sys/namei.h> 488c64af4fSJohn Polstra #include <sys/pioctl.h> 49a794e791SBruce Evans #include <sys/proc.h> 508c64af4fSJohn Polstra #include <sys/procfs.h> 518c64af4fSJohn Polstra #include <sys/resourcevar.h> 52da61b9a6SAlan Cox #include <sys/sf_buf.h> 5336240ea5SDoug Rabson #include <sys/systm.h> 54e1743d02SSøren Schmidt #include <sys/signalvar.h> 558c64af4fSJohn Polstra #include <sys/stat.h> 561005a129SJohn Baldwin #include <sys/sx.h> 578c64af4fSJohn Polstra #include <sys/syscall.h> 58e1743d02SSøren Schmidt #include <sys/sysctl.h> 598c64af4fSJohn Polstra #include <sys/sysent.h> 60a794e791SBruce Evans #include <sys/vnode.h> 61e1743d02SSøren Schmidt 62e1743d02SSøren Schmidt #include <vm/vm.h> 63e1743d02SSøren Schmidt #include <vm/vm_kern.h> 64e1743d02SSøren Schmidt #include <vm/vm_param.h> 65e1743d02SSøren Schmidt #include <vm/pmap.h> 66e1743d02SSøren Schmidt #include <vm/vm_map.h> 670ff27d31SJohn Polstra #include <vm/vm_object.h> 68e1743d02SSøren Schmidt #include <vm/vm_extern.h> 69e1743d02SSøren Schmidt 7052c24af7SPeter Wemm #include <machine/elf.h> 71e1743d02SSøren Schmidt #include <machine/md_var.h> 72e1743d02SSøren Schmidt 7362919d78SPeter Wemm #if defined(COMPAT_IA32) && __ELF_WORD_SIZE == 32 7462919d78SPeter Wemm #include <machine/fpu.h> 7562919d78SPeter Wemm #include <compat/ia32/ia32_reg.h> 7662919d78SPeter Wemm #endif 7762919d78SPeter Wemm 78c815a20cSDavid E. O'Brien #define OLD_EI_BRAND 8 79c815a20cSDavid E. 
O'Brien 803ebc1248SPeter Wemm static int __elfN(check_header)(const Elf_Ehdr *hdr); 8132c01de2SDmitry Chagin static Elf_Brandinfo *__elfN(get_brandinfo)(struct image_params *imgp, 8232c01de2SDmitry Chagin const char *interp, int32_t *osrel); 833ebc1248SPeter Wemm static int __elfN(load_file)(struct proc *p, const char *file, u_long *addr, 843ebc1248SPeter Wemm u_long *entry, size_t pagesize); 85373d1a3fSAlan Cox static int __elfN(load_section)(struct vmspace *vmspace, vm_object_t object, 868c64af4fSJohn Polstra vm_offset_t offset, caddr_t vmaddr, size_t memsz, size_t filsz, 873ebc1248SPeter Wemm vm_prot_t prot, size_t pagesize); 883ebc1248SPeter Wemm static int __CONCAT(exec_, __elfN(imgact))(struct image_params *imgp); 8932c01de2SDmitry Chagin static boolean_t __elfN(check_note)(struct image_params *imgp, 9032c01de2SDmitry Chagin Elf_Brandnote *checknote, int32_t *osrel); 91e1743d02SSøren Schmidt 92a360a43dSJake Burkholder SYSCTL_NODE(_kern, OID_AUTO, __CONCAT(elf, __ELF_WORD_SIZE), CTLFLAG_RW, 0, 93a360a43dSJake Burkholder ""); 94a360a43dSJake Burkholder 95e548a1d4SJake Burkholder int __elfN(fallback_brand) = -1; 96e548a1d4SJake Burkholder SYSCTL_INT(__CONCAT(_kern_elf, __ELF_WORD_SIZE), OID_AUTO, 97e548a1d4SJake Burkholder fallback_brand, CTLFLAG_RW, &__elfN(fallback_brand), 0, 98a360a43dSJake Burkholder __XSTRING(__CONCAT(ELF, __ELF_WORD_SIZE)) " brand of last resort"); 99a360a43dSJake Burkholder TUNABLE_INT("kern.elf" __XSTRING(__ELF_WORD_SIZE) ".fallback_brand", 100e548a1d4SJake Burkholder &__elfN(fallback_brand)); 101a360a43dSJake Burkholder 102551d79e1SMarcel Moolenaar static int elf_legacy_coredump = 0; 103a360a43dSJake Burkholder SYSCTL_INT(_debug, OID_AUTO, __elfN(legacy_coredump), CTLFLAG_RW, 104551d79e1SMarcel Moolenaar &elf_legacy_coredump, 0, ""); 105e1743d02SSøren Schmidt 1063ebc1248SPeter Wemm static Elf_Brandinfo *elf_brand_list[MAX_BRANDS]; 107e1743d02SSøren Schmidt 10893d1c728SKonstantin Belousov #define trunc_page_ps(va, ps) ((va) & ~(ps - 1)) 
10993d1c728SKonstantin Belousov #define round_page_ps(va, ps) (((va) + (ps - 1)) & ~(ps - 1)) 11093d1c728SKonstantin Belousov #define aligned(a, t) (trunc_page_ps((u_long)(a), sizeof(t)) == (u_long)(a)) 11193d1c728SKonstantin Belousov 11232c01de2SDmitry Chagin static const char FREEBSD_ABI_VENDOR[] = "FreeBSD"; 11332c01de2SDmitry Chagin 11432c01de2SDmitry Chagin Elf_Brandnote __elfN(freebsd_brandnote) = { 11532c01de2SDmitry Chagin .hdr.n_namesz = sizeof(FREEBSD_ABI_VENDOR), 11632c01de2SDmitry Chagin .hdr.n_descsz = sizeof(int32_t), 11732c01de2SDmitry Chagin .hdr.n_type = 1, 11832c01de2SDmitry Chagin .vendor = FREEBSD_ABI_VENDOR, 11932c01de2SDmitry Chagin .flags = BN_CAN_FETCH_OSREL 12032c01de2SDmitry Chagin }; 12132c01de2SDmitry Chagin 122e1743d02SSøren Schmidt int 1233ebc1248SPeter Wemm __elfN(insert_brand_entry)(Elf_Brandinfo *entry) 124e1743d02SSøren Schmidt { 125e1743d02SSøren Schmidt int i; 126e1743d02SSøren Schmidt 1273ebc1248SPeter Wemm for (i = 0; i < MAX_BRANDS; i++) { 128ea5a2b2eSSøren Schmidt if (elf_brand_list[i] == NULL) { 129ea5a2b2eSSøren Schmidt elf_brand_list[i] = entry; 130e1743d02SSøren Schmidt break; 131e1743d02SSøren Schmidt } 132e1743d02SSøren Schmidt } 133ea5a2b2eSSøren Schmidt if (i == MAX_BRANDS) 134a7cddfedSJake Burkholder return (-1); 135a7cddfedSJake Burkholder return (0); 136e1743d02SSøren Schmidt } 137e1743d02SSøren Schmidt 138e1743d02SSøren Schmidt int 1393ebc1248SPeter Wemm __elfN(remove_brand_entry)(Elf_Brandinfo *entry) 140e1743d02SSøren Schmidt { 141e1743d02SSøren Schmidt int i; 142e1743d02SSøren Schmidt 1433ebc1248SPeter Wemm for (i = 0; i < MAX_BRANDS; i++) { 144ea5a2b2eSSøren Schmidt if (elf_brand_list[i] == entry) { 145ea5a2b2eSSøren Schmidt elf_brand_list[i] = NULL; 146e1743d02SSøren Schmidt break; 147e1743d02SSøren Schmidt } 148e1743d02SSøren Schmidt } 149ea5a2b2eSSøren Schmidt if (i == MAX_BRANDS) 150a7cddfedSJake Burkholder return (-1); 151a7cddfedSJake Burkholder return (0); 152e1743d02SSøren Schmidt } 153e1743d02SSøren 
Schmidt 154096977faSMark Newton int 1553ebc1248SPeter Wemm __elfN(brand_inuse)(Elf_Brandinfo *entry) 156096977faSMark Newton { 157096977faSMark Newton struct proc *p; 158553629ebSJake Burkholder int rval = FALSE; 159096977faSMark Newton 1601005a129SJohn Baldwin sx_slock(&allproc_lock); 1614f506694SXin LI FOREACH_PROC_IN_SYSTEM(p) { 162553629ebSJake Burkholder if (p->p_sysent == entry->sysvec) { 163553629ebSJake Burkholder rval = TRUE; 164553629ebSJake Burkholder break; 165096977faSMark Newton } 166553629ebSJake Burkholder } 1671005a129SJohn Baldwin sx_sunlock(&allproc_lock); 168096977faSMark Newton 169553629ebSJake Burkholder return (rval); 170096977faSMark Newton } 171096977faSMark Newton 1725fe3ed62SJake Burkholder static Elf_Brandinfo * 17332c01de2SDmitry Chagin __elfN(get_brandinfo)(struct image_params *imgp, const char *interp, 17432c01de2SDmitry Chagin int32_t *osrel) 1755fe3ed62SJake Burkholder { 17632c01de2SDmitry Chagin const Elf_Ehdr *hdr = (const Elf_Ehdr *)imgp->image_header; 1775fe3ed62SJake Burkholder Elf_Brandinfo *bi; 17832c01de2SDmitry Chagin boolean_t ret; 1795fe3ed62SJake Burkholder int i; 1805fe3ed62SJake Burkholder 1815fe3ed62SJake Burkholder /* 18232c01de2SDmitry Chagin * We support four types of branding -- (1) the ELF EI_OSABI field 1835fe3ed62SJake Burkholder * that SCO added to the ELF spec, (2) FreeBSD 3.x's traditional string 18432c01de2SDmitry Chagin * branding w/in the ELF header, (3) path of the `interp_path' 18532c01de2SDmitry Chagin * field, and (4) the ".note.ABI-tag" ELF section. 
1865fe3ed62SJake Burkholder */ 1875fe3ed62SJake Burkholder 18832c01de2SDmitry Chagin /* Look for an ".note.ABI-tag" ELF section */ 18932c01de2SDmitry Chagin for (i = 0; i < MAX_BRANDS; i++) { 19032c01de2SDmitry Chagin bi = elf_brand_list[i]; 19132c01de2SDmitry Chagin if (bi != NULL && hdr->e_machine == bi->machine && 19232c01de2SDmitry Chagin bi->brand_note != NULL) { 19332c01de2SDmitry Chagin ret = __elfN(check_note)(imgp, bi->brand_note, osrel); 19432c01de2SDmitry Chagin if (ret) 19532c01de2SDmitry Chagin return (bi); 19632c01de2SDmitry Chagin } 19732c01de2SDmitry Chagin } 19832c01de2SDmitry Chagin 1995fe3ed62SJake Burkholder /* If the executable has a brand, search for it in the brand list. */ 2005fe3ed62SJake Burkholder for (i = 0; i < MAX_BRANDS; i++) { 2015fe3ed62SJake Burkholder bi = elf_brand_list[i]; 2025fe3ed62SJake Burkholder if (bi != NULL && hdr->e_machine == bi->machine && 2035fe3ed62SJake Burkholder (hdr->e_ident[EI_OSABI] == bi->brand || 2045fe3ed62SJake Burkholder strncmp((const char *)&hdr->e_ident[OLD_EI_BRAND], 2055fe3ed62SJake Burkholder bi->compat_3_brand, strlen(bi->compat_3_brand)) == 0)) 2065fe3ed62SJake Burkholder return (bi); 2075fe3ed62SJake Burkholder } 2085fe3ed62SJake Burkholder 2095fe3ed62SJake Burkholder /* Lacking a known brand, search for a recognized interpreter. 
*/ 2105fe3ed62SJake Burkholder if (interp != NULL) { 2115fe3ed62SJake Burkholder for (i = 0; i < MAX_BRANDS; i++) { 2125fe3ed62SJake Burkholder bi = elf_brand_list[i]; 2135fe3ed62SJake Burkholder if (bi != NULL && hdr->e_machine == bi->machine && 2145fe3ed62SJake Burkholder strcmp(interp, bi->interp_path) == 0) 2155fe3ed62SJake Burkholder return (bi); 2165fe3ed62SJake Burkholder } 2175fe3ed62SJake Burkholder } 2185fe3ed62SJake Burkholder 2195fe3ed62SJake Burkholder /* Lacking a recognized interpreter, try the default brand */ 2205fe3ed62SJake Burkholder for (i = 0; i < MAX_BRANDS; i++) { 2215fe3ed62SJake Burkholder bi = elf_brand_list[i]; 2225fe3ed62SJake Burkholder if (bi != NULL && hdr->e_machine == bi->machine && 223e548a1d4SJake Burkholder __elfN(fallback_brand) == bi->brand) 2245fe3ed62SJake Burkholder return (bi); 2255fe3ed62SJake Burkholder } 2265fe3ed62SJake Burkholder return (NULL); 2275fe3ed62SJake Burkholder } 2285fe3ed62SJake Burkholder 229e1743d02SSøren Schmidt static int 2303ebc1248SPeter Wemm __elfN(check_header)(const Elf_Ehdr *hdr) 231e1743d02SSøren Schmidt { 232d0ca7c29SPeter Wemm Elf_Brandinfo *bi; 2333ebc1248SPeter Wemm int i; 2343ebc1248SPeter Wemm 23552c24af7SPeter Wemm if (!IS_ELF(*hdr) || 23652c24af7SPeter Wemm hdr->e_ident[EI_CLASS] != ELF_TARG_CLASS || 23752c24af7SPeter Wemm hdr->e_ident[EI_DATA] != ELF_TARG_DATA || 2383dc19c46SJacques Vidrine hdr->e_ident[EI_VERSION] != EV_CURRENT || 2393dc19c46SJacques Vidrine hdr->e_phentsize != sizeof(Elf_Phdr) || 2403dc19c46SJacques Vidrine hdr->e_version != ELF_TARG_VER) 241a7cddfedSJake Burkholder return (ENOEXEC); 242e1743d02SSøren Schmidt 2433ebc1248SPeter Wemm /* 2443ebc1248SPeter Wemm * Make sure we have at least one brand for this machine. 
2453ebc1248SPeter Wemm */ 2463ebc1248SPeter Wemm 2473ebc1248SPeter Wemm for (i = 0; i < MAX_BRANDS; i++) { 248d0ca7c29SPeter Wemm bi = elf_brand_list[i]; 249d0ca7c29SPeter Wemm if (bi != NULL && bi->machine == hdr->e_machine) 2503ebc1248SPeter Wemm break; 2513ebc1248SPeter Wemm } 2523ebc1248SPeter Wemm if (i == MAX_BRANDS) 253a7cddfedSJake Burkholder return (ENOEXEC); 254e1743d02SSøren Schmidt 255a7cddfedSJake Burkholder return (0); 256e1743d02SSøren Schmidt } 257e1743d02SSøren Schmidt 258e1743d02SSøren Schmidt static int 2593ebc1248SPeter Wemm __elfN(map_partial)(vm_map_t map, vm_object_t object, vm_ooffset_t offset, 260ff6f03c7SAlan Cox vm_offset_t start, vm_offset_t end, vm_prot_t prot) 2613ebc1248SPeter Wemm { 262da61b9a6SAlan Cox struct sf_buf *sf; 263da61b9a6SAlan Cox int error; 2643ebc1248SPeter Wemm vm_offset_t off; 2653ebc1248SPeter Wemm 2663ebc1248SPeter Wemm /* 2673ebc1248SPeter Wemm * Create the page if it doesn't exist yet. Ignore errors. 2683ebc1248SPeter Wemm */ 2693ebc1248SPeter Wemm vm_map_lock(map); 270ff6f03c7SAlan Cox vm_map_insert(map, NULL, 0, trunc_page(start), round_page(end), 271ff6f03c7SAlan Cox VM_PROT_ALL, VM_PROT_ALL, 0); 2723ebc1248SPeter Wemm vm_map_unlock(map); 2733ebc1248SPeter Wemm 2743ebc1248SPeter Wemm /* 2753ebc1248SPeter Wemm * Find the page from the underlying object. 
2763ebc1248SPeter Wemm */ 2773ebc1248SPeter Wemm if (object) { 278da61b9a6SAlan Cox sf = vm_imgact_map_page(object, offset); 279da61b9a6SAlan Cox if (sf == NULL) 280da61b9a6SAlan Cox return (KERN_FAILURE); 2813ebc1248SPeter Wemm off = offset - trunc_page(offset); 282da61b9a6SAlan Cox error = copyout((caddr_t)sf_buf_kva(sf) + off, (caddr_t)start, 283ca0387efSJake Burkholder end - start); 284da61b9a6SAlan Cox vm_imgact_unmap_page(sf); 2853ebc1248SPeter Wemm if (error) { 286a7cddfedSJake Burkholder return (KERN_FAILURE); 2873ebc1248SPeter Wemm } 2883ebc1248SPeter Wemm } 2893ebc1248SPeter Wemm 290a7cddfedSJake Burkholder return (KERN_SUCCESS); 2913ebc1248SPeter Wemm } 2923ebc1248SPeter Wemm 2933ebc1248SPeter Wemm static int 2943ebc1248SPeter Wemm __elfN(map_insert)(vm_map_t map, vm_object_t object, vm_ooffset_t offset, 295ff6f03c7SAlan Cox vm_offset_t start, vm_offset_t end, vm_prot_t prot, int cow) 2963ebc1248SPeter Wemm { 297da61b9a6SAlan Cox struct sf_buf *sf; 298da61b9a6SAlan Cox vm_offset_t off; 299a063facbSMarcel Moolenaar vm_size_t sz; 300a063facbSMarcel Moolenaar int error, rv; 3013ebc1248SPeter Wemm 3023ebc1248SPeter Wemm if (start != trunc_page(start)) { 30381f223caSJake Burkholder rv = __elfN(map_partial)(map, object, offset, start, 304ff6f03c7SAlan Cox round_page(start), prot); 3053ebc1248SPeter Wemm if (rv) 306a7cddfedSJake Burkholder return (rv); 3073ebc1248SPeter Wemm offset += round_page(start) - start; 3083ebc1248SPeter Wemm start = round_page(start); 3093ebc1248SPeter Wemm } 3103ebc1248SPeter Wemm if (end != round_page(end)) { 31181f223caSJake Burkholder rv = __elfN(map_partial)(map, object, offset + 312ff6f03c7SAlan Cox trunc_page(end) - start, trunc_page(end), end, prot); 3133ebc1248SPeter Wemm if (rv) 314a7cddfedSJake Burkholder return (rv); 3153ebc1248SPeter Wemm end = trunc_page(end); 3163ebc1248SPeter Wemm } 3173ebc1248SPeter Wemm if (end > start) { 3183ebc1248SPeter Wemm if (offset & PAGE_MASK) { 3193ebc1248SPeter Wemm /* 3203ebc1248SPeter Wemm 
* The mapping is not page aligned. This means we have 3213ebc1248SPeter Wemm * to copy the data. Sigh. 3223ebc1248SPeter Wemm */ 323584716b0SAlan Cox rv = vm_map_find(map, NULL, 0, &start, end - start, 324ff6f03c7SAlan Cox FALSE, prot | VM_PROT_WRITE, VM_PROT_ALL, 0); 3253ebc1248SPeter Wemm if (rv) 326a7cddfedSJake Burkholder return (rv); 327da61b9a6SAlan Cox if (object == NULL) 328da61b9a6SAlan Cox return (KERN_SUCCESS); 329da61b9a6SAlan Cox for (; start < end; start += sz) { 330da61b9a6SAlan Cox sf = vm_imgact_map_page(object, offset); 331da61b9a6SAlan Cox if (sf == NULL) 332da61b9a6SAlan Cox return (KERN_FAILURE); 3333ebc1248SPeter Wemm off = offset - trunc_page(offset); 3343ebc1248SPeter Wemm sz = end - start; 335da61b9a6SAlan Cox if (sz > PAGE_SIZE - off) 336da61b9a6SAlan Cox sz = PAGE_SIZE - off; 337da61b9a6SAlan Cox error = copyout((caddr_t)sf_buf_kva(sf) + off, 3383ebc1248SPeter Wemm (caddr_t)start, sz); 339da61b9a6SAlan Cox vm_imgact_unmap_page(sf); 3403ebc1248SPeter Wemm if (error) { 341a7cddfedSJake Burkholder return (KERN_FAILURE); 3423ebc1248SPeter Wemm } 343da61b9a6SAlan Cox offset += sz; 3443ebc1248SPeter Wemm } 3453ebc1248SPeter Wemm rv = KERN_SUCCESS; 3463ebc1248SPeter Wemm } else { 347e5e6093bSAlan Cox vm_object_reference(object); 3483ebc1248SPeter Wemm vm_map_lock(map); 3493ebc1248SPeter Wemm rv = vm_map_insert(map, object, offset, start, end, 350ff6f03c7SAlan Cox prot, VM_PROT_ALL, cow); 3513ebc1248SPeter Wemm vm_map_unlock(map); 352e5e6093bSAlan Cox if (rv != KERN_SUCCESS) 353e5e6093bSAlan Cox vm_object_deallocate(object); 3543ebc1248SPeter Wemm } 355a7cddfedSJake Burkholder return (rv); 3563ebc1248SPeter Wemm } else { 357a7cddfedSJake Burkholder return (KERN_SUCCESS); 3583ebc1248SPeter Wemm } 3593ebc1248SPeter Wemm } 3603ebc1248SPeter Wemm 3613ebc1248SPeter Wemm static int 362373d1a3fSAlan Cox __elfN(load_section)(struct vmspace *vmspace, 363373d1a3fSAlan Cox vm_object_t object, vm_offset_t offset, 3643ebc1248SPeter Wemm caddr_t vmaddr, size_t 
memsz, size_t filsz, vm_prot_t prot, 3653ebc1248SPeter Wemm size_t pagesize) 366e1743d02SSøren Schmidt { 367da61b9a6SAlan Cox struct sf_buf *sf; 368e1743d02SSøren Schmidt size_t map_len; 369e1743d02SSøren Schmidt vm_offset_t map_addr; 370fa7dd9c5SMatthew Dillon int error, rv, cow; 371e1743d02SSøren Schmidt size_t copy_len; 37252c24af7SPeter Wemm vm_offset_t file_addr; 37352c24af7SPeter Wemm 37425ead034SBrian Feldman /* 37525ead034SBrian Feldman * It's necessary to fail if the filsz + offset taken from the 37625ead034SBrian Feldman * header is greater than the actual file pager object's size. 37725ead034SBrian Feldman * If we were to allow this, then the vm_map_find() below would 37825ead034SBrian Feldman * walk right off the end of the file object and into the ether. 37925ead034SBrian Feldman * 38025ead034SBrian Feldman * While I'm here, might as well check for something else that 38125ead034SBrian Feldman * is invalid: filsz cannot be greater than memsz. 38225ead034SBrian Feldman */ 38325ead034SBrian Feldman if ((off_t)filsz + offset > object->un_pager.vnp.vnp_size || 38425ead034SBrian Feldman filsz > memsz) { 38525ead034SBrian Feldman uprintf("elf_load_section: truncated ELF file\n"); 38625ead034SBrian Feldman return (ENOEXEC); 38725ead034SBrian Feldman } 38825ead034SBrian Feldman 3893ebc1248SPeter Wemm map_addr = trunc_page_ps((vm_offset_t)vmaddr, pagesize); 3903ebc1248SPeter Wemm file_addr = trunc_page_ps(offset, pagesize); 391e1743d02SSøren Schmidt 392e1743d02SSøren Schmidt /* 39352c24af7SPeter Wemm * We have two choices. We can either clear the data in the last page 39452c24af7SPeter Wemm * of an oversized mapping, or we can start the anon mapping a page 39552c24af7SPeter Wemm * early and copy the initialized data into that first page. We 39652c24af7SPeter Wemm * choose the second.. 
39752c24af7SPeter Wemm */ 39852c24af7SPeter Wemm if (memsz > filsz) 3993ebc1248SPeter Wemm map_len = trunc_page_ps(offset + filsz, pagesize) - file_addr; 40052c24af7SPeter Wemm else 4013ebc1248SPeter Wemm map_len = round_page_ps(offset + filsz, pagesize) - file_addr; 40252c24af7SPeter Wemm 40352c24af7SPeter Wemm if (map_len != 0) { 404fa7dd9c5SMatthew Dillon /* cow flags: don't dump readonly sections in core */ 405fa7dd9c5SMatthew Dillon cow = MAP_COPY_ON_WRITE | MAP_PREFAULT | 406fa7dd9c5SMatthew Dillon (prot & VM_PROT_WRITE ? 0 : MAP_DISABLE_COREDUMP); 407fa7dd9c5SMatthew Dillon 4083ebc1248SPeter Wemm rv = __elfN(map_insert)(&vmspace->vm_map, 40952c24af7SPeter Wemm object, 41052c24af7SPeter Wemm file_addr, /* file offset */ 41152c24af7SPeter Wemm map_addr, /* virtual start */ 41252c24af7SPeter Wemm map_addr + map_len,/* virtual end */ 41352c24af7SPeter Wemm prot, 414fa7dd9c5SMatthew Dillon cow); 415e5e6093bSAlan Cox if (rv != KERN_SUCCESS) 416a7cddfedSJake Burkholder return (EINVAL); 41752c24af7SPeter Wemm 41852c24af7SPeter Wemm /* we can stop now if we've covered it all */ 41923955314SAlfred Perlstein if (memsz == filsz) { 420a7cddfedSJake Burkholder return (0); 42152c24af7SPeter Wemm } 42223955314SAlfred Perlstein } 42352c24af7SPeter Wemm 42452c24af7SPeter Wemm 42552c24af7SPeter Wemm /* 42652c24af7SPeter Wemm * We have to get the remaining bit of the file into the first part 42752c24af7SPeter Wemm * of the oversized map segment. This is normally because the .data 42852c24af7SPeter Wemm * segment in the file is extended to provide bss. It's a neat idea 42952c24af7SPeter Wemm * to try and save a page, but it's a pain in the behind to implement. 
430e1743d02SSøren Schmidt */ 4313ebc1248SPeter Wemm copy_len = (offset + filsz) - trunc_page_ps(offset + filsz, pagesize); 4323ebc1248SPeter Wemm map_addr = trunc_page_ps((vm_offset_t)vmaddr + filsz, pagesize); 433ca0387efSJake Burkholder map_len = round_page_ps((vm_offset_t)vmaddr + memsz, pagesize) - 434ca0387efSJake Burkholder map_addr; 435e1743d02SSøren Schmidt 43652c24af7SPeter Wemm /* This had damn well better be true! */ 4378191d577SPeter Wemm if (map_len != 0) { 43881f223caSJake Burkholder rv = __elfN(map_insert)(&vmspace->vm_map, NULL, 0, map_addr, 439ff6f03c7SAlan Cox map_addr + map_len, VM_PROT_ALL, 0); 44023955314SAlfred Perlstein if (rv != KERN_SUCCESS) { 441a7cddfedSJake Burkholder return (EINVAL); 4428191d577SPeter Wemm } 44323955314SAlfred Perlstein } 444e1743d02SSøren Schmidt 44552c24af7SPeter Wemm if (copy_len != 0) { 4463ebc1248SPeter Wemm vm_offset_t off; 447da61b9a6SAlan Cox 448da61b9a6SAlan Cox sf = vm_imgact_map_page(object, offset + filsz); 449da61b9a6SAlan Cox if (sf == NULL) 450da61b9a6SAlan Cox return (EIO); 451e1743d02SSøren Schmidt 45252c24af7SPeter Wemm /* send the page fragment to user space */ 45381f223caSJake Burkholder off = trunc_page_ps(offset + filsz, pagesize) - 45481f223caSJake Burkholder trunc_page(offset + filsz); 455da61b9a6SAlan Cox error = copyout((caddr_t)sf_buf_kva(sf) + off, 456da61b9a6SAlan Cox (caddr_t)map_addr, copy_len); 457da61b9a6SAlan Cox vm_imgact_unmap_page(sf); 45823955314SAlfred Perlstein if (error) { 45952c24af7SPeter Wemm return (error); 46052c24af7SPeter Wemm } 46123955314SAlfred Perlstein } 462e1743d02SSøren Schmidt 463e1743d02SSøren Schmidt /* 4643ebc1248SPeter Wemm * set it to the specified protection. 4653ebc1248SPeter Wemm * XXX had better undo the damage from pasting over the cracks here! 
466e1743d02SSøren Schmidt */ 4673ebc1248SPeter Wemm vm_map_protect(&vmspace->vm_map, trunc_page(map_addr), 4683ebc1248SPeter Wemm round_page(map_addr + map_len), prot, FALSE); 4698191d577SPeter Wemm 470ff6f03c7SAlan Cox return (0); 471e1743d02SSøren Schmidt } 472e1743d02SSøren Schmidt 473c33fe779SJohn Polstra /* 474c33fe779SJohn Polstra * Load the file "file" into memory. It may be either a shared object 475c33fe779SJohn Polstra * or an executable. 476c33fe779SJohn Polstra * 477c33fe779SJohn Polstra * The "addr" reference parameter is in/out. On entry, it specifies 478c33fe779SJohn Polstra * the address where a shared object should be loaded. If the file is 479c33fe779SJohn Polstra * an executable, this value is ignored. On exit, "addr" specifies 480c33fe779SJohn Polstra * where the file was actually loaded. 481c33fe779SJohn Polstra * 482c33fe779SJohn Polstra * The "entry" reference parameter is out only. On exit, it specifies 483c33fe779SJohn Polstra * the entry point for the loaded file. 484c33fe779SJohn Polstra */ 485e1743d02SSøren Schmidt static int 4863ebc1248SPeter Wemm __elfN(load_file)(struct proc *p, const char *file, u_long *addr, 4873ebc1248SPeter Wemm u_long *entry, size_t pagesize) 488e1743d02SSøren Schmidt { 489911c2be0SMark Peek struct { 490911c2be0SMark Peek struct nameidata nd; 491911c2be0SMark Peek struct vattr attr; 492911c2be0SMark Peek struct image_params image_params; 493911c2be0SMark Peek } *tempdata; 494d254af07SMatthew Dillon const Elf_Ehdr *hdr = NULL; 495d254af07SMatthew Dillon const Elf_Phdr *phdr = NULL; 496911c2be0SMark Peek struct nameidata *nd; 497e1743d02SSøren Schmidt struct vmspace *vmspace = p->p_vmspace; 498911c2be0SMark Peek struct vattr *attr; 499911c2be0SMark Peek struct image_params *imgp; 50052c24af7SPeter Wemm vm_prot_t prot; 501c33fe779SJohn Polstra u_long rbase; 502c33fe779SJohn Polstra u_long base_addr = 0; 50368ff2a43SChristian S.J. 
Peron int vfslocked, error, i, numsegs; 504e1743d02SSøren Schmidt 505a163d034SWarner Losh tempdata = malloc(sizeof(*tempdata), M_TEMP, M_WAITOK); 506911c2be0SMark Peek nd = &tempdata->nd; 507911c2be0SMark Peek attr = &tempdata->attr; 508911c2be0SMark Peek imgp = &tempdata->image_params; 509911c2be0SMark Peek 510c8a79999SPeter Wemm /* 511c8a79999SPeter Wemm * Initialize part of the common data 512c8a79999SPeter Wemm */ 513c8a79999SPeter Wemm imgp->proc = p; 514911c2be0SMark Peek imgp->attr = attr; 515c8a79999SPeter Wemm imgp->firstpage = NULL; 51659c8bc40SAlan Cox imgp->image_header = NULL; 5170b2ed1aeSJeff Roberson imgp->object = NULL; 5186d7bdc8dSRobert Watson imgp->execlabel = NULL; 519c8a79999SPeter Wemm 52068ff2a43SChristian S.J. Peron NDINIT(nd, LOOKUP, MPSAFE|LOCKLEAF|FOLLOW, UIO_SYSSPACE, file, 52168ff2a43SChristian S.J. Peron curthread); 52268ff2a43SChristian S.J. Peron vfslocked = 0; 523911c2be0SMark Peek if ((error = namei(nd)) != 0) { 524911c2be0SMark Peek nd->ni_vp = NULL; 525e1743d02SSøren Schmidt goto fail; 526e1743d02SSøren Schmidt } 52768ff2a43SChristian S.J. Peron vfslocked = NDHASGIANT(nd); 528911c2be0SMark Peek NDFREE(nd, NDF_ONLY_PNBUF); 529911c2be0SMark Peek imgp->vp = nd->ni_vp; 530c8a79999SPeter Wemm 531e1743d02SSøren Schmidt /* 532e1743d02SSøren Schmidt * Check permissions, modes, uid, etc on the file, and "open" it. 533e1743d02SSøren Schmidt */ 534c8a79999SPeter Wemm error = exec_check_permissions(imgp); 535373d1a3fSAlan Cox if (error) 536c8a79999SPeter Wemm goto fail; 537e1743d02SSøren Schmidt 538c8a79999SPeter Wemm error = exec_map_first_page(imgp); 539373d1a3fSAlan Cox if (error) 540373d1a3fSAlan Cox goto fail; 541373d1a3fSAlan Cox 54225ead034SBrian Feldman /* 54325ead034SBrian Feldman * Also make certain that the interpreter stays the same, so set 544e6e370a7SJeff Roberson * its VV_TEXT flag, too. 
54525ead034SBrian Feldman */ 546e6e370a7SJeff Roberson nd->ni_vp->v_vflag |= VV_TEXT; 547e6e370a7SJeff Roberson 5488516dd18SPoul-Henning Kamp imgp->object = nd->ni_vp->v_object; 549e1743d02SSøren Schmidt 550d254af07SMatthew Dillon hdr = (const Elf_Ehdr *)imgp->image_header; 5513ebc1248SPeter Wemm if ((error = __elfN(check_header)(hdr)) != 0) 552e1743d02SSøren Schmidt goto fail; 553c33fe779SJohn Polstra if (hdr->e_type == ET_DYN) 554c33fe779SJohn Polstra rbase = *addr; 555c33fe779SJohn Polstra else if (hdr->e_type == ET_EXEC) 556c33fe779SJohn Polstra rbase = 0; 557c33fe779SJohn Polstra else { 558c33fe779SJohn Polstra error = ENOEXEC; 559c33fe779SJohn Polstra goto fail; 560c33fe779SJohn Polstra } 561e1743d02SSøren Schmidt 562c8a79999SPeter Wemm /* Only support headers that fit within first page for now */ 5633dc19c46SJacques Vidrine /* (multiplication of two Elf_Half fields will not overflow) */ 56452c24af7SPeter Wemm if ((hdr->e_phoff > PAGE_SIZE) || 5653dc19c46SJacques Vidrine (hdr->e_phentsize * hdr->e_phnum) > PAGE_SIZE - hdr->e_phoff) { 566c8a79999SPeter Wemm error = ENOEXEC; 567e1743d02SSøren Schmidt goto fail; 568c8a79999SPeter Wemm } 569c8a79999SPeter Wemm 570d254af07SMatthew Dillon phdr = (const Elf_Phdr *)(imgp->image_header + hdr->e_phoff); 57193d1c728SKonstantin Belousov if (!aligned(phdr, Elf_Addr)) { 57293d1c728SKonstantin Belousov error = ENOEXEC; 57393d1c728SKonstantin Belousov goto fail; 57493d1c728SKonstantin Belousov } 575e1743d02SSøren Schmidt 576c33fe779SJohn Polstra for (i = 0, numsegs = 0; i < hdr->e_phnum; i++) { 57752c24af7SPeter Wemm if (phdr[i].p_type == PT_LOAD) { /* Loadable segment */ 57852c24af7SPeter Wemm prot = 0; 579e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_X) 580e1743d02SSøren Schmidt prot |= VM_PROT_EXECUTE; 581e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_W) 582e1743d02SSøren Schmidt prot |= VM_PROT_WRITE; 583e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_R) 584e1743d02SSøren Schmidt prot |= VM_PROT_READ; 
585e1743d02SSøren Schmidt 586373d1a3fSAlan Cox if ((error = __elfN(load_section)(vmspace, 587373d1a3fSAlan Cox imgp->object, phdr[i].p_offset, 58881f223caSJake Burkholder (caddr_t)(uintptr_t)phdr[i].p_vaddr + rbase, 58981f223caSJake Burkholder phdr[i].p_memsz, phdr[i].p_filesz, prot, 59081f223caSJake Burkholder pagesize)) != 0) 591e1743d02SSøren Schmidt goto fail; 592e1743d02SSøren Schmidt /* 593c33fe779SJohn Polstra * Establish the base address if this is the 594c33fe779SJohn Polstra * first segment. 595e1743d02SSøren Schmidt */ 596c33fe779SJohn Polstra if (numsegs == 0) 597ca0387efSJake Burkholder base_addr = trunc_page(phdr[i].p_vaddr + 598ca0387efSJake Burkholder rbase); 599c33fe779SJohn Polstra numsegs++; 600e1743d02SSøren Schmidt } 601e1743d02SSøren Schmidt } 602c33fe779SJohn Polstra *addr = base_addr; 603c33fe779SJohn Polstra *entry = (unsigned long)hdr->e_entry + rbase; 604e1743d02SSøren Schmidt 605e1743d02SSøren Schmidt fail: 606c8a79999SPeter Wemm if (imgp->firstpage) 607c8a79999SPeter Wemm exec_unmap_first_page(imgp); 6080b2ed1aeSJeff Roberson 609911c2be0SMark Peek if (nd->ni_vp) 610373d1a3fSAlan Cox vput(nd->ni_vp); 611911c2be0SMark Peek 61268ff2a43SChristian S.J. 
Peron VFS_UNLOCK_GIANT(vfslocked); 613911c2be0SMark Peek free(tempdata, M_TEMP); 614e1743d02SSøren Schmidt 615a7cddfedSJake Burkholder return (error); 616e1743d02SSøren Schmidt } 617e1743d02SSøren Schmidt 618303b270bSEivind Eklund static int 6193ebc1248SPeter Wemm __CONCAT(exec_, __elfN(imgact))(struct image_params *imgp) 620e1743d02SSøren Schmidt { 621ecbb00a2SDoug Rabson const Elf_Ehdr *hdr = (const Elf_Ehdr *)imgp->image_header; 62232c01de2SDmitry Chagin const Elf_Phdr *phdr; 623e5e6093bSAlan Cox Elf_Auxargs *elf_auxargs; 6245856e12eSJohn Dyson struct vmspace *vmspace; 62552c24af7SPeter Wemm vm_prot_t prot; 62621c2d047SMatthew Dillon u_long text_size = 0, data_size = 0, total_size = 0; 627e1743d02SSøren Schmidt u_long text_addr = 0, data_addr = 0; 628cac45152SMatthew Dillon u_long seg_size, seg_addr; 629e1743d02SSøren Schmidt u_long addr, entry = 0, proghdr = 0; 63032c01de2SDmitry Chagin int32_t osrel = 0; 631610ecfe0SMaxim Sobolev int error = 0, i; 6324113f8d7SPeter Wemm const char *interp = NULL, *newinterp = NULL; 633d1dbc694SJohn Polstra Elf_Brandinfo *brand_info; 634911c2be0SMark Peek char *path; 6355fe3ed62SJake Burkholder struct sysentvec *sv; 636e1743d02SSøren Schmidt 637e1743d02SSøren Schmidt /* 638e1743d02SSøren Schmidt * Do we have a valid ELF header ? 639900b28f9SMaxim Sobolev * 640900b28f9SMaxim Sobolev * Only allow ET_EXEC & ET_DYN here, reject ET_DYN later 641900b28f9SMaxim Sobolev * if particular brand doesn't support it. 642e1743d02SSøren Schmidt */ 643900b28f9SMaxim Sobolev if (__elfN(check_header)(hdr) != 0 || 644900b28f9SMaxim Sobolev (hdr->e_type != ET_EXEC && hdr->e_type != ET_DYN)) 645a7cddfedSJake Burkholder return (-1); 646e1743d02SSøren Schmidt 647e1743d02SSøren Schmidt /* 648e1743d02SSøren Schmidt * From here on down, we return an errno, not -1, as we've 649e1743d02SSøren Schmidt * detected an ELF file. 
650e1743d02SSøren Schmidt */ 651e1743d02SSøren Schmidt 652e1743d02SSøren Schmidt if ((hdr->e_phoff > PAGE_SIZE) || 65352c24af7SPeter Wemm (hdr->e_phoff + hdr->e_phentsize * hdr->e_phnum) > PAGE_SIZE) { 654c8a79999SPeter Wemm /* Only support headers in first page for now */ 655a7cddfedSJake Burkholder return (ENOEXEC); 656e1743d02SSøren Schmidt } 65752c24af7SPeter Wemm phdr = (const Elf_Phdr *)(imgp->image_header + hdr->e_phoff); 65893d1c728SKonstantin Belousov if (!aligned(phdr, Elf_Addr)) 65993d1c728SKonstantin Belousov return (ENOEXEC); 6605fe3ed62SJake Burkholder for (i = 0; i < hdr->e_phnum; i++) { 661e5e6093bSAlan Cox if (phdr[i].p_type == PT_INTERP) { 662e5e6093bSAlan Cox /* Path to interpreter */ 6635fe3ed62SJake Burkholder if (phdr[i].p_filesz > MAXPATHLEN || 66460bb3943SAlan Cox phdr[i].p_offset + phdr[i].p_filesz > PAGE_SIZE) 66560bb3943SAlan Cox return (ENOEXEC); 6665fe3ed62SJake Burkholder interp = imgp->image_header + phdr[i].p_offset; 6675fe3ed62SJake Burkholder break; 6683ebc1248SPeter Wemm } 6693ebc1248SPeter Wemm } 6703ebc1248SPeter Wemm 67132c01de2SDmitry Chagin brand_info = __elfN(get_brandinfo)(imgp, interp, &osrel); 6725fe3ed62SJake Burkholder if (brand_info == NULL) { 6735fe3ed62SJake Burkholder uprintf("ELF binary type \"%u\" not known.\n", 6745fe3ed62SJake Burkholder hdr->e_ident[EI_OSABI]); 67560bb3943SAlan Cox return (ENOEXEC); 6763ebc1248SPeter Wemm } 677900b28f9SMaxim Sobolev if (hdr->e_type == ET_DYN && 678d49b2109SMaxim Sobolev (brand_info->flags & BI_CAN_EXEC_DYN) == 0) 679d49b2109SMaxim Sobolev return (ENOEXEC); 6805fe3ed62SJake Burkholder sv = brand_info->sysvec; 6819b68618dSPeter Wemm if (interp != NULL && brand_info->interp_newpath != NULL) 6824113f8d7SPeter Wemm newinterp = brand_info->interp_newpath; 6833ebc1248SPeter Wemm 68460bb3943SAlan Cox /* 68560bb3943SAlan Cox * Avoid a possible deadlock if the current address space is destroyed 68660bb3943SAlan Cox * and that address space maps the locked vnode. 
In the common case, 68760bb3943SAlan Cox * the locked vnode's v_usecount is decremented but remains greater 68860bb3943SAlan Cox * than zero. Consequently, the vnode lock is not needed by vrele(). 68960bb3943SAlan Cox * However, in cases where the vnode lock is external, such as nullfs, 69060bb3943SAlan Cox * v_usecount may become zero. 69160bb3943SAlan Cox */ 69222db15c0SAttilio Rao VOP_UNLOCK(imgp->vp, 0); 69360bb3943SAlan Cox 69489b57fcfSKonstantin Belousov error = exec_new_vmspace(imgp, sv); 69519059a13SJohn Baldwin imgp->proc->p_sysent = sv; 696e1743d02SSøren Schmidt 697cb05b60aSAttilio Rao vn_lock(imgp->vp, LK_EXCLUSIVE | LK_RETRY); 69889b57fcfSKonstantin Belousov if (error) 69989b57fcfSKonstantin Belousov return (error); 70060bb3943SAlan Cox 7015856e12eSJohn Dyson vmspace = imgp->proc->p_vmspace; 7025856e12eSJohn Dyson 703e1743d02SSøren Schmidt for (i = 0; i < hdr->e_phnum; i++) { 704e1743d02SSøren Schmidt switch (phdr[i].p_type) { 705e1743d02SSøren Schmidt case PT_LOAD: /* Loadable segment */ 70652c24af7SPeter Wemm prot = 0; 707e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_X) 708e1743d02SSøren Schmidt prot |= VM_PROT_EXECUTE; 709e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_W) 710e1743d02SSøren Schmidt prot |= VM_PROT_WRITE; 711e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_R) 712e1743d02SSøren Schmidt prot |= VM_PROT_READ; 713e1743d02SSøren Schmidt 7143ebc1248SPeter Wemm #if defined(__ia64__) && __ELF_WORD_SIZE == 32 && defined(IA32_ME_HARDER) 7153ebc1248SPeter Wemm /* 7163ebc1248SPeter Wemm * Some x86 binaries assume read == executable, 7173ebc1248SPeter Wemm * notably the M3 runtime and therefore cvsup 7183ebc1248SPeter Wemm */ 7193ebc1248SPeter Wemm if (prot & VM_PROT_READ) 7203ebc1248SPeter Wemm prot |= VM_PROT_EXECUTE; 7213ebc1248SPeter Wemm #endif 7223ebc1248SPeter Wemm 723373d1a3fSAlan Cox if ((error = __elfN(load_section)(vmspace, 724373d1a3fSAlan Cox imgp->object, phdr[i].p_offset, 7253ebc1248SPeter Wemm (caddr_t)(uintptr_t)phdr[i].p_vaddr, 
72681f223caSJake Burkholder phdr[i].p_memsz, phdr[i].p_filesz, prot, 7275fe3ed62SJake Burkholder sv->sv_pagesize)) != 0) 72860bb3943SAlan Cox return (error); 729e1743d02SSøren Schmidt 730cfaf7e60SDoug Rabson /* 731cfaf7e60SDoug Rabson * If this segment contains the program headers, 732cfaf7e60SDoug Rabson * remember their virtual address for the AT_PHDR 733cfaf7e60SDoug Rabson * aux entry. Static binaries don't usually include 734cfaf7e60SDoug Rabson * a PT_PHDR entry. 735cfaf7e60SDoug Rabson */ 736cfaf7e60SDoug Rabson if (phdr[i].p_offset == 0 && 737cfaf7e60SDoug Rabson hdr->e_phoff + hdr->e_phnum * hdr->e_phentsize 738cfaf7e60SDoug Rabson <= phdr[i].p_filesz) 739cfaf7e60SDoug Rabson proghdr = phdr[i].p_vaddr + hdr->e_phoff; 740cfaf7e60SDoug Rabson 741cac45152SMatthew Dillon seg_addr = trunc_page(phdr[i].p_vaddr); 742cac45152SMatthew Dillon seg_size = round_page(phdr[i].p_memsz + 743cac45152SMatthew Dillon phdr[i].p_vaddr - seg_addr); 744cac45152SMatthew Dillon 745e1743d02SSøren Schmidt /* 74621c2d047SMatthew Dillon * Is this .text or .data? We can't use 74721c2d047SMatthew Dillon * VM_PROT_WRITE or VM_PROT_EXEC, it breaks the 74821c2d047SMatthew Dillon * alpha terribly and possibly does other bad 74921c2d047SMatthew Dillon * things so we stick to the old way of figuring 75021c2d047SMatthew Dillon * it out: If the segment contains the program 75121c2d047SMatthew Dillon * entry point, it's a text segment, otherwise it 75221c2d047SMatthew Dillon * is a data segment. 75321c2d047SMatthew Dillon * 75421c2d047SMatthew Dillon * Note that obreak() assumes that data_addr + 75521c2d047SMatthew Dillon * data_size == end of data load area, and the ELF 75621c2d047SMatthew Dillon * file format expects segments to be sorted by 75721c2d047SMatthew Dillon * address. If multiple data segments exist, the 75821c2d047SMatthew Dillon * last one will be used. 
759e1743d02SSøren Schmidt */ 7609782ecbaSPeter Wemm if (hdr->e_entry >= phdr[i].p_vaddr && 7619782ecbaSPeter Wemm hdr->e_entry < (phdr[i].p_vaddr + 7629782ecbaSPeter Wemm phdr[i].p_memsz)) { 7639782ecbaSPeter Wemm text_size = seg_size; 7649782ecbaSPeter Wemm text_addr = seg_addr; 7659782ecbaSPeter Wemm entry = (u_long)hdr->e_entry; 7669782ecbaSPeter Wemm } else { 76721c2d047SMatthew Dillon data_size = seg_size; 768cac45152SMatthew Dillon data_addr = seg_addr; 769cac45152SMatthew Dillon } 77021c2d047SMatthew Dillon total_size += seg_size; 77196725dd0SAlexander Kabaev break; 77296725dd0SAlexander Kabaev case PT_PHDR: /* Program header table info */ 77396725dd0SAlexander Kabaev proghdr = phdr[i].p_vaddr; 77496725dd0SAlexander Kabaev break; 77596725dd0SAlexander Kabaev default: 77696725dd0SAlexander Kabaev break; 77796725dd0SAlexander Kabaev } 77896725dd0SAlexander Kabaev } 77996725dd0SAlexander Kabaev 78096725dd0SAlexander Kabaev if (data_addr == 0 && data_size == 0) { 78196725dd0SAlexander Kabaev data_addr = text_addr; 78296725dd0SAlexander Kabaev data_size = text_size; 78396725dd0SAlexander Kabaev } 784cac45152SMatthew Dillon 785cac45152SMatthew Dillon /* 786cac45152SMatthew Dillon * Check limits. It should be safe to check the 78796725dd0SAlexander Kabaev * limits after loading the segments since we do 78896725dd0SAlexander Kabaev * not actually fault in all the segments pages. 
789cac45152SMatthew Dillon */ 79091d5354aSJohn Baldwin PROC_LOCK(imgp->proc); 79191d5354aSJohn Baldwin if (data_size > lim_cur(imgp->proc, RLIMIT_DATA) || 792cac45152SMatthew Dillon text_size > maxtsiz || 79391d5354aSJohn Baldwin total_size > lim_cur(imgp->proc, RLIMIT_VMEM)) { 79491d5354aSJohn Baldwin PROC_UNLOCK(imgp->proc); 79560bb3943SAlan Cox return (ENOMEM); 796cac45152SMatthew Dillon } 797e1743d02SSøren Schmidt 798e1743d02SSøren Schmidt vmspace->vm_tsize = text_size >> PAGE_SHIFT; 7997cd99438SBruce Evans vmspace->vm_taddr = (caddr_t)(uintptr_t)text_addr; 800e1743d02SSøren Schmidt vmspace->vm_dsize = data_size >> PAGE_SHIFT; 8017cd99438SBruce Evans vmspace->vm_daddr = (caddr_t)(uintptr_t)data_addr; 802e1743d02SSøren Schmidt 803c460ac3aSPeter Wemm /* 804c460ac3aSPeter Wemm * We load the dynamic linker where a userland call 805c460ac3aSPeter Wemm * to mmap(0, ...) would put it. The rationale behind this 806c460ac3aSPeter Wemm * calculation is that it leaves room for the heap to grow to 807c460ac3aSPeter Wemm * its maximum allowed size. 
808c460ac3aSPeter Wemm */ 809c460ac3aSPeter Wemm addr = round_page((vm_offset_t)imgp->proc->p_vmspace->vm_daddr + 81091d5354aSJohn Baldwin lim_max(imgp->proc, RLIMIT_DATA)); 81191d5354aSJohn Baldwin PROC_UNLOCK(imgp->proc); 812e1743d02SSøren Schmidt 813ea5a2b2eSSøren Schmidt imgp->entry_addr = entry; 814ea5a2b2eSSøren Schmidt 81560bb3943SAlan Cox if (interp != NULL) { 8164113f8d7SPeter Wemm int have_interp = FALSE; 81722db15c0SAttilio Rao VOP_UNLOCK(imgp->vp, 0); 81860bb3943SAlan Cox if (brand_info->emul_path != NULL && 8199b68618dSPeter Wemm brand_info->emul_path[0] != '\0') { 820a163d034SWarner Losh path = malloc(MAXPATHLEN, M_TEMP, M_WAITOK); 82160bb3943SAlan Cox snprintf(path, MAXPATHLEN, "%s%s", 82260bb3943SAlan Cox brand_info->emul_path, interp); 8239b68618dSPeter Wemm error = __elfN(load_file)(imgp->proc, path, &addr, 8249b68618dSPeter Wemm &imgp->entry_addr, sv->sv_pagesize); 825911c2be0SMark Peek free(path, M_TEMP); 8269b68618dSPeter Wemm if (error == 0) 8274113f8d7SPeter Wemm have_interp = TRUE; 8289b68618dSPeter Wemm } 8294113f8d7SPeter Wemm if (!have_interp && newinterp != NULL) { 8304113f8d7SPeter Wemm error = __elfN(load_file)(imgp->proc, newinterp, &addr, 8314113f8d7SPeter Wemm &imgp->entry_addr, sv->sv_pagesize); 832387ad998SKonstantin Belousov if (error == 0) 8334113f8d7SPeter Wemm have_interp = TRUE; 8344113f8d7SPeter Wemm } 8354113f8d7SPeter Wemm if (!have_interp) { 8369b68618dSPeter Wemm error = __elfN(load_file)(imgp->proc, interp, &addr, 8379b68618dSPeter Wemm &imgp->entry_addr, sv->sv_pagesize); 83860bb3943SAlan Cox } 839cb05b60aSAttilio Rao vn_lock(imgp->vp, LK_EXCLUSIVE | LK_RETRY); 8409b68618dSPeter Wemm if (error != 0) { 8419b68618dSPeter Wemm uprintf("ELF interpreter %s not found\n", interp); 84260bb3943SAlan Cox return (error); 843e1743d02SSøren Schmidt } 84495c807cfSRobert Watson } else 84595c807cfSRobert Watson addr = 0; 846ea5a2b2eSSøren Schmidt 847e1743d02SSøren Schmidt /* 848e1743d02SSøren Schmidt * Construct auxargs table (used by 
the fixup routine) 849e1743d02SSøren Schmidt */ 850a163d034SWarner Losh elf_auxargs = malloc(sizeof(Elf_Auxargs), M_TEMP, M_WAITOK); 851e1743d02SSøren Schmidt elf_auxargs->execfd = -1; 852e1743d02SSøren Schmidt elf_auxargs->phdr = proghdr; 853e1743d02SSøren Schmidt elf_auxargs->phent = hdr->e_phentsize; 854e1743d02SSøren Schmidt elf_auxargs->phnum = hdr->e_phnum; 855e1743d02SSøren Schmidt elf_auxargs->pagesz = PAGE_SIZE; 856e1743d02SSøren Schmidt elf_auxargs->base = addr; 857e1743d02SSøren Schmidt elf_auxargs->flags = 0; 858e1743d02SSøren Schmidt elf_auxargs->entry = entry; 859e1743d02SSøren Schmidt 860e1743d02SSøren Schmidt imgp->auxargs = elf_auxargs; 861e1743d02SSøren Schmidt imgp->interpreted = 0; 86232c01de2SDmitry Chagin imgp->proc->p_osrel = osrel; 863f231de47SKonstantin Belousov 864a7cddfedSJake Burkholder return (error); 865e1743d02SSøren Schmidt } 866e1743d02SSøren Schmidt 867a360a43dSJake Burkholder #define suword __CONCAT(suword, __ELF_WORD_SIZE) 8683ebc1248SPeter Wemm 8693ebc1248SPeter Wemm int 8703ebc1248SPeter Wemm __elfN(freebsd_fixup)(register_t **stack_base, struct image_params *imgp) 871e1743d02SSøren Schmidt { 872ecbb00a2SDoug Rabson Elf_Auxargs *args = (Elf_Auxargs *)imgp->auxargs; 873a360a43dSJake Burkholder Elf_Addr *base; 874a360a43dSJake Burkholder Elf_Addr *pos; 875e1743d02SSøren Schmidt 876a360a43dSJake Burkholder base = (Elf_Addr *)*stack_base; 877610ecfe0SMaxim Sobolev pos = base + (imgp->args->argc + imgp->args->envc + 2); 878e1743d02SSøren Schmidt 87935c2a5a8SWarner Losh if (args->execfd != -1) 880e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_EXECFD, args->execfd); 881e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PHDR, args->phdr); 882e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PHENT, args->phent); 883e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PHNUM, args->phnum); 884e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PAGESZ, args->pagesz); 885e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_FLAGS, args->flags); 886e1743d02SSøren Schmidt 
AUXARGS_ENTRY(pos, AT_ENTRY, args->entry); 887e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_BASE, args->base); 888e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_NULL, 0); 889e1743d02SSøren Schmidt 890e1743d02SSøren Schmidt free(imgp->auxargs, M_TEMP); 891e1743d02SSøren Schmidt imgp->auxargs = NULL; 892e1743d02SSøren Schmidt 8933ebc1248SPeter Wemm base--; 894610ecfe0SMaxim Sobolev suword(base, (long)imgp->args->argc); 8953ebc1248SPeter Wemm *stack_base = (register_t *)base; 896a7cddfedSJake Burkholder return (0); 897e1743d02SSøren Schmidt } 898e1743d02SSøren Schmidt 899e1743d02SSøren Schmidt /* 9008c64af4fSJohn Polstra * Code for generating ELF core dumps. 9018c64af4fSJohn Polstra */ 9028c64af4fSJohn Polstra 9034d77a549SAlfred Perlstein typedef void (*segment_callback)(vm_map_entry_t, void *); 9040ff27d31SJohn Polstra 9050ff27d31SJohn Polstra /* Closure for cb_put_phdr(). */ 9060ff27d31SJohn Polstra struct phdr_closure { 9070ff27d31SJohn Polstra Elf_Phdr *phdr; /* Program header to fill in */ 9080ff27d31SJohn Polstra Elf_Off offset; /* Offset of segment in core file */ 9090ff27d31SJohn Polstra }; 9100ff27d31SJohn Polstra 9110ff27d31SJohn Polstra /* Closure for cb_size_segment(). */ 9120ff27d31SJohn Polstra struct sseg_closure { 9130ff27d31SJohn Polstra int count; /* Count of writable segments. */ 9140ff27d31SJohn Polstra size_t size; /* Total size of all writable segments. 
*/ 9150ff27d31SJohn Polstra }; 9160ff27d31SJohn Polstra 9174d77a549SAlfred Perlstein static void cb_put_phdr(vm_map_entry_t, void *); 9184d77a549SAlfred Perlstein static void cb_size_segment(vm_map_entry_t, void *); 919247aba24SMarcel Moolenaar static void each_writable_segment(struct thread *, segment_callback, void *); 9203ebc1248SPeter Wemm static int __elfN(corehdr)(struct thread *, struct vnode *, struct ucred *, 9214d77a549SAlfred Perlstein int, void *, size_t); 922247aba24SMarcel Moolenaar static void __elfN(puthdr)(struct thread *, void *, size_t *, int); 9233ebc1248SPeter Wemm static void __elfN(putnote)(void *, size_t *, const char *, int, 9244d77a549SAlfred Perlstein const void *, size_t); 9258c64af4fSJohn Polstra 9268c64af4fSJohn Polstra int 9273ebc1248SPeter Wemm __elfN(coredump)(td, vp, limit) 928b40ce416SJulian Elischer struct thread *td; 929247aba24SMarcel Moolenaar struct vnode *vp; 930fca666a1SJulian Elischer off_t limit; 931fca666a1SJulian Elischer { 932247aba24SMarcel Moolenaar struct ucred *cred = td->td_ucred; 933fca666a1SJulian Elischer int error = 0; 9340ff27d31SJohn Polstra struct sseg_closure seginfo; 9350ff27d31SJohn Polstra void *hdr; 9368c64af4fSJohn Polstra size_t hdrsize; 9378c64af4fSJohn Polstra 9380ff27d31SJohn Polstra /* Size the program segments. */ 9390ff27d31SJohn Polstra seginfo.count = 0; 9400ff27d31SJohn Polstra seginfo.size = 0; 941247aba24SMarcel Moolenaar each_writable_segment(td, cb_size_segment, &seginfo); 9420ff27d31SJohn Polstra 9430ff27d31SJohn Polstra /* 9440ff27d31SJohn Polstra * Calculate the size of the core file header area by making 9450ff27d31SJohn Polstra * a dry run of generating it. Nothing is written, but the 9460ff27d31SJohn Polstra * size is calculated. 
9470ff27d31SJohn Polstra */ 9480ff27d31SJohn Polstra hdrsize = 0; 949247aba24SMarcel Moolenaar __elfN(puthdr)(td, (void *)NULL, &hdrsize, seginfo.count); 9500ff27d31SJohn Polstra 951fca666a1SJulian Elischer if (hdrsize + seginfo.size >= limit) 9528c64af4fSJohn Polstra return (EFAULT); 9530ff27d31SJohn Polstra 9540ff27d31SJohn Polstra /* 9550ff27d31SJohn Polstra * Allocate memory for building the header, fill it up, 9560ff27d31SJohn Polstra * and write it out. 9570ff27d31SJohn Polstra */ 958a163d034SWarner Losh hdr = malloc(hdrsize, M_TEMP, M_WAITOK); 9590ff27d31SJohn Polstra if (hdr == NULL) { 960a7cddfedSJake Burkholder return (EINVAL); 9610ff27d31SJohn Polstra } 9623ebc1248SPeter Wemm error = __elfN(corehdr)(td, vp, cred, seginfo.count, hdr, hdrsize); 9630ff27d31SJohn Polstra 9640ff27d31SJohn Polstra /* Write the contents of all of the writable segments. */ 9650ff27d31SJohn Polstra if (error == 0) { 9660ff27d31SJohn Polstra Elf_Phdr *php; 9672b471bc6STim J. Robbins off_t offset; 9680ff27d31SJohn Polstra int i; 9690ff27d31SJohn Polstra 9700ff27d31SJohn Polstra php = (Elf_Phdr *)((char *)hdr + sizeof(Elf_Ehdr)) + 1; 9710ff27d31SJohn Polstra offset = hdrsize; 9720ff27d31SJohn Polstra for (i = 0; i < seginfo.count; i++) { 97306ae1e91SMatthew Dillon error = vn_rdwr_inchunks(UIO_WRITE, vp, 9742b471bc6STim J. Robbins (caddr_t)(uintptr_t)php->p_vaddr, 9752b471bc6STim J. Robbins php->p_filesz, offset, UIO_USERSPACE, 976f99619a0STim J. Robbins IO_UNIT | IO_DIRECT, cred, NOCRED, NULL, 9776617724cSJeff Roberson curthread); 9780ff27d31SJohn Polstra if (error != 0) 9792b471bc6STim J. 
Robbins break; 9800ff27d31SJohn Polstra offset += php->p_filesz; 9810ff27d31SJohn Polstra php++; 9820ff27d31SJohn Polstra } 9830ff27d31SJohn Polstra } 9840ff27d31SJohn Polstra free(hdr, M_TEMP); 9850ff27d31SJohn Polstra 986a7cddfedSJake Burkholder return (error); 9878c64af4fSJohn Polstra } 9888c64af4fSJohn Polstra 9890ff27d31SJohn Polstra /* 9900ff27d31SJohn Polstra * A callback for each_writable_segment() to write out the segment's 9910ff27d31SJohn Polstra * program header entry. 9920ff27d31SJohn Polstra */ 9930ff27d31SJohn Polstra static void 9940ff27d31SJohn Polstra cb_put_phdr(entry, closure) 9950ff27d31SJohn Polstra vm_map_entry_t entry; 9960ff27d31SJohn Polstra void *closure; 9970ff27d31SJohn Polstra { 9980ff27d31SJohn Polstra struct phdr_closure *phc = (struct phdr_closure *)closure; 9990ff27d31SJohn Polstra Elf_Phdr *phdr = phc->phdr; 10000ff27d31SJohn Polstra 10010ff27d31SJohn Polstra phc->offset = round_page(phc->offset); 10020ff27d31SJohn Polstra 10030ff27d31SJohn Polstra phdr->p_type = PT_LOAD; 10040ff27d31SJohn Polstra phdr->p_offset = phc->offset; 10050ff27d31SJohn Polstra phdr->p_vaddr = entry->start; 10060ff27d31SJohn Polstra phdr->p_paddr = 0; 10070ff27d31SJohn Polstra phdr->p_filesz = phdr->p_memsz = entry->end - entry->start; 10080ff27d31SJohn Polstra phdr->p_align = PAGE_SIZE; 10090ff27d31SJohn Polstra phdr->p_flags = 0; 10100ff27d31SJohn Polstra if (entry->protection & VM_PROT_READ) 10110ff27d31SJohn Polstra phdr->p_flags |= PF_R; 10120ff27d31SJohn Polstra if (entry->protection & VM_PROT_WRITE) 10130ff27d31SJohn Polstra phdr->p_flags |= PF_W; 10140ff27d31SJohn Polstra if (entry->protection & VM_PROT_EXECUTE) 10150ff27d31SJohn Polstra phdr->p_flags |= PF_X; 10160ff27d31SJohn Polstra 10170ff27d31SJohn Polstra phc->offset += phdr->p_filesz; 10180ff27d31SJohn Polstra phc->phdr++; 10190ff27d31SJohn Polstra } 10200ff27d31SJohn Polstra 10210ff27d31SJohn Polstra /* 10220ff27d31SJohn Polstra * A callback for each_writable_segment() to gather information 
about 10230ff27d31SJohn Polstra * the number of segments and their total size. 10240ff27d31SJohn Polstra */ 10250ff27d31SJohn Polstra static void 10260ff27d31SJohn Polstra cb_size_segment(entry, closure) 10270ff27d31SJohn Polstra vm_map_entry_t entry; 10280ff27d31SJohn Polstra void *closure; 10290ff27d31SJohn Polstra { 10300ff27d31SJohn Polstra struct sseg_closure *ssc = (struct sseg_closure *)closure; 10310ff27d31SJohn Polstra 10320ff27d31SJohn Polstra ssc->count++; 10330ff27d31SJohn Polstra ssc->size += entry->end - entry->start; 10340ff27d31SJohn Polstra } 10350ff27d31SJohn Polstra 10360ff27d31SJohn Polstra /* 10370ff27d31SJohn Polstra * For each writable segment in the process's memory map, call the given 10380ff27d31SJohn Polstra * function with a pointer to the map entry and some arbitrary 10390ff27d31SJohn Polstra * caller-supplied data. 10400ff27d31SJohn Polstra */ 10410ff27d31SJohn Polstra static void 1042247aba24SMarcel Moolenaar each_writable_segment(td, func, closure) 1043247aba24SMarcel Moolenaar struct thread *td; 10440ff27d31SJohn Polstra segment_callback func; 10450ff27d31SJohn Polstra void *closure; 10460ff27d31SJohn Polstra { 1047247aba24SMarcel Moolenaar struct proc *p = td->td_proc; 10480ff27d31SJohn Polstra vm_map_t map = &p->p_vmspace->vm_map; 10490ff27d31SJohn Polstra vm_map_entry_t entry; 1050976a87a2SAlan Cox vm_object_t backing_object, object; 1051976a87a2SAlan Cox boolean_t ignore_entry; 10520ff27d31SJohn Polstra 1053976a87a2SAlan Cox vm_map_lock_read(map); 10540ff27d31SJohn Polstra for (entry = map->header.next; entry != &map->header; 10550ff27d31SJohn Polstra entry = entry->next) { 1056fa7dd9c5SMatthew Dillon /* 1057fa7dd9c5SMatthew Dillon * Don't dump inaccessible mappings, deal with legacy 1058fa7dd9c5SMatthew Dillon * coredump mode. 
1059fa7dd9c5SMatthew Dillon * 1060fa7dd9c5SMatthew Dillon * Note that read-only segments related to the elf binary 1061fa7dd9c5SMatthew Dillon * are marked MAP_ENTRY_NOCOREDUMP now so we no longer 1062fa7dd9c5SMatthew Dillon * need to arbitrarily ignore such segments. 1063fa7dd9c5SMatthew Dillon */ 1064fa7dd9c5SMatthew Dillon if (elf_legacy_coredump) { 1065fa7dd9c5SMatthew Dillon if ((entry->protection & VM_PROT_RW) != VM_PROT_RW) 10660ff27d31SJohn Polstra continue; 1067fa7dd9c5SMatthew Dillon } else { 1068fa7dd9c5SMatthew Dillon if ((entry->protection & VM_PROT_ALL) == 0) 1069fa7dd9c5SMatthew Dillon continue; 1070fa7dd9c5SMatthew Dillon } 10710ff27d31SJohn Polstra 10729730a5daSPaul Saab /* 1073fa7dd9c5SMatthew Dillon * Dont include memory segment in the coredump if 1074fa7dd9c5SMatthew Dillon * MAP_NOCORE is set in mmap(2) or MADV_NOCORE in 1075fa7dd9c5SMatthew Dillon * madvise(2). Do not dump submaps (i.e. parts of the 1076fa7dd9c5SMatthew Dillon * kernel map). 10779730a5daSPaul Saab */ 1078fa7dd9c5SMatthew Dillon if (entry->eflags & (MAP_ENTRY_NOCOREDUMP|MAP_ENTRY_IS_SUB_MAP)) 10799730a5daSPaul Saab continue; 10809730a5daSPaul Saab 1081976a87a2SAlan Cox if ((object = entry->object.vm_object) == NULL) 10820ff27d31SJohn Polstra continue; 10830ff27d31SJohn Polstra 10840ff27d31SJohn Polstra /* Ignore memory-mapped devices and such things. 
*/ 1085976a87a2SAlan Cox VM_OBJECT_LOCK(object); 1086976a87a2SAlan Cox while ((backing_object = object->backing_object) != NULL) { 1087976a87a2SAlan Cox VM_OBJECT_LOCK(backing_object); 1088976a87a2SAlan Cox VM_OBJECT_UNLOCK(object); 1089976a87a2SAlan Cox object = backing_object; 1090976a87a2SAlan Cox } 1091976a87a2SAlan Cox ignore_entry = object->type != OBJT_DEFAULT && 1092976a87a2SAlan Cox object->type != OBJT_SWAP && object->type != OBJT_VNODE; 1093976a87a2SAlan Cox VM_OBJECT_UNLOCK(object); 1094976a87a2SAlan Cox if (ignore_entry) 10950ff27d31SJohn Polstra continue; 10960ff27d31SJohn Polstra 10970ff27d31SJohn Polstra (*func)(entry, closure); 10980ff27d31SJohn Polstra } 1099976a87a2SAlan Cox vm_map_unlock_read(map); 11000ff27d31SJohn Polstra } 11010ff27d31SJohn Polstra 11020ff27d31SJohn Polstra /* 11030ff27d31SJohn Polstra * Write the core file header to the file, including padding up to 11040ff27d31SJohn Polstra * the page boundary. 11050ff27d31SJohn Polstra */ 11068c64af4fSJohn Polstra static int 11073ebc1248SPeter Wemm __elfN(corehdr)(td, vp, cred, numsegs, hdr, hdrsize) 1108b40ce416SJulian Elischer struct thread *td; 11098c64af4fSJohn Polstra struct vnode *vp; 11108c64af4fSJohn Polstra struct ucred *cred; 11110ff27d31SJohn Polstra int numsegs; 11120ff27d31SJohn Polstra size_t hdrsize; 11130ff27d31SJohn Polstra void *hdr; 11148c64af4fSJohn Polstra { 1115911c2be0SMark Peek size_t off; 11168c64af4fSJohn Polstra 11178c64af4fSJohn Polstra /* Fill in the header. */ 11180ff27d31SJohn Polstra bzero(hdr, hdrsize); 11198c64af4fSJohn Polstra off = 0; 1120247aba24SMarcel Moolenaar __elfN(puthdr)(td, hdr, &off, numsegs); 11218c64af4fSJohn Polstra 11228c64af4fSJohn Polstra /* Write it to the core file. 
*/ 1123a7cddfedSJake Burkholder return (vn_rdwr_inchunks(UIO_WRITE, vp, hdr, hdrsize, (off_t)0, 11249ca43589SRobert Watson UIO_SYSSPACE, IO_UNIT | IO_DIRECT, cred, NOCRED, NULL, 11256617724cSJeff Roberson td)); 1126dada0278SJohn Polstra } 1127dada0278SJohn Polstra 112862919d78SPeter Wemm #if defined(COMPAT_IA32) && __ELF_WORD_SIZE == 32 112962919d78SPeter Wemm typedef struct prstatus32 elf_prstatus_t; 113062919d78SPeter Wemm typedef struct prpsinfo32 elf_prpsinfo_t; 113162919d78SPeter Wemm typedef struct fpreg32 elf_prfpregset_t; 113262919d78SPeter Wemm typedef struct fpreg32 elf_fpregset_t; 113362919d78SPeter Wemm typedef struct reg32 elf_gregset_t; 113462919d78SPeter Wemm #else 113562919d78SPeter Wemm typedef prstatus_t elf_prstatus_t; 113662919d78SPeter Wemm typedef prpsinfo_t elf_prpsinfo_t; 113762919d78SPeter Wemm typedef prfpregset_t elf_prfpregset_t; 113862919d78SPeter Wemm typedef prfpregset_t elf_fpregset_t; 113962919d78SPeter Wemm typedef gregset_t elf_gregset_t; 114062919d78SPeter Wemm #endif 114162919d78SPeter Wemm 11428c64af4fSJohn Polstra static void 1143247aba24SMarcel Moolenaar __elfN(puthdr)(struct thread *td, void *dst, size_t *off, int numsegs) 11448c64af4fSJohn Polstra { 11458c9b7b2cSMarcel Moolenaar struct { 114662919d78SPeter Wemm elf_prstatus_t status; 114762919d78SPeter Wemm elf_prfpregset_t fpregset; 114862919d78SPeter Wemm elf_prpsinfo_t psinfo; 11498c9b7b2cSMarcel Moolenaar } *tempdata; 115062919d78SPeter Wemm elf_prstatus_t *status; 115162919d78SPeter Wemm elf_prfpregset_t *fpregset; 115262919d78SPeter Wemm elf_prpsinfo_t *psinfo; 1153247aba24SMarcel Moolenaar struct proc *p; 1154247aba24SMarcel Moolenaar struct thread *thr; 11558c9b7b2cSMarcel Moolenaar size_t ehoff, noteoff, notesz, phoff; 11568c64af4fSJohn Polstra 1157247aba24SMarcel Moolenaar p = td->td_proc; 1158247aba24SMarcel Moolenaar 11598c64af4fSJohn Polstra ehoff = *off; 11608c64af4fSJohn Polstra *off += sizeof(Elf_Ehdr); 11618c64af4fSJohn Polstra 11628c64af4fSJohn Polstra 
phoff = *off; 11630ff27d31SJohn Polstra *off += (numsegs + 1) * sizeof(Elf_Phdr); 11648c64af4fSJohn Polstra 11658c64af4fSJohn Polstra noteoff = *off; 11668c9b7b2cSMarcel Moolenaar /* 11678c9b7b2cSMarcel Moolenaar * Don't allocate space for the notes if we're just calculating 11688c9b7b2cSMarcel Moolenaar * the size of the header. We also don't collect the data. 11698c9b7b2cSMarcel Moolenaar */ 11708c9b7b2cSMarcel Moolenaar if (dst != NULL) { 11718c9b7b2cSMarcel Moolenaar tempdata = malloc(sizeof(*tempdata), M_TEMP, M_ZERO|M_WAITOK); 11728c9b7b2cSMarcel Moolenaar status = &tempdata->status; 11738c9b7b2cSMarcel Moolenaar fpregset = &tempdata->fpregset; 11748c9b7b2cSMarcel Moolenaar psinfo = &tempdata->psinfo; 11758c9b7b2cSMarcel Moolenaar } else { 11768c9b7b2cSMarcel Moolenaar tempdata = NULL; 11778c9b7b2cSMarcel Moolenaar status = NULL; 11788c9b7b2cSMarcel Moolenaar fpregset = NULL; 11798c9b7b2cSMarcel Moolenaar psinfo = NULL; 11808c9b7b2cSMarcel Moolenaar } 11818c9b7b2cSMarcel Moolenaar 11828c9b7b2cSMarcel Moolenaar if (dst != NULL) { 11838c9b7b2cSMarcel Moolenaar psinfo->pr_version = PRPSINFO_VERSION; 118462919d78SPeter Wemm psinfo->pr_psinfosz = sizeof(elf_prpsinfo_t); 1185ccd3953eSJohn Baldwin strlcpy(psinfo->pr_fname, p->p_comm, sizeof(psinfo->pr_fname)); 11868c9b7b2cSMarcel Moolenaar /* 11878c9b7b2cSMarcel Moolenaar * XXX - We don't fill in the command line arguments properly 11888c9b7b2cSMarcel Moolenaar * yet. 
11898c9b7b2cSMarcel Moolenaar */ 1190ccd3953eSJohn Baldwin strlcpy(psinfo->pr_psargs, p->p_comm, 11918c9b7b2cSMarcel Moolenaar sizeof(psinfo->pr_psargs)); 11928c9b7b2cSMarcel Moolenaar } 11938c9b7b2cSMarcel Moolenaar __elfN(putnote)(dst, off, "FreeBSD", NT_PRPSINFO, psinfo, 11948c9b7b2cSMarcel Moolenaar sizeof *psinfo); 11958c9b7b2cSMarcel Moolenaar 11968c9b7b2cSMarcel Moolenaar /* 11971f7a1baaSMarcel Moolenaar * To have the debugger select the right thread (LWP) as the initial 11981f7a1baaSMarcel Moolenaar * thread, we dump the state of the thread passed to us in td first. 11991f7a1baaSMarcel Moolenaar * This is the thread that causes the core dump and thus likely to 12001f7a1baaSMarcel Moolenaar * be the right thread one wants to have selected in the debugger. 12018c9b7b2cSMarcel Moolenaar */ 1202247aba24SMarcel Moolenaar thr = td; 1203247aba24SMarcel Moolenaar while (thr != NULL) { 12048c9b7b2cSMarcel Moolenaar if (dst != NULL) { 12058c9b7b2cSMarcel Moolenaar status->pr_version = PRSTATUS_VERSION; 120662919d78SPeter Wemm status->pr_statussz = sizeof(elf_prstatus_t); 120762919d78SPeter Wemm status->pr_gregsetsz = sizeof(elf_gregset_t); 120862919d78SPeter Wemm status->pr_fpregsetsz = sizeof(elf_fpregset_t); 12098c9b7b2cSMarcel Moolenaar status->pr_osreldate = osreldate; 12108c9b7b2cSMarcel Moolenaar status->pr_cursig = p->p_sig; 12111f7a1baaSMarcel Moolenaar status->pr_pid = thr->td_tid; 121262919d78SPeter Wemm #if defined(COMPAT_IA32) && __ELF_WORD_SIZE == 32 121362919d78SPeter Wemm fill_regs32(thr, &status->pr_reg); 121462919d78SPeter Wemm fill_fpregs32(thr, fpregset); 121562919d78SPeter Wemm #else 12168c9b7b2cSMarcel Moolenaar fill_regs(thr, &status->pr_reg); 12178c9b7b2cSMarcel Moolenaar fill_fpregs(thr, fpregset); 121862919d78SPeter Wemm #endif 12198c9b7b2cSMarcel Moolenaar } 12203ebc1248SPeter Wemm __elfN(putnote)(dst, off, "FreeBSD", NT_PRSTATUS, status, 12218c64af4fSJohn Polstra sizeof *status); 12223ebc1248SPeter Wemm __elfN(putnote)(dst, off, "FreeBSD", 
NT_FPREGSET, fpregset, 12238c64af4fSJohn Polstra sizeof *fpregset); 12244da47b2fSMarcel Moolenaar /* 12254da47b2fSMarcel Moolenaar * Allow for MD specific notes, as well as any MD 12264da47b2fSMarcel Moolenaar * specific preparations for writing MI notes. 12274da47b2fSMarcel Moolenaar */ 12284da47b2fSMarcel Moolenaar __elfN(dump_thread)(thr, dst, off); 1229247aba24SMarcel Moolenaar 1230247aba24SMarcel Moolenaar thr = (thr == td) ? TAILQ_FIRST(&p->p_threads) : 12318c9b7b2cSMarcel Moolenaar TAILQ_NEXT(thr, td_plist); 1232247aba24SMarcel Moolenaar if (thr == td) 12338c9b7b2cSMarcel Moolenaar thr = TAILQ_NEXT(thr, td_plist); 1234247aba24SMarcel Moolenaar } 12358c9b7b2cSMarcel Moolenaar 12368c64af4fSJohn Polstra notesz = *off - noteoff; 12378c64af4fSJohn Polstra 12388c9b7b2cSMarcel Moolenaar if (dst != NULL) 12398c9b7b2cSMarcel Moolenaar free(tempdata, M_TEMP); 12408c9b7b2cSMarcel Moolenaar 12410ff27d31SJohn Polstra /* Align up to a page boundary for the program segments. */ 12428c64af4fSJohn Polstra *off = round_page(*off); 12438c64af4fSJohn Polstra 12448c64af4fSJohn Polstra if (dst != NULL) { 12458c64af4fSJohn Polstra Elf_Ehdr *ehdr; 12468c64af4fSJohn Polstra Elf_Phdr *phdr; 12470ff27d31SJohn Polstra struct phdr_closure phc; 12488c64af4fSJohn Polstra 12498c64af4fSJohn Polstra /* 12508c64af4fSJohn Polstra * Fill in the ELF header. 12518c64af4fSJohn Polstra */ 12528c64af4fSJohn Polstra ehdr = (Elf_Ehdr *)((char *)dst + ehoff); 12538c64af4fSJohn Polstra ehdr->e_ident[EI_MAG0] = ELFMAG0; 12548c64af4fSJohn Polstra ehdr->e_ident[EI_MAG1] = ELFMAG1; 12558c64af4fSJohn Polstra ehdr->e_ident[EI_MAG2] = ELFMAG2; 12568c64af4fSJohn Polstra ehdr->e_ident[EI_MAG3] = ELFMAG3; 12578c64af4fSJohn Polstra ehdr->e_ident[EI_CLASS] = ELF_CLASS; 12588c64af4fSJohn Polstra ehdr->e_ident[EI_DATA] = ELF_DATA; 12598c64af4fSJohn Polstra ehdr->e_ident[EI_VERSION] = EV_CURRENT; 1260c815a20cSDavid E. O'Brien ehdr->e_ident[EI_OSABI] = ELFOSABI_FREEBSD; 1261c815a20cSDavid E. 
O'Brien ehdr->e_ident[EI_ABIVERSION] = 0; 12628c64af4fSJohn Polstra ehdr->e_ident[EI_PAD] = 0; 12638c64af4fSJohn Polstra ehdr->e_type = ET_CORE; 126462919d78SPeter Wemm #if defined(COMPAT_IA32) && __ELF_WORD_SIZE == 32 126562919d78SPeter Wemm ehdr->e_machine = EM_386; 126662919d78SPeter Wemm #else 12678c64af4fSJohn Polstra ehdr->e_machine = ELF_ARCH; 126862919d78SPeter Wemm #endif 12698c64af4fSJohn Polstra ehdr->e_version = EV_CURRENT; 12708c64af4fSJohn Polstra ehdr->e_entry = 0; 12718c64af4fSJohn Polstra ehdr->e_phoff = phoff; 12728c64af4fSJohn Polstra ehdr->e_flags = 0; 12738c64af4fSJohn Polstra ehdr->e_ehsize = sizeof(Elf_Ehdr); 12748c64af4fSJohn Polstra ehdr->e_phentsize = sizeof(Elf_Phdr); 12750ff27d31SJohn Polstra ehdr->e_phnum = numsegs + 1; 12768c64af4fSJohn Polstra ehdr->e_shentsize = sizeof(Elf_Shdr); 12778c64af4fSJohn Polstra ehdr->e_shnum = 0; 12788c64af4fSJohn Polstra ehdr->e_shstrndx = SHN_UNDEF; 12798c64af4fSJohn Polstra 12808c64af4fSJohn Polstra /* 12818c64af4fSJohn Polstra * Fill in the program header entries. 12828c64af4fSJohn Polstra */ 12838c64af4fSJohn Polstra phdr = (Elf_Phdr *)((char *)dst + phoff); 12848c64af4fSJohn Polstra 12858c64af4fSJohn Polstra /* The note segement. */ 12868c64af4fSJohn Polstra phdr->p_type = PT_NOTE; 12878c64af4fSJohn Polstra phdr->p_offset = noteoff; 12888c64af4fSJohn Polstra phdr->p_vaddr = 0; 12898c64af4fSJohn Polstra phdr->p_paddr = 0; 12908c64af4fSJohn Polstra phdr->p_filesz = notesz; 12918c64af4fSJohn Polstra phdr->p_memsz = 0; 12928c64af4fSJohn Polstra phdr->p_flags = 0; 12938c64af4fSJohn Polstra phdr->p_align = 0; 12948c64af4fSJohn Polstra phdr++; 12958c64af4fSJohn Polstra 12960ff27d31SJohn Polstra /* All the writable segments from the program. 
*/ 12970ff27d31SJohn Polstra phc.phdr = phdr; 12980ff27d31SJohn Polstra phc.offset = *off; 1299247aba24SMarcel Moolenaar each_writable_segment(td, cb_put_phdr, &phc); 13008c64af4fSJohn Polstra } 13018c64af4fSJohn Polstra } 13028c64af4fSJohn Polstra 13038c64af4fSJohn Polstra static void 13043ebc1248SPeter Wemm __elfN(putnote)(void *dst, size_t *off, const char *name, int type, 13058c64af4fSJohn Polstra const void *desc, size_t descsz) 13068c64af4fSJohn Polstra { 13078c64af4fSJohn Polstra Elf_Note note; 13088c64af4fSJohn Polstra 13098c64af4fSJohn Polstra note.n_namesz = strlen(name) + 1; 13108c64af4fSJohn Polstra note.n_descsz = descsz; 13118c64af4fSJohn Polstra note.n_type = type; 13128c64af4fSJohn Polstra if (dst != NULL) 13138c64af4fSJohn Polstra bcopy(¬e, (char *)dst + *off, sizeof note); 13148c64af4fSJohn Polstra *off += sizeof note; 13158c64af4fSJohn Polstra if (dst != NULL) 13168c64af4fSJohn Polstra bcopy(name, (char *)dst + *off, note.n_namesz); 13178c64af4fSJohn Polstra *off += roundup2(note.n_namesz, sizeof(Elf_Size)); 13188c64af4fSJohn Polstra if (dst != NULL) 13198c64af4fSJohn Polstra bcopy(desc, (char *)dst + *off, note.n_descsz); 13208c64af4fSJohn Polstra *off += roundup2(note.n_descsz, sizeof(Elf_Size)); 13218c64af4fSJohn Polstra } 13228c64af4fSJohn Polstra 13238c64af4fSJohn Polstra /* 132432c01de2SDmitry Chagin * Try to find the appropriate ABI-note section for checknote, 132532c01de2SDmitry Chagin * fetch the osreldate for binary from the ELF OSABI-note. Only the 132632c01de2SDmitry Chagin * first page of the image is searched, the same as for headers. 
132732c01de2SDmitry Chagin */ 132832c01de2SDmitry Chagin static boolean_t 132932c01de2SDmitry Chagin __elfN(check_note)(struct image_params *imgp, Elf_Brandnote *checknote, 133032c01de2SDmitry Chagin int32_t *osrel) 133132c01de2SDmitry Chagin { 133232c01de2SDmitry Chagin const Elf_Note *note, *note_end; 133332c01de2SDmitry Chagin const Elf32_Phdr *phdr, *pnote; 133432c01de2SDmitry Chagin const Elf32_Ehdr *hdr; 133532c01de2SDmitry Chagin const char *note_name; 133632c01de2SDmitry Chagin int i; 133732c01de2SDmitry Chagin 133832c01de2SDmitry Chagin pnote = NULL; 133932c01de2SDmitry Chagin hdr = (const Elf32_Ehdr *)imgp->image_header; 134032c01de2SDmitry Chagin phdr = (const Elf32_Phdr *)(imgp->image_header + hdr->e_phoff); 134132c01de2SDmitry Chagin 134232c01de2SDmitry Chagin for (i = 0; i < hdr->e_phnum; i++) { 134332c01de2SDmitry Chagin if (phdr[i].p_type == PT_NOTE) { 134432c01de2SDmitry Chagin pnote = &phdr[i]; 134532c01de2SDmitry Chagin break; 134632c01de2SDmitry Chagin } 134732c01de2SDmitry Chagin } 134832c01de2SDmitry Chagin 134932c01de2SDmitry Chagin if (pnote == NULL || pnote->p_offset >= PAGE_SIZE || 135032c01de2SDmitry Chagin pnote->p_offset + pnote->p_filesz >= PAGE_SIZE) 135132c01de2SDmitry Chagin return (FALSE); 135232c01de2SDmitry Chagin 135332c01de2SDmitry Chagin note = (const Elf_Note *)(imgp->image_header + pnote->p_offset); 135432c01de2SDmitry Chagin if (!aligned(note, Elf32_Addr)) 135532c01de2SDmitry Chagin return (FALSE); 135632c01de2SDmitry Chagin note_end = (const Elf_Note *)(imgp->image_header + 135732c01de2SDmitry Chagin pnote->p_offset + pnote->p_filesz); 135832c01de2SDmitry Chagin while (note < note_end) { 135932c01de2SDmitry Chagin if (note->n_namesz != checknote->hdr.n_namesz || 136032c01de2SDmitry Chagin note->n_descsz != checknote->hdr.n_descsz || 136132c01de2SDmitry Chagin note->n_type != checknote->hdr.n_type) 136232c01de2SDmitry Chagin goto nextnote; 136332c01de2SDmitry Chagin note_name = (const char *)(note + 1); 136432c01de2SDmitry 
Chagin if (strncmp(checknote->vendor, note_name, 136532c01de2SDmitry Chagin checknote->hdr.n_namesz) != 0) 136632c01de2SDmitry Chagin goto nextnote; 136732c01de2SDmitry Chagin 136832c01de2SDmitry Chagin /* 136932c01de2SDmitry Chagin * Fetch the osreldate for binary 137032c01de2SDmitry Chagin * from the ELF OSABI-note if necessary. 137132c01de2SDmitry Chagin */ 137232c01de2SDmitry Chagin if ((checknote->flags & BN_CAN_FETCH_OSREL) != 0 && 137332c01de2SDmitry Chagin osrel != NULL) 137432c01de2SDmitry Chagin *osrel = *(const int32_t *) (note_name + 137532c01de2SDmitry Chagin roundup2(checknote->hdr.n_namesz, 137632c01de2SDmitry Chagin sizeof(Elf32_Addr))); 137732c01de2SDmitry Chagin return (TRUE); 137832c01de2SDmitry Chagin 137932c01de2SDmitry Chagin nextnote: 138032c01de2SDmitry Chagin note = (const Elf_Note *)((const char *)(note + 1) + 138132c01de2SDmitry Chagin roundup2(note->n_namesz, sizeof(Elf32_Addr)) + 138232c01de2SDmitry Chagin roundup2(note->n_descsz, sizeof(Elf32_Addr))); 138332c01de2SDmitry Chagin } 138432c01de2SDmitry Chagin 138532c01de2SDmitry Chagin return (FALSE); 138632c01de2SDmitry Chagin } 138732c01de2SDmitry Chagin 138832c01de2SDmitry Chagin /* 1389e1743d02SSøren Schmidt * Tell kern_execve.c about it, with a little help from the linker. 1390e1743d02SSøren Schmidt */ 1391a360a43dSJake Burkholder static struct execsw __elfN(execsw) = { 1392a360a43dSJake Burkholder __CONCAT(exec_, __elfN(imgact)), 1393a360a43dSJake Burkholder __XSTRING(__CONCAT(ELF, __ELF_WORD_SIZE)) 1394a360a43dSJake Burkholder }; 1395a360a43dSJake Burkholder EXEC_SET(__CONCAT(elf, __ELF_WORD_SIZE), __elfN(execsw)); 1396