1e1743d02SSøren Schmidt /*- 221a3ee0eSDavid E. O'Brien * Copyright (c) 2000 David O'Brien 3e1743d02SSøren Schmidt * Copyright (c) 1995-1996 S�ren Schmidt 4e1743d02SSøren Schmidt * Copyright (c) 1996 Peter Wemm 5e1743d02SSøren Schmidt * All rights reserved. 6e1743d02SSøren Schmidt * 7e1743d02SSøren Schmidt * Redistribution and use in source and binary forms, with or without 8e1743d02SSøren Schmidt * modification, are permitted provided that the following conditions 9e1743d02SSøren Schmidt * are met: 10e1743d02SSøren Schmidt * 1. Redistributions of source code must retain the above copyright 11e1743d02SSøren Schmidt * notice, this list of conditions and the following disclaimer 12e1743d02SSøren Schmidt * in this position and unchanged. 13e1743d02SSøren Schmidt * 2. Redistributions in binary form must reproduce the above copyright 14e1743d02SSøren Schmidt * notice, this list of conditions and the following disclaimer in the 15e1743d02SSøren Schmidt * documentation and/or other materials provided with the distribution. 16e1743d02SSøren Schmidt * 3. The name of the author may not be used to endorse or promote products 1721dc7d4fSJens Schweikhardt * derived from this software without specific prior written permission 18e1743d02SSøren Schmidt * 19e1743d02SSøren Schmidt * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 20e1743d02SSøren Schmidt * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 21e1743d02SSøren Schmidt * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 22e1743d02SSøren Schmidt * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 23e1743d02SSøren Schmidt * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 24e1743d02SSøren Schmidt * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 25e1743d02SSøren Schmidt * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 26e1743d02SSøren Schmidt * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 27e1743d02SSøren Schmidt * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 28e1743d02SSøren Schmidt * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 29e1743d02SSøren Schmidt */ 30e1743d02SSøren Schmidt 31677b542eSDavid E. O'Brien #include <sys/cdefs.h> 32677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 33677b542eSDavid E. O'Brien 3462919d78SPeter Wemm #include "opt_compat.h" 35e7228204SAlfred Perlstein #include "opt_core.h" 3662919d78SPeter Wemm 37e1743d02SSøren Schmidt #include <sys/param.h> 38e1743d02SSøren Schmidt #include <sys/exec.h> 398c64af4fSJohn Polstra #include <sys/fcntl.h> 40e1743d02SSøren Schmidt #include <sys/imgact.h> 41e1743d02SSøren Schmidt #include <sys/imgact_elf.h> 42e1743d02SSøren Schmidt #include <sys/kernel.h> 43f34fa851SJohn Baldwin #include <sys/lock.h> 44e1743d02SSøren Schmidt #include <sys/malloc.h> 4568ff2a43SChristian S.J. Peron #include <sys/mount.h> 4635e0e5b3SJohn Baldwin #include <sys/mutex.h> 478c64af4fSJohn Polstra #include <sys/mman.h> 48a794e791SBruce Evans #include <sys/namei.h> 498c64af4fSJohn Polstra #include <sys/pioctl.h> 50a794e791SBruce Evans #include <sys/proc.h> 518c64af4fSJohn Polstra #include <sys/procfs.h> 528c64af4fSJohn Polstra #include <sys/resourcevar.h> 53da61b9a6SAlan Cox #include <sys/sf_buf.h> 5436240ea5SDoug Rabson #include <sys/systm.h> 55e1743d02SSøren Schmidt #include <sys/signalvar.h> 568c64af4fSJohn Polstra #include <sys/stat.h> 571005a129SJohn Baldwin #include <sys/sx.h> 588c64af4fSJohn Polstra #include <sys/syscall.h> 59e1743d02SSøren Schmidt #include <sys/sysctl.h> 608c64af4fSJohn Polstra #include <sys/sysent.h> 61a794e791SBruce Evans #include <sys/vnode.h> 62e7228204SAlfred Perlstein #include <sys/syslog.h> 63e7228204SAlfred Perlstein #include <sys/eventhandler.h> 64e7228204SAlfred Perlstein 65e7228204SAlfred Perlstein #include <net/zlib.h> 66e1743d02SSøren Schmidt 67e1743d02SSøren Schmidt #include <vm/vm.h> 68e1743d02SSøren Schmidt #include <vm/vm_kern.h> 69e1743d02SSøren Schmidt #include <vm/vm_param.h> 70e1743d02SSøren Schmidt #include <vm/pmap.h> 71e1743d02SSøren Schmidt #include <vm/vm_map.h> 720ff27d31SJohn Polstra #include <vm/vm_object.h> 73e1743d02SSøren Schmidt #include <vm/vm_extern.h> 74e1743d02SSøren Schmidt 7552c24af7SPeter Wemm #include <machine/elf.h> 76e1743d02SSøren Schmidt #include <machine/md_var.h> 77e1743d02SSøren Schmidt 7862919d78SPeter Wemm #if defined(COMPAT_IA32) && __ELF_WORD_SIZE == 32 7962919d78SPeter Wemm #include <machine/fpu.h> 8062919d78SPeter Wemm #include <compat/ia32/ia32_reg.h> 8162919d78SPeter Wemm #endif 8262919d78SPeter Wemm 83c815a20cSDavid E. O'Brien #define OLD_EI_BRAND 8 84c815a20cSDavid E. O'Brien 853ebc1248SPeter Wemm static int __elfN(check_header)(const Elf_Ehdr *hdr); 8632c01de2SDmitry Chagin static Elf_Brandinfo *__elfN(get_brandinfo)(struct image_params *imgp, 8732c01de2SDmitry Chagin const char *interp, int32_t *osrel); 883ebc1248SPeter Wemm static int __elfN(load_file)(struct proc *p, const char *file, u_long *addr, 893ebc1248SPeter Wemm u_long *entry, size_t pagesize); 90373d1a3fSAlan Cox static int __elfN(load_section)(struct vmspace *vmspace, vm_object_t object, 918c64af4fSJohn Polstra vm_offset_t offset, caddr_t vmaddr, size_t memsz, size_t filsz, 923ebc1248SPeter Wemm vm_prot_t prot, size_t pagesize); 933ebc1248SPeter Wemm static int __CONCAT(exec_, __elfN(imgact))(struct image_params *imgp); 9489ffc202SBjoern A. Zeeb static boolean_t __elfN(freebsd_trans_osrel)(const Elf_Note *note, 9589ffc202SBjoern A. Zeeb int32_t *osrel); 9689ffc202SBjoern A. Zeeb static boolean_t kfreebsd_trans_osrel(const Elf_Note *note, int32_t *osrel); 9732c01de2SDmitry Chagin static boolean_t __elfN(check_note)(struct image_params *imgp, 9832c01de2SDmitry Chagin Elf_Brandnote *checknote, int32_t *osrel); 99e1743d02SSøren Schmidt 100a360a43dSJake Burkholder SYSCTL_NODE(_kern, OID_AUTO, __CONCAT(elf, __ELF_WORD_SIZE), CTLFLAG_RW, 0, 101a360a43dSJake Burkholder ""); 102a360a43dSJake Burkholder 103e7228204SAlfred Perlstein #ifdef COMPRESS_USER_CORES 104e7228204SAlfred Perlstein static int compress_core(gzFile, char *, char *, unsigned int, 105e7228204SAlfred Perlstein struct thread * td); 106e7228204SAlfred Perlstein #define CORE_BUF_SIZE (16 * 1024) 107e7228204SAlfred Perlstein #endif 108e7228204SAlfred Perlstein 109e548a1d4SJake Burkholder int __elfN(fallback_brand) = -1; 110e548a1d4SJake Burkholder SYSCTL_INT(__CONCAT(_kern_elf, __ELF_WORD_SIZE), OID_AUTO, 111e548a1d4SJake Burkholder fallback_brand, CTLFLAG_RW, &__elfN(fallback_brand), 0, 112a360a43dSJake Burkholder __XSTRING(__CONCAT(ELF, __ELF_WORD_SIZE)) " brand of last resort"); 113a360a43dSJake Burkholder TUNABLE_INT("kern.elf" __XSTRING(__ELF_WORD_SIZE) ".fallback_brand", 114e548a1d4SJake Burkholder &__elfN(fallback_brand)); 115a360a43dSJake Burkholder 116551d79e1SMarcel Moolenaar static int elf_legacy_coredump = 0; 117a360a43dSJake Burkholder SYSCTL_INT(_debug, OID_AUTO, __elfN(legacy_coredump), CTLFLAG_RW, 118551d79e1SMarcel Moolenaar &elf_legacy_coredump, 0, ""); 119e1743d02SSøren Schmidt 1203ebc1248SPeter Wemm static Elf_Brandinfo *elf_brand_list[MAX_BRANDS]; 121e1743d02SSøren Schmidt 12293d1c728SKonstantin Belousov #define trunc_page_ps(va, ps) ((va) & ~(ps - 1)) 12393d1c728SKonstantin Belousov #define round_page_ps(va, ps) (((va) + (ps - 1)) & ~(ps - 1)) 12493d1c728SKonstantin Belousov #define aligned(a, t) (trunc_page_ps((u_long)(a), sizeof(t)) == (u_long)(a)) 12593d1c728SKonstantin Belousov 12632c01de2SDmitry Chagin static const char FREEBSD_ABI_VENDOR[] = "FreeBSD"; 12732c01de2SDmitry Chagin 12832c01de2SDmitry Chagin Elf_Brandnote __elfN(freebsd_brandnote) = { 12932c01de2SDmitry Chagin .hdr.n_namesz = sizeof(FREEBSD_ABI_VENDOR), 13032c01de2SDmitry Chagin .hdr.n_descsz = sizeof(int32_t), 13132c01de2SDmitry Chagin .hdr.n_type = 1, 13232c01de2SDmitry Chagin .vendor = FREEBSD_ABI_VENDOR, 13389ffc202SBjoern A. Zeeb .flags = BN_TRANSLATE_OSREL, 13489ffc202SBjoern A. Zeeb .trans_osrel = __elfN(freebsd_trans_osrel) 13532c01de2SDmitry Chagin }; 13632c01de2SDmitry Chagin 13789ffc202SBjoern A. Zeeb static boolean_t 13889ffc202SBjoern A. Zeeb __elfN(freebsd_trans_osrel)(const Elf_Note *note, int32_t *osrel) 13989ffc202SBjoern A. Zeeb { 14089ffc202SBjoern A. Zeeb uintptr_t p; 14189ffc202SBjoern A. Zeeb 14289ffc202SBjoern A. Zeeb p = (uintptr_t)(note + 1); 14389ffc202SBjoern A. Zeeb p += roundup2(note->n_namesz, sizeof(Elf32_Addr)); 14489ffc202SBjoern A. Zeeb *osrel = *(const int32_t *)(p); 14589ffc202SBjoern A. Zeeb 14689ffc202SBjoern A. Zeeb return (TRUE); 14789ffc202SBjoern A. Zeeb } 14889ffc202SBjoern A. Zeeb 14989ffc202SBjoern A. Zeeb static const char GNU_ABI_VENDOR[] = "GNU"; 15089ffc202SBjoern A. Zeeb static int GNU_KFREEBSD_ABI_DESC = 3; 15189ffc202SBjoern A. Zeeb 15289ffc202SBjoern A. Zeeb Elf_Brandnote __elfN(kfreebsd_brandnote) = { 15389ffc202SBjoern A. Zeeb .hdr.n_namesz = sizeof(GNU_ABI_VENDOR), 15489ffc202SBjoern A. Zeeb .hdr.n_descsz = 16, /* XXX at least 16 */ 15589ffc202SBjoern A. Zeeb .hdr.n_type = 1, 15689ffc202SBjoern A. Zeeb .vendor = GNU_ABI_VENDOR, 15789ffc202SBjoern A. Zeeb .flags = BN_TRANSLATE_OSREL, 15889ffc202SBjoern A. Zeeb .trans_osrel = kfreebsd_trans_osrel 15989ffc202SBjoern A. Zeeb }; 16089ffc202SBjoern A. Zeeb 16189ffc202SBjoern A. Zeeb static boolean_t 16289ffc202SBjoern A. Zeeb kfreebsd_trans_osrel(const Elf_Note *note, int32_t *osrel) 16389ffc202SBjoern A. Zeeb { 16489ffc202SBjoern A. Zeeb const Elf32_Word *desc; 16589ffc202SBjoern A. Zeeb uintptr_t p; 16689ffc202SBjoern A. Zeeb 16789ffc202SBjoern A. Zeeb p = (uintptr_t)(note + 1); 16889ffc202SBjoern A. Zeeb p += roundup2(note->n_namesz, sizeof(Elf32_Addr)); 16989ffc202SBjoern A. Zeeb 17089ffc202SBjoern A. Zeeb desc = (const Elf32_Word *)p; 17189ffc202SBjoern A. Zeeb if (desc[0] != GNU_KFREEBSD_ABI_DESC) 17289ffc202SBjoern A. Zeeb return (FALSE); 17389ffc202SBjoern A. Zeeb 17489ffc202SBjoern A. Zeeb /* 17589ffc202SBjoern A. Zeeb * Debian GNU/kFreeBSD embed the earliest compatible kernel version 17689ffc202SBjoern A. Zeeb * (__FreeBSD_version: <major><two digit minor>Rxx) in the LSB way. 17789ffc202SBjoern A. Zeeb */ 17889ffc202SBjoern A. Zeeb *osrel = desc[1] * 100000 + desc[2] * 1000 + desc[3]; 17989ffc202SBjoern A. Zeeb 18089ffc202SBjoern A. Zeeb return (TRUE); 18189ffc202SBjoern A. Zeeb } 18289ffc202SBjoern A. Zeeb 183e1743d02SSøren Schmidt int 1843ebc1248SPeter Wemm __elfN(insert_brand_entry)(Elf_Brandinfo *entry) 185e1743d02SSøren Schmidt { 186e1743d02SSøren Schmidt int i; 187e1743d02SSøren Schmidt 1883ebc1248SPeter Wemm for (i = 0; i < MAX_BRANDS; i++) { 189ea5a2b2eSSøren Schmidt if (elf_brand_list[i] == NULL) { 190ea5a2b2eSSøren Schmidt elf_brand_list[i] = entry; 191e1743d02SSøren Schmidt break; 192e1743d02SSøren Schmidt } 193e1743d02SSøren Schmidt } 194925c8b5bSBjoern A. Zeeb if (i == MAX_BRANDS) { 195925c8b5bSBjoern A. Zeeb printf("WARNING: %s: could not insert brandinfo entry: %p\n", 196925c8b5bSBjoern A. Zeeb __func__, entry); 197a7cddfedSJake Burkholder return (-1); 198925c8b5bSBjoern A. Zeeb } 199a7cddfedSJake Burkholder return (0); 200e1743d02SSøren Schmidt } 201e1743d02SSøren Schmidt 202e1743d02SSøren Schmidt int 2033ebc1248SPeter Wemm __elfN(remove_brand_entry)(Elf_Brandinfo *entry) 204e1743d02SSøren Schmidt { 205e1743d02SSøren Schmidt int i; 206e1743d02SSøren Schmidt 2073ebc1248SPeter Wemm for (i = 0; i < MAX_BRANDS; i++) { 208ea5a2b2eSSøren Schmidt if (elf_brand_list[i] == entry) { 209ea5a2b2eSSøren Schmidt elf_brand_list[i] = NULL; 210e1743d02SSøren Schmidt break; 211e1743d02SSøren Schmidt } 212e1743d02SSøren Schmidt } 213ea5a2b2eSSøren Schmidt if (i == MAX_BRANDS) 214a7cddfedSJake Burkholder return (-1); 215a7cddfedSJake Burkholder return (0); 216e1743d02SSøren Schmidt } 217e1743d02SSøren Schmidt 218096977faSMark Newton int 2193ebc1248SPeter Wemm __elfN(brand_inuse)(Elf_Brandinfo *entry) 220096977faSMark Newton { 221096977faSMark Newton struct proc *p; 222553629ebSJake Burkholder int rval = FALSE; 223096977faSMark Newton 2241005a129SJohn Baldwin sx_slock(&allproc_lock); 2254f506694SXin LI FOREACH_PROC_IN_SYSTEM(p) { 226553629ebSJake Burkholder if (p->p_sysent == entry->sysvec) { 227553629ebSJake Burkholder rval = TRUE; 228553629ebSJake Burkholder break; 229096977faSMark Newton } 230553629ebSJake Burkholder } 2311005a129SJohn Baldwin sx_sunlock(&allproc_lock); 232096977faSMark Newton 233553629ebSJake Burkholder return (rval); 234096977faSMark Newton } 235096977faSMark Newton 2365fe3ed62SJake Burkholder static Elf_Brandinfo * 23732c01de2SDmitry Chagin __elfN(get_brandinfo)(struct image_params *imgp, const char *interp, 23832c01de2SDmitry Chagin int32_t *osrel) 2395fe3ed62SJake Burkholder { 24032c01de2SDmitry Chagin const Elf_Ehdr *hdr = (const Elf_Ehdr *)imgp->image_header; 2415fe3ed62SJake Burkholder Elf_Brandinfo *bi; 24232c01de2SDmitry Chagin boolean_t ret; 2435fe3ed62SJake Burkholder int i; 2445fe3ed62SJake Burkholder 2455fe3ed62SJake Burkholder /* 24632c01de2SDmitry Chagin * We support four types of branding -- (1) the ELF EI_OSABI field 2475fe3ed62SJake Burkholder * that SCO added to the ELF spec, (2) FreeBSD 3.x's traditional string 24832c01de2SDmitry Chagin * branding w/in the ELF header, (3) path of the `interp_path' 24932c01de2SDmitry Chagin * field, and (4) the ".note.ABI-tag" ELF section. 2505fe3ed62SJake Burkholder */ 2515fe3ed62SJake Burkholder 25232c01de2SDmitry Chagin /* Look for an ".note.ABI-tag" ELF section */ 25332c01de2SDmitry Chagin for (i = 0; i < MAX_BRANDS; i++) { 25432c01de2SDmitry Chagin bi = elf_brand_list[i]; 255ecc2fda8SBjoern A. Zeeb if (bi == NULL) 256ecc2fda8SBjoern A. Zeeb continue; 257ecc2fda8SBjoern A. Zeeb if (hdr->e_machine == bi->machine && (bi->flags & 258ecc2fda8SBjoern A. Zeeb (BI_BRAND_NOTE|BI_BRAND_NOTE_MANDATORY)) != 0) { 25932c01de2SDmitry Chagin ret = __elfN(check_note)(imgp, bi->brand_note, osrel); 26032c01de2SDmitry Chagin if (ret) 26132c01de2SDmitry Chagin return (bi); 26232c01de2SDmitry Chagin } 26332c01de2SDmitry Chagin } 26432c01de2SDmitry Chagin 2655fe3ed62SJake Burkholder /* If the executable has a brand, search for it in the brand list. */ 2665fe3ed62SJake Burkholder for (i = 0; i < MAX_BRANDS; i++) { 2675fe3ed62SJake Burkholder bi = elf_brand_list[i]; 268ecc2fda8SBjoern A. Zeeb if (bi == NULL || bi->flags & BI_BRAND_NOTE_MANDATORY) 269ecc2fda8SBjoern A. Zeeb continue; 270ecc2fda8SBjoern A. Zeeb if (hdr->e_machine == bi->machine && 2715fe3ed62SJake Burkholder (hdr->e_ident[EI_OSABI] == bi->brand || 2725fe3ed62SJake Burkholder strncmp((const char *)&hdr->e_ident[OLD_EI_BRAND], 2735fe3ed62SJake Burkholder bi->compat_3_brand, strlen(bi->compat_3_brand)) == 0)) 2745fe3ed62SJake Burkholder return (bi); 2755fe3ed62SJake Burkholder } 2765fe3ed62SJake Burkholder 2775fe3ed62SJake Burkholder /* Lacking a known brand, search for a recognized interpreter. */ 2785fe3ed62SJake Burkholder if (interp != NULL) { 2795fe3ed62SJake Burkholder for (i = 0; i < MAX_BRANDS; i++) { 2805fe3ed62SJake Burkholder bi = elf_brand_list[i]; 281ecc2fda8SBjoern A. Zeeb if (bi == NULL || bi->flags & BI_BRAND_NOTE_MANDATORY) 282ecc2fda8SBjoern A. Zeeb continue; 283ecc2fda8SBjoern A. Zeeb if (hdr->e_machine == bi->machine && 2845fe3ed62SJake Burkholder strcmp(interp, bi->interp_path) == 0) 2855fe3ed62SJake Burkholder return (bi); 2865fe3ed62SJake Burkholder } 2875fe3ed62SJake Burkholder } 2885fe3ed62SJake Burkholder 2895fe3ed62SJake Burkholder /* Lacking a recognized interpreter, try the default brand */ 2905fe3ed62SJake Burkholder for (i = 0; i < MAX_BRANDS; i++) { 2915fe3ed62SJake Burkholder bi = elf_brand_list[i]; 292ecc2fda8SBjoern A. Zeeb if (bi == NULL || bi->flags & BI_BRAND_NOTE_MANDATORY) 293ecc2fda8SBjoern A. Zeeb continue; 294ecc2fda8SBjoern A. Zeeb if (hdr->e_machine == bi->machine && 295e548a1d4SJake Burkholder __elfN(fallback_brand) == bi->brand) 2965fe3ed62SJake Burkholder return (bi); 2975fe3ed62SJake Burkholder } 2985fe3ed62SJake Burkholder return (NULL); 2995fe3ed62SJake Burkholder } 3005fe3ed62SJake Burkholder 301e1743d02SSøren Schmidt static int 3023ebc1248SPeter Wemm __elfN(check_header)(const Elf_Ehdr *hdr) 303e1743d02SSøren Schmidt { 304d0ca7c29SPeter Wemm Elf_Brandinfo *bi; 3053ebc1248SPeter Wemm int i; 3063ebc1248SPeter Wemm 30752c24af7SPeter Wemm if (!IS_ELF(*hdr) || 30852c24af7SPeter Wemm hdr->e_ident[EI_CLASS] != ELF_TARG_CLASS || 30952c24af7SPeter Wemm hdr->e_ident[EI_DATA] != ELF_TARG_DATA || 3103dc19c46SJacques Vidrine hdr->e_ident[EI_VERSION] != EV_CURRENT || 3113dc19c46SJacques Vidrine hdr->e_phentsize != sizeof(Elf_Phdr) || 3123dc19c46SJacques Vidrine hdr->e_version != ELF_TARG_VER) 313a7cddfedSJake Burkholder return (ENOEXEC); 314e1743d02SSøren Schmidt 3153ebc1248SPeter Wemm /* 3163ebc1248SPeter Wemm * Make sure we have at least one brand for this machine. 3173ebc1248SPeter Wemm */ 3183ebc1248SPeter Wemm 3193ebc1248SPeter Wemm for (i = 0; i < MAX_BRANDS; i++) { 320d0ca7c29SPeter Wemm bi = elf_brand_list[i]; 321d0ca7c29SPeter Wemm if (bi != NULL && bi->machine == hdr->e_machine) 3223ebc1248SPeter Wemm break; 3233ebc1248SPeter Wemm } 3243ebc1248SPeter Wemm if (i == MAX_BRANDS) 325a7cddfedSJake Burkholder return (ENOEXEC); 326e1743d02SSøren Schmidt 327a7cddfedSJake Burkholder return (0); 328e1743d02SSøren Schmidt } 329e1743d02SSøren Schmidt 330e1743d02SSøren Schmidt static int 3313ebc1248SPeter Wemm __elfN(map_partial)(vm_map_t map, vm_object_t object, vm_ooffset_t offset, 332ff6f03c7SAlan Cox vm_offset_t start, vm_offset_t end, vm_prot_t prot) 3333ebc1248SPeter Wemm { 334da61b9a6SAlan Cox struct sf_buf *sf; 335da61b9a6SAlan Cox int error; 3363ebc1248SPeter Wemm vm_offset_t off; 3373ebc1248SPeter Wemm 3383ebc1248SPeter Wemm /* 3393ebc1248SPeter Wemm * Create the page if it doesn't exist yet. Ignore errors. 3403ebc1248SPeter Wemm */ 3413ebc1248SPeter Wemm vm_map_lock(map); 342ff6f03c7SAlan Cox vm_map_insert(map, NULL, 0, trunc_page(start), round_page(end), 343ff6f03c7SAlan Cox VM_PROT_ALL, VM_PROT_ALL, 0); 3443ebc1248SPeter Wemm vm_map_unlock(map); 3453ebc1248SPeter Wemm 3463ebc1248SPeter Wemm /* 3473ebc1248SPeter Wemm * Find the page from the underlying object. 3483ebc1248SPeter Wemm */ 3493ebc1248SPeter Wemm if (object) { 350da61b9a6SAlan Cox sf = vm_imgact_map_page(object, offset); 351da61b9a6SAlan Cox if (sf == NULL) 352da61b9a6SAlan Cox return (KERN_FAILURE); 3533ebc1248SPeter Wemm off = offset - trunc_page(offset); 354da61b9a6SAlan Cox error = copyout((caddr_t)sf_buf_kva(sf) + off, (caddr_t)start, 355ca0387efSJake Burkholder end - start); 356da61b9a6SAlan Cox vm_imgact_unmap_page(sf); 3573ebc1248SPeter Wemm if (error) { 358a7cddfedSJake Burkholder return (KERN_FAILURE); 3593ebc1248SPeter Wemm } 3603ebc1248SPeter Wemm } 3613ebc1248SPeter Wemm 362a7cddfedSJake Burkholder return (KERN_SUCCESS); 3633ebc1248SPeter Wemm } 3643ebc1248SPeter Wemm 3653ebc1248SPeter Wemm static int 3663ebc1248SPeter Wemm __elfN(map_insert)(vm_map_t map, vm_object_t object, vm_ooffset_t offset, 367ff6f03c7SAlan Cox vm_offset_t start, vm_offset_t end, vm_prot_t prot, int cow) 3683ebc1248SPeter Wemm { 369da61b9a6SAlan Cox struct sf_buf *sf; 370da61b9a6SAlan Cox vm_offset_t off; 371a063facbSMarcel Moolenaar vm_size_t sz; 372a063facbSMarcel Moolenaar int error, rv; 3733ebc1248SPeter Wemm 3743ebc1248SPeter Wemm if (start != trunc_page(start)) { 37581f223caSJake Burkholder rv = __elfN(map_partial)(map, object, offset, start, 376ff6f03c7SAlan Cox round_page(start), prot); 3773ebc1248SPeter Wemm if (rv) 378a7cddfedSJake Burkholder return (rv); 3793ebc1248SPeter Wemm offset += round_page(start) - start; 3803ebc1248SPeter Wemm start = round_page(start); 3813ebc1248SPeter Wemm } 3823ebc1248SPeter Wemm if (end != round_page(end)) { 38381f223caSJake Burkholder rv = __elfN(map_partial)(map, object, offset + 384ff6f03c7SAlan Cox trunc_page(end) - start, trunc_page(end), end, prot); 3853ebc1248SPeter Wemm if (rv) 386a7cddfedSJake Burkholder return (rv); 3873ebc1248SPeter Wemm end = trunc_page(end); 3883ebc1248SPeter Wemm } 3893ebc1248SPeter Wemm if (end > start) { 3903ebc1248SPeter Wemm if (offset & PAGE_MASK) { 3913ebc1248SPeter Wemm /* 3923ebc1248SPeter Wemm * The mapping is not page aligned. This means we have 3933ebc1248SPeter Wemm * to copy the data. Sigh. 3943ebc1248SPeter Wemm */ 395584716b0SAlan Cox rv = vm_map_find(map, NULL, 0, &start, end - start, 396ff6f03c7SAlan Cox FALSE, prot | VM_PROT_WRITE, VM_PROT_ALL, 0); 3973ebc1248SPeter Wemm if (rv) 398a7cddfedSJake Burkholder return (rv); 399da61b9a6SAlan Cox if (object == NULL) 400da61b9a6SAlan Cox return (KERN_SUCCESS); 401da61b9a6SAlan Cox for (; start < end; start += sz) { 402da61b9a6SAlan Cox sf = vm_imgact_map_page(object, offset); 403da61b9a6SAlan Cox if (sf == NULL) 404da61b9a6SAlan Cox return (KERN_FAILURE); 4053ebc1248SPeter Wemm off = offset - trunc_page(offset); 4063ebc1248SPeter Wemm sz = end - start; 407da61b9a6SAlan Cox if (sz > PAGE_SIZE - off) 408da61b9a6SAlan Cox sz = PAGE_SIZE - off; 409da61b9a6SAlan Cox error = copyout((caddr_t)sf_buf_kva(sf) + off, 4103ebc1248SPeter Wemm (caddr_t)start, sz); 411da61b9a6SAlan Cox vm_imgact_unmap_page(sf); 4123ebc1248SPeter Wemm if (error) { 413a7cddfedSJake Burkholder return (KERN_FAILURE); 4143ebc1248SPeter Wemm } 415da61b9a6SAlan Cox offset += sz; 4163ebc1248SPeter Wemm } 4173ebc1248SPeter Wemm rv = KERN_SUCCESS; 4183ebc1248SPeter Wemm } else { 419e5e6093bSAlan Cox vm_object_reference(object); 4203ebc1248SPeter Wemm vm_map_lock(map); 4213ebc1248SPeter Wemm rv = vm_map_insert(map, object, offset, start, end, 422ff6f03c7SAlan Cox prot, VM_PROT_ALL, cow); 4233ebc1248SPeter Wemm vm_map_unlock(map); 424e5e6093bSAlan Cox if (rv != KERN_SUCCESS) 425e5e6093bSAlan Cox vm_object_deallocate(object); 4263ebc1248SPeter Wemm } 427a7cddfedSJake Burkholder return (rv); 4283ebc1248SPeter Wemm } else { 429a7cddfedSJake Burkholder return (KERN_SUCCESS); 4303ebc1248SPeter Wemm } 4313ebc1248SPeter Wemm } 4323ebc1248SPeter Wemm 4333ebc1248SPeter Wemm static int 434373d1a3fSAlan Cox __elfN(load_section)(struct vmspace *vmspace, 435373d1a3fSAlan Cox vm_object_t object, vm_offset_t offset, 4363ebc1248SPeter Wemm caddr_t vmaddr, size_t memsz, size_t filsz, vm_prot_t prot, 4373ebc1248SPeter Wemm size_t pagesize) 438e1743d02SSøren Schmidt { 439da61b9a6SAlan Cox struct sf_buf *sf; 440e1743d02SSøren Schmidt size_t map_len; 441e1743d02SSøren Schmidt vm_offset_t map_addr; 442fa7dd9c5SMatthew Dillon int error, rv, cow; 443e1743d02SSøren Schmidt size_t copy_len; 44452c24af7SPeter Wemm vm_offset_t file_addr; 44552c24af7SPeter Wemm 44625ead034SBrian Feldman /* 44725ead034SBrian Feldman * It's necessary to fail if the filsz + offset taken from the 44825ead034SBrian Feldman * header is greater than the actual file pager object's size. 44925ead034SBrian Feldman * If we were to allow this, then the vm_map_find() below would 45025ead034SBrian Feldman * walk right off the end of the file object and into the ether. 45125ead034SBrian Feldman * 45225ead034SBrian Feldman * While I'm here, might as well check for something else that 45325ead034SBrian Feldman * is invalid: filsz cannot be greater than memsz. 45425ead034SBrian Feldman */ 45525ead034SBrian Feldman if ((off_t)filsz + offset > object->un_pager.vnp.vnp_size || 45625ead034SBrian Feldman filsz > memsz) { 45725ead034SBrian Feldman uprintf("elf_load_section: truncated ELF file\n"); 45825ead034SBrian Feldman return (ENOEXEC); 45925ead034SBrian Feldman } 46025ead034SBrian Feldman 4613ebc1248SPeter Wemm map_addr = trunc_page_ps((vm_offset_t)vmaddr, pagesize); 4623ebc1248SPeter Wemm file_addr = trunc_page_ps(offset, pagesize); 463e1743d02SSøren Schmidt 464e1743d02SSøren Schmidt /* 46552c24af7SPeter Wemm * We have two choices. We can either clear the data in the last page 46652c24af7SPeter Wemm * of an oversized mapping, or we can start the anon mapping a page 46752c24af7SPeter Wemm * early and copy the initialized data into that first page. We 46852c24af7SPeter Wemm * choose the second.. 46952c24af7SPeter Wemm */ 47052c24af7SPeter Wemm if (memsz > filsz) 4713ebc1248SPeter Wemm map_len = trunc_page_ps(offset + filsz, pagesize) - file_addr; 47252c24af7SPeter Wemm else 4733ebc1248SPeter Wemm map_len = round_page_ps(offset + filsz, pagesize) - file_addr; 47452c24af7SPeter Wemm 47552c24af7SPeter Wemm if (map_len != 0) { 476fa7dd9c5SMatthew Dillon /* cow flags: don't dump readonly sections in core */ 477fa7dd9c5SMatthew Dillon cow = MAP_COPY_ON_WRITE | MAP_PREFAULT | 478fa7dd9c5SMatthew Dillon (prot & VM_PROT_WRITE ? 0 : MAP_DISABLE_COREDUMP); 479fa7dd9c5SMatthew Dillon 4803ebc1248SPeter Wemm rv = __elfN(map_insert)(&vmspace->vm_map, 48152c24af7SPeter Wemm object, 48252c24af7SPeter Wemm file_addr, /* file offset */ 48352c24af7SPeter Wemm map_addr, /* virtual start */ 48452c24af7SPeter Wemm map_addr + map_len,/* virtual end */ 48552c24af7SPeter Wemm prot, 486fa7dd9c5SMatthew Dillon cow); 487e5e6093bSAlan Cox if (rv != KERN_SUCCESS) 488a7cddfedSJake Burkholder return (EINVAL); 48952c24af7SPeter Wemm 49052c24af7SPeter Wemm /* we can stop now if we've covered it all */ 49123955314SAlfred Perlstein if (memsz == filsz) { 492a7cddfedSJake Burkholder return (0); 49352c24af7SPeter Wemm } 49423955314SAlfred Perlstein } 49552c24af7SPeter Wemm 49652c24af7SPeter Wemm 49752c24af7SPeter Wemm /* 49852c24af7SPeter Wemm * We have to get the remaining bit of the file into the first part 49952c24af7SPeter Wemm * of the oversized map segment. This is normally because the .data 50052c24af7SPeter Wemm * segment in the file is extended to provide bss. It's a neat idea 50152c24af7SPeter Wemm * to try and save a page, but it's a pain in the behind to implement. 502e1743d02SSøren Schmidt */ 5033ebc1248SPeter Wemm copy_len = (offset + filsz) - trunc_page_ps(offset + filsz, pagesize); 5043ebc1248SPeter Wemm map_addr = trunc_page_ps((vm_offset_t)vmaddr + filsz, pagesize); 505ca0387efSJake Burkholder map_len = round_page_ps((vm_offset_t)vmaddr + memsz, pagesize) - 506ca0387efSJake Burkholder map_addr; 507e1743d02SSøren Schmidt 50852c24af7SPeter Wemm /* This had damn well better be true! */ 5098191d577SPeter Wemm if (map_len != 0) { 51081f223caSJake Burkholder rv = __elfN(map_insert)(&vmspace->vm_map, NULL, 0, map_addr, 511ff6f03c7SAlan Cox map_addr + map_len, VM_PROT_ALL, 0); 51223955314SAlfred Perlstein if (rv != KERN_SUCCESS) { 513a7cddfedSJake Burkholder return (EINVAL); 5148191d577SPeter Wemm } 51523955314SAlfred Perlstein } 516e1743d02SSøren Schmidt 51752c24af7SPeter Wemm if (copy_len != 0) { 5183ebc1248SPeter Wemm vm_offset_t off; 519da61b9a6SAlan Cox 520da61b9a6SAlan Cox sf = vm_imgact_map_page(object, offset + filsz); 521da61b9a6SAlan Cox if (sf == NULL) 522da61b9a6SAlan Cox return (EIO); 523e1743d02SSøren Schmidt 52452c24af7SPeter Wemm /* send the page fragment to user space */ 52581f223caSJake Burkholder off = trunc_page_ps(offset + filsz, pagesize) - 52681f223caSJake Burkholder trunc_page(offset + filsz); 527da61b9a6SAlan Cox error = copyout((caddr_t)sf_buf_kva(sf) + off, 528da61b9a6SAlan Cox (caddr_t)map_addr, copy_len); 529da61b9a6SAlan Cox vm_imgact_unmap_page(sf); 53023955314SAlfred Perlstein if (error) { 53152c24af7SPeter Wemm return (error); 53252c24af7SPeter Wemm } 53323955314SAlfred Perlstein } 534e1743d02SSøren Schmidt 535e1743d02SSøren Schmidt /* 5363ebc1248SPeter Wemm * set it to the specified protection. 5373ebc1248SPeter Wemm * XXX had better undo the damage from pasting over the cracks here! 538e1743d02SSøren Schmidt */ 5393ebc1248SPeter Wemm vm_map_protect(&vmspace->vm_map, trunc_page(map_addr), 5403ebc1248SPeter Wemm round_page(map_addr + map_len), prot, FALSE); 5418191d577SPeter Wemm 542ff6f03c7SAlan Cox return (0); 543e1743d02SSøren Schmidt } 544e1743d02SSøren Schmidt 545c33fe779SJohn Polstra /* 546c33fe779SJohn Polstra * Load the file "file" into memory. It may be either a shared object 547c33fe779SJohn Polstra * or an executable. 548c33fe779SJohn Polstra * 549c33fe779SJohn Polstra * The "addr" reference parameter is in/out. On entry, it specifies 550c33fe779SJohn Polstra * the address where a shared object should be loaded. If the file is 551c33fe779SJohn Polstra * an executable, this value is ignored. On exit, "addr" specifies 552c33fe779SJohn Polstra * where the file was actually loaded. 553c33fe779SJohn Polstra * 554c33fe779SJohn Polstra * The "entry" reference parameter is out only. On exit, it specifies 555c33fe779SJohn Polstra * the entry point for the loaded file. 556c33fe779SJohn Polstra */ 557e1743d02SSøren Schmidt static int 5583ebc1248SPeter Wemm __elfN(load_file)(struct proc *p, const char *file, u_long *addr, 5593ebc1248SPeter Wemm u_long *entry, size_t pagesize) 560e1743d02SSøren Schmidt { 561911c2be0SMark Peek struct { 562911c2be0SMark Peek struct nameidata nd; 563911c2be0SMark Peek struct vattr attr; 564911c2be0SMark Peek struct image_params image_params; 565911c2be0SMark Peek } *tempdata; 566d254af07SMatthew Dillon const Elf_Ehdr *hdr = NULL; 567d254af07SMatthew Dillon const Elf_Phdr *phdr = NULL; 568911c2be0SMark Peek struct nameidata *nd; 569e1743d02SSøren Schmidt struct vmspace *vmspace = p->p_vmspace; 570911c2be0SMark Peek struct vattr *attr; 571911c2be0SMark Peek struct image_params *imgp; 57252c24af7SPeter Wemm vm_prot_t prot; 573c33fe779SJohn Polstra u_long rbase; 574c33fe779SJohn Polstra u_long base_addr = 0; 57568ff2a43SChristian S.J. Peron int vfslocked, error, i, numsegs; 576e1743d02SSøren Schmidt 577a163d034SWarner Losh tempdata = malloc(sizeof(*tempdata), M_TEMP, M_WAITOK); 578911c2be0SMark Peek nd = &tempdata->nd; 579911c2be0SMark Peek attr = &tempdata->attr; 580911c2be0SMark Peek imgp = &tempdata->image_params; 581911c2be0SMark Peek 582c8a79999SPeter Wemm /* 583c8a79999SPeter Wemm * Initialize part of the common data 584c8a79999SPeter Wemm */ 585c8a79999SPeter Wemm imgp->proc = p; 586911c2be0SMark Peek imgp->attr = attr; 587c8a79999SPeter Wemm imgp->firstpage = NULL; 58859c8bc40SAlan Cox imgp->image_header = NULL; 5890b2ed1aeSJeff Roberson imgp->object = NULL; 5906d7bdc8dSRobert Watson imgp->execlabel = NULL; 591c8a79999SPeter Wemm 59268ff2a43SChristian S.J. Peron NDINIT(nd, LOOKUP, MPSAFE|LOCKLEAF|FOLLOW, UIO_SYSSPACE, file, 59368ff2a43SChristian S.J. Peron curthread); 59468ff2a43SChristian S.J. Peron vfslocked = 0; 595911c2be0SMark Peek if ((error = namei(nd)) != 0) { 596911c2be0SMark Peek nd->ni_vp = NULL; 597e1743d02SSøren Schmidt goto fail; 598e1743d02SSøren Schmidt } 59968ff2a43SChristian S.J. Peron vfslocked = NDHASGIANT(nd); 600911c2be0SMark Peek NDFREE(nd, NDF_ONLY_PNBUF); 601911c2be0SMark Peek imgp->vp = nd->ni_vp; 602c8a79999SPeter Wemm 603e1743d02SSøren Schmidt /* 604e1743d02SSøren Schmidt * Check permissions, modes, uid, etc on the file, and "open" it. 605e1743d02SSøren Schmidt */ 606c8a79999SPeter Wemm error = exec_check_permissions(imgp); 607373d1a3fSAlan Cox if (error) 608c8a79999SPeter Wemm goto fail; 609e1743d02SSøren Schmidt 610c8a79999SPeter Wemm error = exec_map_first_page(imgp); 611373d1a3fSAlan Cox if (error) 612373d1a3fSAlan Cox goto fail; 613373d1a3fSAlan Cox 61425ead034SBrian Feldman /* 61525ead034SBrian Feldman * Also make certain that the interpreter stays the same, so set 616e6e370a7SJeff Roberson * its VV_TEXT flag, too. 61725ead034SBrian Feldman */ 618e6e370a7SJeff Roberson nd->ni_vp->v_vflag |= VV_TEXT; 619e6e370a7SJeff Roberson 6208516dd18SPoul-Henning Kamp imgp->object = nd->ni_vp->v_object; 621e1743d02SSøren Schmidt 622d254af07SMatthew Dillon hdr = (const Elf_Ehdr *)imgp->image_header; 6233ebc1248SPeter Wemm if ((error = __elfN(check_header)(hdr)) != 0) 624e1743d02SSøren Schmidt goto fail; 625c33fe779SJohn Polstra if (hdr->e_type == ET_DYN) 626c33fe779SJohn Polstra rbase = *addr; 627c33fe779SJohn Polstra else if (hdr->e_type == ET_EXEC) 628c33fe779SJohn Polstra rbase = 0; 629c33fe779SJohn Polstra else { 630c33fe779SJohn Polstra error = ENOEXEC; 631c33fe779SJohn Polstra goto fail; 632c33fe779SJohn Polstra } 633e1743d02SSøren Schmidt 634c8a79999SPeter Wemm /* Only support headers that fit within first page for now */ 6353dc19c46SJacques Vidrine /* (multiplication of two Elf_Half fields will not overflow) */ 63652c24af7SPeter Wemm if ((hdr->e_phoff > PAGE_SIZE) || 6373dc19c46SJacques Vidrine (hdr->e_phentsize * hdr->e_phnum) > PAGE_SIZE - hdr->e_phoff) { 638c8a79999SPeter Wemm error = ENOEXEC; 639e1743d02SSøren Schmidt goto fail; 640c8a79999SPeter Wemm } 641c8a79999SPeter Wemm 642d254af07SMatthew Dillon phdr = (const Elf_Phdr *)(imgp->image_header + hdr->e_phoff); 64393d1c728SKonstantin Belousov if (!aligned(phdr, Elf_Addr)) { 64493d1c728SKonstantin Belousov error = ENOEXEC; 64593d1c728SKonstantin Belousov goto fail; 64693d1c728SKonstantin Belousov } 647e1743d02SSøren Schmidt 648c33fe779SJohn Polstra for (i = 0, numsegs = 0; i < hdr->e_phnum; i++) { 6495b33842aSKonstantin Belousov if (phdr[i].p_type == PT_LOAD && phdr[i].p_memsz != 0) { 6505b33842aSKonstantin Belousov /* Loadable segment */ 65152c24af7SPeter Wemm prot = 0; 652e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_X) 653e1743d02SSøren Schmidt prot |= VM_PROT_EXECUTE; 654e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_W) 655e1743d02SSøren Schmidt prot |= VM_PROT_WRITE; 656e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_R) 657e1743d02SSøren Schmidt prot |= VM_PROT_READ; 658e1743d02SSøren Schmidt 659373d1a3fSAlan Cox if ((error = __elfN(load_section)(vmspace, 660373d1a3fSAlan Cox imgp->object, phdr[i].p_offset, 66181f223caSJake Burkholder (caddr_t)(uintptr_t)phdr[i].p_vaddr + rbase, 66281f223caSJake Burkholder phdr[i].p_memsz, phdr[i].p_filesz, prot, 66381f223caSJake Burkholder pagesize)) != 0) 664e1743d02SSøren Schmidt goto fail; 665e1743d02SSøren Schmidt /* 666c33fe779SJohn Polstra * Establish the base address if this is the 667c33fe779SJohn Polstra * first segment. 668e1743d02SSøren Schmidt */ 669c33fe779SJohn Polstra if (numsegs == 0) 670ca0387efSJake Burkholder base_addr = trunc_page(phdr[i].p_vaddr + 671ca0387efSJake Burkholder rbase); 672c33fe779SJohn Polstra numsegs++; 673e1743d02SSøren Schmidt } 674e1743d02SSøren Schmidt } 675c33fe779SJohn Polstra *addr = base_addr; 676c33fe779SJohn Polstra *entry = (unsigned long)hdr->e_entry + rbase; 677e1743d02SSøren Schmidt 678e1743d02SSøren Schmidt fail: 679c8a79999SPeter Wemm if (imgp->firstpage) 680c8a79999SPeter Wemm exec_unmap_first_page(imgp); 6810b2ed1aeSJeff Roberson 682911c2be0SMark Peek if (nd->ni_vp) 683373d1a3fSAlan Cox vput(nd->ni_vp); 684911c2be0SMark Peek 68568ff2a43SChristian S.J. Peron VFS_UNLOCK_GIANT(vfslocked); 686911c2be0SMark Peek free(tempdata, M_TEMP); 687e1743d02SSøren Schmidt 688a7cddfedSJake Burkholder return (error); 689e1743d02SSøren Schmidt } 690e1743d02SSøren Schmidt 691303b270bSEivind Eklund static int 6923ebc1248SPeter Wemm __CONCAT(exec_, __elfN(imgact))(struct image_params *imgp) 693e1743d02SSøren Schmidt { 694ecbb00a2SDoug Rabson const Elf_Ehdr *hdr = (const Elf_Ehdr *)imgp->image_header; 69532c01de2SDmitry Chagin const Elf_Phdr *phdr; 696e5e6093bSAlan Cox Elf_Auxargs *elf_auxargs; 6975856e12eSJohn Dyson struct vmspace *vmspace; 69852c24af7SPeter Wemm vm_prot_t prot; 69921c2d047SMatthew Dillon u_long text_size = 0, data_size = 0, total_size = 0; 700e1743d02SSøren Schmidt u_long text_addr = 0, data_addr = 0; 701cac45152SMatthew Dillon u_long seg_size, seg_addr; 7027564c4adSKonstantin Belousov u_long addr, baddr, et_dyn_addr, entry = 0, proghdr = 0; 70332c01de2SDmitry Chagin int32_t osrel = 0; 7047564c4adSKonstantin Belousov int error = 0, i, n; 7054113f8d7SPeter Wemm const char *interp = NULL, *newinterp = NULL; 706d1dbc694SJohn Polstra Elf_Brandinfo *brand_info; 707911c2be0SMark Peek char *path; 7085fe3ed62SJake Burkholder struct sysentvec *sv; 709e1743d02SSøren Schmidt 710e1743d02SSøren Schmidt /* 711e1743d02SSøren Schmidt * Do we have a valid ELF header ? 712900b28f9SMaxim Sobolev * 713900b28f9SMaxim Sobolev * Only allow ET_EXEC & ET_DYN here, reject ET_DYN later 714900b28f9SMaxim Sobolev * if particular brand doesn't support it. 715e1743d02SSøren Schmidt */ 716900b28f9SMaxim Sobolev if (__elfN(check_header)(hdr) != 0 || 717900b28f9SMaxim Sobolev (hdr->e_type != ET_EXEC && hdr->e_type != ET_DYN)) 718a7cddfedSJake Burkholder return (-1); 719e1743d02SSøren Schmidt 720e1743d02SSøren Schmidt /* 721e1743d02SSøren Schmidt * From here on down, we return an errno, not -1, as we've 722e1743d02SSøren Schmidt * detected an ELF file. 723e1743d02SSøren Schmidt */ 724e1743d02SSøren Schmidt 725e1743d02SSøren Schmidt if ((hdr->e_phoff > PAGE_SIZE) || 72652c24af7SPeter Wemm (hdr->e_phoff + hdr->e_phentsize * hdr->e_phnum) > PAGE_SIZE) { 727c8a79999SPeter Wemm /* Only support headers in first page for now */ 728a7cddfedSJake Burkholder return (ENOEXEC); 729e1743d02SSøren Schmidt } 73052c24af7SPeter Wemm phdr = (const Elf_Phdr *)(imgp->image_header + hdr->e_phoff); 73193d1c728SKonstantin Belousov if (!aligned(phdr, Elf_Addr)) 73293d1c728SKonstantin Belousov return (ENOEXEC); 7337564c4adSKonstantin Belousov n = 0; 7347564c4adSKonstantin Belousov baddr = 0; 7355fe3ed62SJake Burkholder for (i = 0; i < hdr->e_phnum; i++) { 7367564c4adSKonstantin Belousov if (phdr[i].p_type == PT_LOAD) { 7377564c4adSKonstantin Belousov if (n == 0) 7387564c4adSKonstantin Belousov baddr = phdr[i].p_vaddr; 7397564c4adSKonstantin Belousov n++; 7407564c4adSKonstantin Belousov continue; 7417564c4adSKonstantin Belousov } 742e5e6093bSAlan Cox if (phdr[i].p_type == PT_INTERP) { 743e5e6093bSAlan Cox /* Path to interpreter */ 7445fe3ed62SJake Burkholder if (phdr[i].p_filesz > MAXPATHLEN || 74560bb3943SAlan Cox phdr[i].p_offset + phdr[i].p_filesz > PAGE_SIZE) 74660bb3943SAlan Cox return (ENOEXEC); 7475fe3ed62SJake Burkholder interp = imgp->image_header + phdr[i].p_offset; 7487564c4adSKonstantin Belousov continue; 7493ebc1248SPeter Wemm } 7503ebc1248SPeter Wemm } 7513ebc1248SPeter Wemm 75232c01de2SDmitry Chagin brand_info = __elfN(get_brandinfo)(imgp, interp, &osrel); 7535fe3ed62SJake Burkholder if (brand_info == NULL) { 7545fe3ed62SJake Burkholder uprintf("ELF binary type \"%u\" not known.\n", 7555fe3ed62SJake Burkholder hdr->e_ident[EI_OSABI]); 75660bb3943SAlan Cox return (ENOEXEC); 7573ebc1248SPeter Wemm } 758ab02d85fSKonstantin Belousov if (hdr->e_type == ET_DYN) { 759ab02d85fSKonstantin Belousov if ((brand_info->flags & BI_CAN_EXEC_DYN) == 0) 760d49b2109SMaxim Sobolev return (ENOEXEC); 7617564c4adSKonstantin Belousov /* 7627564c4adSKonstantin Belousov * Honour the base load address from the dso if it is 7637564c4adSKonstantin Belousov * non-zero for some reason. 7647564c4adSKonstantin Belousov */ 7657564c4adSKonstantin Belousov if (baddr == 0) 766ab02d85fSKonstantin Belousov et_dyn_addr = ET_DYN_LOAD_ADDR; 7677564c4adSKonstantin Belousov else 7687564c4adSKonstantin Belousov et_dyn_addr = 0; 769ab02d85fSKonstantin Belousov } else 770ab02d85fSKonstantin Belousov et_dyn_addr = 0; 7715fe3ed62SJake Burkholder sv = brand_info->sysvec; 7729b68618dSPeter Wemm if (interp != NULL && brand_info->interp_newpath != NULL) 7734113f8d7SPeter Wemm newinterp = brand_info->interp_newpath; 7743ebc1248SPeter Wemm 77560bb3943SAlan Cox /* 77660bb3943SAlan Cox * Avoid a possible deadlock if the current address space is destroyed 77760bb3943SAlan Cox * and that address space maps the locked vnode. In the common case, 77860bb3943SAlan Cox * the locked vnode's v_usecount is decremented but remains greater 77960bb3943SAlan Cox * than zero. Consequently, the vnode lock is not needed by vrele(). 78060bb3943SAlan Cox * However, in cases where the vnode lock is external, such as nullfs, 78160bb3943SAlan Cox * v_usecount may become zero. 78260bb3943SAlan Cox */ 78322db15c0SAttilio Rao VOP_UNLOCK(imgp->vp, 0); 78460bb3943SAlan Cox 78589b57fcfSKonstantin Belousov error = exec_new_vmspace(imgp, sv); 78619059a13SJohn Baldwin imgp->proc->p_sysent = sv; 787e1743d02SSøren Schmidt 788cb05b60aSAttilio Rao vn_lock(imgp->vp, LK_EXCLUSIVE | LK_RETRY); 78989b57fcfSKonstantin Belousov if (error) 79089b57fcfSKonstantin Belousov return (error); 79160bb3943SAlan Cox 7925856e12eSJohn Dyson vmspace = imgp->proc->p_vmspace; 7935856e12eSJohn Dyson 794e1743d02SSøren Schmidt for (i = 0; i < hdr->e_phnum; i++) { 795e1743d02SSøren Schmidt switch (phdr[i].p_type) { 796e1743d02SSøren Schmidt case PT_LOAD: /* Loadable segment */ 7975b33842aSKonstantin Belousov if (phdr[i].p_memsz == 0) 7985b33842aSKonstantin Belousov break; 79952c24af7SPeter Wemm prot = 0; 800e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_X) 801e1743d02SSøren Schmidt prot |= VM_PROT_EXECUTE; 802e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_W) 803e1743d02SSøren Schmidt prot |= VM_PROT_WRITE; 804e1743d02SSøren Schmidt if (phdr[i].p_flags & PF_R) 805e1743d02SSøren Schmidt prot |= VM_PROT_READ; 806e1743d02SSøren Schmidt 8073ebc1248SPeter Wemm #if defined(__ia64__) && __ELF_WORD_SIZE == 32 && defined(IA32_ME_HARDER) 8083ebc1248SPeter Wemm /* 8093ebc1248SPeter Wemm * Some x86 binaries assume read == executable, 8103ebc1248SPeter Wemm * notably the M3 runtime and therefore cvsup 8113ebc1248SPeter Wemm */ 8123ebc1248SPeter Wemm if (prot & VM_PROT_READ) 8133ebc1248SPeter Wemm prot |= VM_PROT_EXECUTE; 8143ebc1248SPeter Wemm #endif 8153ebc1248SPeter Wemm 816373d1a3fSAlan Cox if ((error = __elfN(load_section)(vmspace, 817373d1a3fSAlan Cox imgp->object, phdr[i].p_offset, 818ab02d85fSKonstantin Belousov (caddr_t)(uintptr_t)phdr[i].p_vaddr + et_dyn_addr, 81981f223caSJake Burkholder phdr[i].p_memsz, phdr[i].p_filesz, prot, 8205fe3ed62SJake Burkholder sv->sv_pagesize)) != 0) 82160bb3943SAlan Cox return (error); 822e1743d02SSøren Schmidt 823cfaf7e60SDoug Rabson /* 824cfaf7e60SDoug Rabson * If this segment contains the program headers, 825cfaf7e60SDoug Rabson * remember their virtual address for the AT_PHDR 826cfaf7e60SDoug Rabson * aux entry. Static binaries don't usually include 827cfaf7e60SDoug Rabson * a PT_PHDR entry. 828cfaf7e60SDoug Rabson */ 829cfaf7e60SDoug Rabson if (phdr[i].p_offset == 0 && 830cfaf7e60SDoug Rabson hdr->e_phoff + hdr->e_phnum * hdr->e_phentsize 831cfaf7e60SDoug Rabson <= phdr[i].p_filesz) 832ab02d85fSKonstantin Belousov proghdr = phdr[i].p_vaddr + hdr->e_phoff + 833ab02d85fSKonstantin Belousov et_dyn_addr; 834cfaf7e60SDoug Rabson 835ab02d85fSKonstantin Belousov seg_addr = trunc_page(phdr[i].p_vaddr + et_dyn_addr); 836cac45152SMatthew Dillon seg_size = round_page(phdr[i].p_memsz + 837ab02d85fSKonstantin Belousov phdr[i].p_vaddr + et_dyn_addr - seg_addr); 838cac45152SMatthew Dillon 839e1743d02SSøren Schmidt /* 84021c2d047SMatthew Dillon * Is this .text or .data? We can't use 84121c2d047SMatthew Dillon * VM_PROT_WRITE or VM_PROT_EXEC, it breaks the 84221c2d047SMatthew Dillon * alpha terribly and possibly does other bad 84321c2d047SMatthew Dillon * things so we stick to the old way of figuring 84421c2d047SMatthew Dillon * it out: If the segment contains the program 84521c2d047SMatthew Dillon * entry point, it's a text segment, otherwise it 84621c2d047SMatthew Dillon * is a data segment. 84721c2d047SMatthew Dillon * 84821c2d047SMatthew Dillon * Note that obreak() assumes that data_addr + 84921c2d047SMatthew Dillon * data_size == end of data load area, and the ELF 85021c2d047SMatthew Dillon * file format expects segments to be sorted by 85121c2d047SMatthew Dillon * address. If multiple data segments exist, the 85221c2d047SMatthew Dillon * last one will be used. 853e1743d02SSøren Schmidt */ 8549782ecbaSPeter Wemm if (hdr->e_entry >= phdr[i].p_vaddr && 8559782ecbaSPeter Wemm hdr->e_entry < (phdr[i].p_vaddr + 8569782ecbaSPeter Wemm phdr[i].p_memsz)) { 8579782ecbaSPeter Wemm text_size = seg_size; 8589782ecbaSPeter Wemm text_addr = seg_addr; 859ab02d85fSKonstantin Belousov entry = (u_long)hdr->e_entry + et_dyn_addr; 8609782ecbaSPeter Wemm } else { 86121c2d047SMatthew Dillon data_size = seg_size; 862cac45152SMatthew Dillon data_addr = seg_addr; 863cac45152SMatthew Dillon } 86421c2d047SMatthew Dillon total_size += seg_size; 86596725dd0SAlexander Kabaev break; 86696725dd0SAlexander Kabaev case PT_PHDR: /* Program header table info */ 867ab02d85fSKonstantin Belousov proghdr = phdr[i].p_vaddr + et_dyn_addr; 86896725dd0SAlexander Kabaev break; 86996725dd0SAlexander Kabaev default: 87096725dd0SAlexander Kabaev break; 87196725dd0SAlexander Kabaev } 87296725dd0SAlexander Kabaev } 87396725dd0SAlexander Kabaev 87496725dd0SAlexander Kabaev if (data_addr == 0 && data_size == 0) { 87596725dd0SAlexander Kabaev data_addr = text_addr; 87696725dd0SAlexander Kabaev data_size = text_size; 87796725dd0SAlexander Kabaev } 878cac45152SMatthew Dillon 879cac45152SMatthew Dillon /* 880cac45152SMatthew Dillon * Check limits. It should be safe to check the 88196725dd0SAlexander Kabaev * limits after loading the segments since we do 88296725dd0SAlexander Kabaev * not actually fault in all the segments pages. 883cac45152SMatthew Dillon */ 88491d5354aSJohn Baldwin PROC_LOCK(imgp->proc); 88591d5354aSJohn Baldwin if (data_size > lim_cur(imgp->proc, RLIMIT_DATA) || 886cac45152SMatthew Dillon text_size > maxtsiz || 88791d5354aSJohn Baldwin total_size > lim_cur(imgp->proc, RLIMIT_VMEM)) { 88891d5354aSJohn Baldwin PROC_UNLOCK(imgp->proc); 88960bb3943SAlan Cox return (ENOMEM); 890cac45152SMatthew Dillon } 891e1743d02SSøren Schmidt 892e1743d02SSøren Schmidt vmspace->vm_tsize = text_size >> PAGE_SHIFT; 8937cd99438SBruce Evans vmspace->vm_taddr = (caddr_t)(uintptr_t)text_addr; 894e1743d02SSøren Schmidt vmspace->vm_dsize = data_size >> PAGE_SHIFT; 8957cd99438SBruce Evans vmspace->vm_daddr = (caddr_t)(uintptr_t)data_addr; 896e1743d02SSøren Schmidt 897c460ac3aSPeter Wemm /* 898c460ac3aSPeter Wemm * We load the dynamic linker where a userland call 899c460ac3aSPeter Wemm * to mmap(0, ...) would put it. The rationale behind this 900c460ac3aSPeter Wemm * calculation is that it leaves room for the heap to grow to 901c460ac3aSPeter Wemm * its maximum allowed size. 902c460ac3aSPeter Wemm */ 903c460ac3aSPeter Wemm addr = round_page((vm_offset_t)imgp->proc->p_vmspace->vm_daddr + 90491d5354aSJohn Baldwin lim_max(imgp->proc, RLIMIT_DATA)); 90591d5354aSJohn Baldwin PROC_UNLOCK(imgp->proc); 906e1743d02SSøren Schmidt 907ea5a2b2eSSøren Schmidt imgp->entry_addr = entry; 908ea5a2b2eSSøren Schmidt 90960bb3943SAlan Cox if (interp != NULL) { 9104113f8d7SPeter Wemm int have_interp = FALSE; 91122db15c0SAttilio Rao VOP_UNLOCK(imgp->vp, 0); 91260bb3943SAlan Cox if (brand_info->emul_path != NULL && 9139b68618dSPeter Wemm brand_info->emul_path[0] != '\0') { 914a163d034SWarner Losh path = malloc(MAXPATHLEN, M_TEMP, M_WAITOK); 91560bb3943SAlan Cox snprintf(path, MAXPATHLEN, "%s%s", 91660bb3943SAlan Cox brand_info->emul_path, interp); 9179b68618dSPeter Wemm error = __elfN(load_file)(imgp->proc, path, &addr, 9189b68618dSPeter Wemm &imgp->entry_addr, sv->sv_pagesize); 919911c2be0SMark Peek free(path, M_TEMP); 9209b68618dSPeter Wemm if (error == 0) 9214113f8d7SPeter Wemm have_interp = TRUE; 9229b68618dSPeter Wemm } 9234113f8d7SPeter Wemm if (!have_interp && newinterp != NULL) { 9244113f8d7SPeter Wemm error = __elfN(load_file)(imgp->proc, newinterp, &addr, 9254113f8d7SPeter Wemm &imgp->entry_addr, sv->sv_pagesize); 926387ad998SKonstantin Belousov if (error == 0) 9274113f8d7SPeter Wemm have_interp = TRUE; 9284113f8d7SPeter Wemm } 9294113f8d7SPeter Wemm if (!have_interp) { 9309b68618dSPeter Wemm error = __elfN(load_file)(imgp->proc, interp, &addr, 9319b68618dSPeter Wemm &imgp->entry_addr, sv->sv_pagesize); 93260bb3943SAlan Cox } 933cb05b60aSAttilio Rao vn_lock(imgp->vp, LK_EXCLUSIVE | LK_RETRY); 9349b68618dSPeter Wemm if (error != 0) { 9359b68618dSPeter Wemm uprintf("ELF interpreter %s not found\n", interp); 93660bb3943SAlan Cox return (error); 937e1743d02SSøren Schmidt } 93895c807cfSRobert Watson } else 9397564c4adSKonstantin Belousov addr = et_dyn_addr; 940ea5a2b2eSSøren Schmidt 941e1743d02SSøren Schmidt /* 942e1743d02SSøren Schmidt * Construct auxargs table (used by the fixup routine) 943e1743d02SSøren Schmidt */ 944a163d034SWarner Losh elf_auxargs = malloc(sizeof(Elf_Auxargs), M_TEMP, M_WAITOK); 945e1743d02SSøren Schmidt elf_auxargs->execfd = -1; 946e1743d02SSøren Schmidt elf_auxargs->phdr = proghdr; 947e1743d02SSøren Schmidt elf_auxargs->phent = hdr->e_phentsize; 948e1743d02SSøren Schmidt elf_auxargs->phnum = hdr->e_phnum; 949e1743d02SSøren Schmidt elf_auxargs->pagesz = PAGE_SIZE; 950e1743d02SSøren Schmidt elf_auxargs->base = addr; 951e1743d02SSøren Schmidt elf_auxargs->flags = 0; 952e1743d02SSøren Schmidt elf_auxargs->entry = entry; 953e1743d02SSøren Schmidt 954e1743d02SSøren Schmidt imgp->auxargs = elf_auxargs; 955e1743d02SSøren Schmidt imgp->interpreted = 0; 95632c01de2SDmitry Chagin imgp->proc->p_osrel = osrel; 957f231de47SKonstantin Belousov 958a7cddfedSJake Burkholder return (error); 959e1743d02SSøren Schmidt } 960e1743d02SSøren Schmidt 961a360a43dSJake Burkholder #define suword __CONCAT(suword, __ELF_WORD_SIZE) 9623ebc1248SPeter Wemm 9633ebc1248SPeter Wemm int 9643ebc1248SPeter Wemm __elfN(freebsd_fixup)(register_t **stack_base, struct image_params *imgp) 965e1743d02SSøren Schmidt { 966ecbb00a2SDoug Rabson Elf_Auxargs *args = (Elf_Auxargs *)imgp->auxargs; 967a360a43dSJake Burkholder Elf_Addr *base; 968a360a43dSJake Burkholder Elf_Addr *pos; 969e1743d02SSøren Schmidt 970a360a43dSJake Burkholder base = (Elf_Addr *)*stack_base; 971610ecfe0SMaxim Sobolev pos = base + (imgp->args->argc + imgp->args->envc + 2); 972e1743d02SSøren Schmidt 97335c2a5a8SWarner Losh if (args->execfd != -1) 974e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_EXECFD, args->execfd); 975e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PHDR, args->phdr); 976e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PHENT, args->phent); 977e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PHNUM, args->phnum); 978e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PAGESZ, args->pagesz); 979e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_FLAGS, args->flags); 980e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_ENTRY, args->entry); 981e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_BASE, args->base); 9823ff06357SKonstantin Belousov if (imgp->execpathp != 0) 9833ff06357SKonstantin Belousov AUXARGS_ENTRY(pos, AT_EXECPATH, imgp->execpathp); 984e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_NULL, 0); 985e1743d02SSøren Schmidt 986e1743d02SSøren Schmidt free(imgp->auxargs, M_TEMP); 987e1743d02SSøren Schmidt imgp->auxargs = NULL; 988e1743d02SSøren Schmidt 9893ebc1248SPeter Wemm base--; 990610ecfe0SMaxim Sobolev suword(base, (long)imgp->args->argc); 9913ebc1248SPeter Wemm *stack_base = (register_t *)base; 992a7cddfedSJake Burkholder return (0); 993e1743d02SSøren Schmidt } 994e1743d02SSøren Schmidt 995e1743d02SSøren Schmidt /* 9968c64af4fSJohn Polstra * Code for generating ELF core dumps. 9978c64af4fSJohn Polstra */ 9988c64af4fSJohn Polstra 9994d77a549SAlfred Perlstein typedef void (*segment_callback)(vm_map_entry_t, void *); 10000ff27d31SJohn Polstra 10010ff27d31SJohn Polstra /* Closure for cb_put_phdr(). */ 10020ff27d31SJohn Polstra struct phdr_closure { 10030ff27d31SJohn Polstra Elf_Phdr *phdr; /* Program header to fill in */ 10040ff27d31SJohn Polstra Elf_Off offset; /* Offset of segment in core file */ 10050ff27d31SJohn Polstra }; 10060ff27d31SJohn Polstra 10070ff27d31SJohn Polstra /* Closure for cb_size_segment(). */ 10080ff27d31SJohn Polstra struct sseg_closure { 10090ff27d31SJohn Polstra int count; /* Count of writable segments. */ 10100ff27d31SJohn Polstra size_t size; /* Total size of all writable segments. */ 10110ff27d31SJohn Polstra }; 10120ff27d31SJohn Polstra 10134d77a549SAlfred Perlstein static void cb_put_phdr(vm_map_entry_t, void *); 10144d77a549SAlfred Perlstein static void cb_size_segment(vm_map_entry_t, void *); 1015247aba24SMarcel Moolenaar static void each_writable_segment(struct thread *, segment_callback, void *); 10163ebc1248SPeter Wemm static int __elfN(corehdr)(struct thread *, struct vnode *, struct ucred *, 1017e7228204SAlfred Perlstein int, void *, size_t, gzFile); 1018247aba24SMarcel Moolenaar static void __elfN(puthdr)(struct thread *, void *, size_t *, int); 10193ebc1248SPeter Wemm static void __elfN(putnote)(void *, size_t *, const char *, int, 10204d77a549SAlfred Perlstein const void *, size_t); 10218c64af4fSJohn Polstra 1022e7228204SAlfred Perlstein #ifdef COMPRESS_USER_CORES 1023e7228204SAlfred Perlstein extern int compress_user_cores; 1024e7228204SAlfred Perlstein extern int compress_user_cores_gzlevel; 1025e7228204SAlfred Perlstein #endif 1026e7228204SAlfred Perlstein 1027e7228204SAlfred Perlstein static int 1028e7228204SAlfred Perlstein core_output(struct vnode *vp, void *base, size_t len, off_t offset, 1029e7228204SAlfred Perlstein struct ucred *active_cred, struct ucred *file_cred, 1030e7228204SAlfred Perlstein struct thread *td, char *core_buf, gzFile gzfile) { 1031e7228204SAlfred Perlstein 1032e7228204SAlfred Perlstein int error; 1033e7228204SAlfred Perlstein if (gzfile) { 1034e7228204SAlfred Perlstein #ifdef COMPRESS_USER_CORES 1035e7228204SAlfred Perlstein error = compress_core(gzfile, base, core_buf, len, td); 1036e7228204SAlfred Perlstein #else 1037e7228204SAlfred Perlstein panic("shouldn't be here"); 1038e7228204SAlfred Perlstein #endif 1039e7228204SAlfred Perlstein } else { 1040e7228204SAlfred Perlstein error = vn_rdwr_inchunks(UIO_WRITE, vp, base, len, offset, 1041e7228204SAlfred Perlstein UIO_USERSPACE, IO_UNIT | IO_DIRECT, active_cred, file_cred, 1042e7228204SAlfred Perlstein NULL, td); 1043e7228204SAlfred Perlstein } 1044e7228204SAlfred Perlstein return (error); 1045e7228204SAlfred Perlstein } 1046e7228204SAlfred Perlstein 10478c64af4fSJohn Polstra int 1048e7228204SAlfred Perlstein __elfN(coredump)(struct thread *td, struct vnode *vp, off_t limit, int flags) 1049fca666a1SJulian Elischer { 1050247aba24SMarcel Moolenaar struct ucred *cred = td->td_ucred; 1051fca666a1SJulian Elischer int error = 0; 10520ff27d31SJohn Polstra struct sseg_closure seginfo; 10530ff27d31SJohn Polstra void *hdr; 10548c64af4fSJohn Polstra size_t hdrsize; 10558c64af4fSJohn Polstra 1056e7228204SAlfred Perlstein gzFile gzfile = Z_NULL; 1057e7228204SAlfred Perlstein char *core_buf = NULL; 1058e7228204SAlfred Perlstein #ifdef COMPRESS_USER_CORES 1059e7228204SAlfred Perlstein char gzopen_flags[8]; 1060e7228204SAlfred Perlstein char *p; 1061e7228204SAlfred Perlstein int doing_compress = flags & IMGACT_CORE_COMPRESS; 1062e7228204SAlfred Perlstein #endif 1063e7228204SAlfred Perlstein 1064e7228204SAlfred Perlstein hdr = NULL; 1065e7228204SAlfred Perlstein 1066e7228204SAlfred Perlstein #ifdef COMPRESS_USER_CORES 1067e7228204SAlfred Perlstein if (doing_compress) { 1068e7228204SAlfred Perlstein p = gzopen_flags; 1069e7228204SAlfred Perlstein *p++ = 'w'; 1070e7228204SAlfred Perlstein if (compress_user_cores_gzlevel >= 0 && 1071e7228204SAlfred Perlstein compress_user_cores_gzlevel <= 9) 1072e7228204SAlfred Perlstein *p++ = '0' + compress_user_cores_gzlevel; 1073e7228204SAlfred Perlstein *p = 0; 1074e7228204SAlfred Perlstein gzfile = gz_open("", gzopen_flags, vp); 1075e7228204SAlfred Perlstein if (gzfile == Z_NULL) { 1076e7228204SAlfred Perlstein error = EFAULT; 1077e7228204SAlfred Perlstein goto done; 1078e7228204SAlfred Perlstein } 1079e7228204SAlfred Perlstein core_buf = malloc(CORE_BUF_SIZE, M_TEMP, M_WAITOK | M_ZERO); 1080e7228204SAlfred Perlstein if (!core_buf) { 1081e7228204SAlfred Perlstein error = ENOMEM; 1082e7228204SAlfred Perlstein goto done; 1083e7228204SAlfred Perlstein } 1084e7228204SAlfred Perlstein } 1085e7228204SAlfred Perlstein #endif 1086e7228204SAlfred Perlstein 10870ff27d31SJohn Polstra /* Size the program segments. */ 10880ff27d31SJohn Polstra seginfo.count = 0; 10890ff27d31SJohn Polstra seginfo.size = 0; 1090247aba24SMarcel Moolenaar each_writable_segment(td, cb_size_segment, &seginfo); 10910ff27d31SJohn Polstra 10920ff27d31SJohn Polstra /* 10930ff27d31SJohn Polstra * Calculate the size of the core file header area by making 10940ff27d31SJohn Polstra * a dry run of generating it. Nothing is written, but the 10950ff27d31SJohn Polstra * size is calculated. 10960ff27d31SJohn Polstra */ 10970ff27d31SJohn Polstra hdrsize = 0; 1098247aba24SMarcel Moolenaar __elfN(puthdr)(td, (void *)NULL, &hdrsize, seginfo.count); 10990ff27d31SJohn Polstra 1100fca666a1SJulian Elischer if (hdrsize + seginfo.size >= limit) 11018c64af4fSJohn Polstra return (EFAULT); 11020ff27d31SJohn Polstra 11030ff27d31SJohn Polstra /* 11040ff27d31SJohn Polstra * Allocate memory for building the header, fill it up, 11050ff27d31SJohn Polstra * and write it out. 11060ff27d31SJohn Polstra */ 1107a163d034SWarner Losh hdr = malloc(hdrsize, M_TEMP, M_WAITOK); 11080ff27d31SJohn Polstra if (hdr == NULL) { 1109a7cddfedSJake Burkholder return (EINVAL); 11100ff27d31SJohn Polstra } 1111e7228204SAlfred Perlstein error = __elfN(corehdr)(td, vp, cred, seginfo.count, hdr, hdrsize, 1112e7228204SAlfred Perlstein gzfile); 11130ff27d31SJohn Polstra 11140ff27d31SJohn Polstra /* Write the contents of all of the writable segments. */ 11150ff27d31SJohn Polstra if (error == 0) { 11160ff27d31SJohn Polstra Elf_Phdr *php; 11172b471bc6STim J. Robbins off_t offset; 11180ff27d31SJohn Polstra int i; 11190ff27d31SJohn Polstra 11200ff27d31SJohn Polstra php = (Elf_Phdr *)((char *)hdr + sizeof(Elf_Ehdr)) + 1; 11210ff27d31SJohn Polstra offset = hdrsize; 11220ff27d31SJohn Polstra for (i = 0; i < seginfo.count; i++) { 1123e7228204SAlfred Perlstein error = core_output(vp, (caddr_t)(uintptr_t)php->p_vaddr, 1124e7228204SAlfred Perlstein php->p_filesz, offset, cred, NOCRED, curthread, core_buf, gzfile); 11250ff27d31SJohn Polstra if (error != 0) 11262b471bc6STim J. Robbins break; 11270ff27d31SJohn Polstra offset += php->p_filesz; 11280ff27d31SJohn Polstra php++; 11290ff27d31SJohn Polstra } 11300ff27d31SJohn Polstra } 1131e7228204SAlfred Perlstein if (error) { 1132e7228204SAlfred Perlstein log(LOG_WARNING, 1133e7228204SAlfred Perlstein "Failed to write core file for process %s (error %d)\n", 1134e7228204SAlfred Perlstein curproc->p_comm, error); 1135e7228204SAlfred Perlstein } 1136e7228204SAlfred Perlstein 1137e7228204SAlfred Perlstein #ifdef COMPRESS_USER_CORES 1138e7228204SAlfred Perlstein done: 1139e7228204SAlfred Perlstein #endif 1140e7228204SAlfred Perlstein if (core_buf) 1141e7228204SAlfred Perlstein free(core_buf, M_TEMP); 1142e7228204SAlfred Perlstein if (gzfile) 1143e7228204SAlfred Perlstein gzclose(gzfile); 1144e7228204SAlfred Perlstein 11450ff27d31SJohn Polstra free(hdr, M_TEMP); 11460ff27d31SJohn Polstra 1147a7cddfedSJake Burkholder return (error); 11488c64af4fSJohn Polstra } 11498c64af4fSJohn Polstra 11500ff27d31SJohn Polstra /* 11510ff27d31SJohn Polstra * A callback for each_writable_segment() to write out the segment's 11520ff27d31SJohn Polstra * program header entry. 11530ff27d31SJohn Polstra */ 11540ff27d31SJohn Polstra static void 11550ff27d31SJohn Polstra cb_put_phdr(entry, closure) 11560ff27d31SJohn Polstra vm_map_entry_t entry; 11570ff27d31SJohn Polstra void *closure; 11580ff27d31SJohn Polstra { 11590ff27d31SJohn Polstra struct phdr_closure *phc = (struct phdr_closure *)closure; 11600ff27d31SJohn Polstra Elf_Phdr *phdr = phc->phdr; 11610ff27d31SJohn Polstra 11620ff27d31SJohn Polstra phc->offset = round_page(phc->offset); 11630ff27d31SJohn Polstra 11640ff27d31SJohn Polstra phdr->p_type = PT_LOAD; 11650ff27d31SJohn Polstra phdr->p_offset = phc->offset; 11660ff27d31SJohn Polstra phdr->p_vaddr = entry->start; 11670ff27d31SJohn Polstra phdr->p_paddr = 0; 11680ff27d31SJohn Polstra phdr->p_filesz = phdr->p_memsz = entry->end - entry->start; 11690ff27d31SJohn Polstra phdr->p_align = PAGE_SIZE; 11700ff27d31SJohn Polstra phdr->p_flags = 0; 11710ff27d31SJohn Polstra if (entry->protection & VM_PROT_READ) 11720ff27d31SJohn Polstra phdr->p_flags |= PF_R; 11730ff27d31SJohn Polstra if (entry->protection & VM_PROT_WRITE) 11740ff27d31SJohn Polstra phdr->p_flags |= PF_W; 11750ff27d31SJohn Polstra if (entry->protection & VM_PROT_EXECUTE) 11760ff27d31SJohn Polstra phdr->p_flags |= PF_X; 11770ff27d31SJohn Polstra 11780ff27d31SJohn Polstra phc->offset += phdr->p_filesz; 11790ff27d31SJohn Polstra phc->phdr++; 11800ff27d31SJohn Polstra } 11810ff27d31SJohn Polstra 11820ff27d31SJohn Polstra /* 11830ff27d31SJohn Polstra * A callback for each_writable_segment() to gather information about 11840ff27d31SJohn Polstra * the number of segments and their total size. 11850ff27d31SJohn Polstra */ 11860ff27d31SJohn Polstra static void 11870ff27d31SJohn Polstra cb_size_segment(entry, closure) 11880ff27d31SJohn Polstra vm_map_entry_t entry; 11890ff27d31SJohn Polstra void *closure; 11900ff27d31SJohn Polstra { 11910ff27d31SJohn Polstra struct sseg_closure *ssc = (struct sseg_closure *)closure; 11920ff27d31SJohn Polstra 11930ff27d31SJohn Polstra ssc->count++; 11940ff27d31SJohn Polstra ssc->size += entry->end - entry->start; 11950ff27d31SJohn Polstra } 11960ff27d31SJohn Polstra 11970ff27d31SJohn Polstra /* 11980ff27d31SJohn Polstra * For each writable segment in the process's memory map, call the given 11990ff27d31SJohn Polstra * function with a pointer to the map entry and some arbitrary 12000ff27d31SJohn Polstra * caller-supplied data. 12010ff27d31SJohn Polstra */ 12020ff27d31SJohn Polstra static void 1203247aba24SMarcel Moolenaar each_writable_segment(td, func, closure) 1204247aba24SMarcel Moolenaar struct thread *td; 12050ff27d31SJohn Polstra segment_callback func; 12060ff27d31SJohn Polstra void *closure; 12070ff27d31SJohn Polstra { 1208247aba24SMarcel Moolenaar struct proc *p = td->td_proc; 12090ff27d31SJohn Polstra vm_map_t map = &p->p_vmspace->vm_map; 12100ff27d31SJohn Polstra vm_map_entry_t entry; 1211976a87a2SAlan Cox vm_object_t backing_object, object; 1212976a87a2SAlan Cox boolean_t ignore_entry; 12130ff27d31SJohn Polstra 1214976a87a2SAlan Cox vm_map_lock_read(map); 12150ff27d31SJohn Polstra for (entry = map->header.next; entry != &map->header; 12160ff27d31SJohn Polstra entry = entry->next) { 1217fa7dd9c5SMatthew Dillon /* 1218fa7dd9c5SMatthew Dillon * Don't dump inaccessible mappings, deal with legacy 1219fa7dd9c5SMatthew Dillon * coredump mode. 1220fa7dd9c5SMatthew Dillon * 1221fa7dd9c5SMatthew Dillon * Note that read-only segments related to the elf binary 1222fa7dd9c5SMatthew Dillon * are marked MAP_ENTRY_NOCOREDUMP now so we no longer 1223fa7dd9c5SMatthew Dillon * need to arbitrarily ignore such segments. 1224fa7dd9c5SMatthew Dillon */ 1225fa7dd9c5SMatthew Dillon if (elf_legacy_coredump) { 1226fa7dd9c5SMatthew Dillon if ((entry->protection & VM_PROT_RW) != VM_PROT_RW) 12270ff27d31SJohn Polstra continue; 1228fa7dd9c5SMatthew Dillon } else { 1229fa7dd9c5SMatthew Dillon if ((entry->protection & VM_PROT_ALL) == 0) 1230fa7dd9c5SMatthew Dillon continue; 1231fa7dd9c5SMatthew Dillon } 12320ff27d31SJohn Polstra 12339730a5daSPaul Saab /* 1234fa7dd9c5SMatthew Dillon * Dont include memory segment in the coredump if 1235fa7dd9c5SMatthew Dillon * MAP_NOCORE is set in mmap(2) or MADV_NOCORE in 1236fa7dd9c5SMatthew Dillon * madvise(2). Do not dump submaps (i.e. parts of the 1237fa7dd9c5SMatthew Dillon * kernel map). 12389730a5daSPaul Saab */ 1239fa7dd9c5SMatthew Dillon if (entry->eflags & (MAP_ENTRY_NOCOREDUMP|MAP_ENTRY_IS_SUB_MAP)) 12409730a5daSPaul Saab continue; 12419730a5daSPaul Saab 1242976a87a2SAlan Cox if ((object = entry->object.vm_object) == NULL) 12430ff27d31SJohn Polstra continue; 12440ff27d31SJohn Polstra 12450ff27d31SJohn Polstra /* Ignore memory-mapped devices and such things. */ 1246976a87a2SAlan Cox VM_OBJECT_LOCK(object); 1247976a87a2SAlan Cox while ((backing_object = object->backing_object) != NULL) { 1248976a87a2SAlan Cox VM_OBJECT_LOCK(backing_object); 1249976a87a2SAlan Cox VM_OBJECT_UNLOCK(object); 1250976a87a2SAlan Cox object = backing_object; 1251976a87a2SAlan Cox } 1252976a87a2SAlan Cox ignore_entry = object->type != OBJT_DEFAULT && 1253976a87a2SAlan Cox object->type != OBJT_SWAP && object->type != OBJT_VNODE; 1254976a87a2SAlan Cox VM_OBJECT_UNLOCK(object); 1255976a87a2SAlan Cox if (ignore_entry) 12560ff27d31SJohn Polstra continue; 12570ff27d31SJohn Polstra 12580ff27d31SJohn Polstra (*func)(entry, closure); 12590ff27d31SJohn Polstra } 1260976a87a2SAlan Cox vm_map_unlock_read(map); 12610ff27d31SJohn Polstra } 12620ff27d31SJohn Polstra 12630ff27d31SJohn Polstra /* 12640ff27d31SJohn Polstra * Write the core file header to the file, including padding up to 12650ff27d31SJohn Polstra * the page boundary. 12660ff27d31SJohn Polstra */ 12678c64af4fSJohn Polstra static int 1268e7228204SAlfred Perlstein __elfN(corehdr)(td, vp, cred, numsegs, hdr, hdrsize, gzfile) 1269b40ce416SJulian Elischer struct thread *td; 12708c64af4fSJohn Polstra struct vnode *vp; 12718c64af4fSJohn Polstra struct ucred *cred; 12720ff27d31SJohn Polstra int numsegs; 12730ff27d31SJohn Polstra size_t hdrsize; 12740ff27d31SJohn Polstra void *hdr; 1275e7228204SAlfred Perlstein gzFile gzfile; 12768c64af4fSJohn Polstra { 1277911c2be0SMark Peek size_t off; 12788c64af4fSJohn Polstra 12798c64af4fSJohn Polstra /* Fill in the header. */ 12800ff27d31SJohn Polstra bzero(hdr, hdrsize); 12818c64af4fSJohn Polstra off = 0; 1282247aba24SMarcel Moolenaar __elfN(puthdr)(td, hdr, &off, numsegs); 12838c64af4fSJohn Polstra 1284e7228204SAlfred Perlstein if (!gzfile) { 12858c64af4fSJohn Polstra /* Write it to the core file. */ 1286a7cddfedSJake Burkholder return (vn_rdwr_inchunks(UIO_WRITE, vp, hdr, hdrsize, (off_t)0, 12879ca43589SRobert Watson UIO_SYSSPACE, IO_UNIT | IO_DIRECT, cred, NOCRED, NULL, 12886617724cSJeff Roberson td)); 1289e7228204SAlfred Perlstein } else { 1290e7228204SAlfred Perlstein #ifdef COMPRESS_USER_CORES 1291e7228204SAlfred Perlstein if (gzwrite(gzfile, hdr, hdrsize) != hdrsize) { 1292e7228204SAlfred Perlstein log(LOG_WARNING, 1293e7228204SAlfred Perlstein "Failed to compress core file header for process" 1294e7228204SAlfred Perlstein " %s.\n", curproc->p_comm); 1295e7228204SAlfred Perlstein return (EFAULT); 1296e7228204SAlfred Perlstein } 1297e7228204SAlfred Perlstein else { 1298e7228204SAlfred Perlstein return (0); 1299e7228204SAlfred Perlstein } 1300e7228204SAlfred Perlstein #else 1301e7228204SAlfred Perlstein panic("shouldn't be here"); 1302e7228204SAlfred Perlstein #endif 1303e7228204SAlfred Perlstein } 1304dada0278SJohn Polstra } 1305dada0278SJohn Polstra 130662919d78SPeter Wemm #if defined(COMPAT_IA32) && __ELF_WORD_SIZE == 32 130762919d78SPeter Wemm typedef struct prstatus32 elf_prstatus_t; 130862919d78SPeter Wemm typedef struct prpsinfo32 elf_prpsinfo_t; 130962919d78SPeter Wemm typedef struct fpreg32 elf_prfpregset_t; 131062919d78SPeter Wemm typedef struct fpreg32 elf_fpregset_t; 131162919d78SPeter Wemm typedef struct reg32 elf_gregset_t; 131262919d78SPeter Wemm #else 131362919d78SPeter Wemm typedef prstatus_t elf_prstatus_t; 131462919d78SPeter Wemm typedef prpsinfo_t elf_prpsinfo_t; 131562919d78SPeter Wemm typedef prfpregset_t elf_prfpregset_t; 131662919d78SPeter Wemm typedef prfpregset_t elf_fpregset_t; 131762919d78SPeter Wemm typedef gregset_t elf_gregset_t; 131862919d78SPeter Wemm #endif 131962919d78SPeter Wemm 13208c64af4fSJohn Polstra static void 1321247aba24SMarcel Moolenaar __elfN(puthdr)(struct thread *td, void *dst, size_t *off, int numsegs) 13228c64af4fSJohn Polstra { 13238c9b7b2cSMarcel Moolenaar struct { 132462919d78SPeter Wemm elf_prstatus_t status; 132562919d78SPeter Wemm elf_prfpregset_t fpregset; 132662919d78SPeter Wemm elf_prpsinfo_t psinfo; 13278c9b7b2cSMarcel Moolenaar } *tempdata; 132862919d78SPeter Wemm elf_prstatus_t *status; 132962919d78SPeter Wemm elf_prfpregset_t *fpregset; 133062919d78SPeter Wemm elf_prpsinfo_t *psinfo; 1331247aba24SMarcel Moolenaar struct proc *p; 1332247aba24SMarcel Moolenaar struct thread *thr; 13338c9b7b2cSMarcel Moolenaar size_t ehoff, noteoff, notesz, phoff; 13348c64af4fSJohn Polstra 1335247aba24SMarcel Moolenaar p = td->td_proc; 1336247aba24SMarcel Moolenaar 13378c64af4fSJohn Polstra ehoff = *off; 13388c64af4fSJohn Polstra *off += sizeof(Elf_Ehdr); 13398c64af4fSJohn Polstra 13408c64af4fSJohn Polstra phoff = *off; 13410ff27d31SJohn Polstra *off += (numsegs + 1) * sizeof(Elf_Phdr); 13428c64af4fSJohn Polstra 13438c64af4fSJohn Polstra noteoff = *off; 13448c9b7b2cSMarcel Moolenaar /* 13458c9b7b2cSMarcel Moolenaar * Don't allocate space for the notes if we're just calculating 13468c9b7b2cSMarcel Moolenaar * the size of the header. We also don't collect the data. 13478c9b7b2cSMarcel Moolenaar */ 13488c9b7b2cSMarcel Moolenaar if (dst != NULL) { 13498c9b7b2cSMarcel Moolenaar tempdata = malloc(sizeof(*tempdata), M_TEMP, M_ZERO|M_WAITOK); 13508c9b7b2cSMarcel Moolenaar status = &tempdata->status; 13518c9b7b2cSMarcel Moolenaar fpregset = &tempdata->fpregset; 13528c9b7b2cSMarcel Moolenaar psinfo = &tempdata->psinfo; 13538c9b7b2cSMarcel Moolenaar } else { 13548c9b7b2cSMarcel Moolenaar tempdata = NULL; 13558c9b7b2cSMarcel Moolenaar status = NULL; 13568c9b7b2cSMarcel Moolenaar fpregset = NULL; 13578c9b7b2cSMarcel Moolenaar psinfo = NULL; 13588c9b7b2cSMarcel Moolenaar } 13598c9b7b2cSMarcel Moolenaar 13608c9b7b2cSMarcel Moolenaar if (dst != NULL) { 13618c9b7b2cSMarcel Moolenaar psinfo->pr_version = PRPSINFO_VERSION; 136262919d78SPeter Wemm psinfo->pr_psinfosz = sizeof(elf_prpsinfo_t); 1363ccd3953eSJohn Baldwin strlcpy(psinfo->pr_fname, p->p_comm, sizeof(psinfo->pr_fname)); 13648c9b7b2cSMarcel Moolenaar /* 13658c9b7b2cSMarcel Moolenaar * XXX - We don't fill in the command line arguments properly 13668c9b7b2cSMarcel Moolenaar * yet. 13678c9b7b2cSMarcel Moolenaar */ 1368ccd3953eSJohn Baldwin strlcpy(psinfo->pr_psargs, p->p_comm, 13698c9b7b2cSMarcel Moolenaar sizeof(psinfo->pr_psargs)); 13708c9b7b2cSMarcel Moolenaar } 13718c9b7b2cSMarcel Moolenaar __elfN(putnote)(dst, off, "FreeBSD", NT_PRPSINFO, psinfo, 13728c9b7b2cSMarcel Moolenaar sizeof *psinfo); 13738c9b7b2cSMarcel Moolenaar 13748c9b7b2cSMarcel Moolenaar /* 13751f7a1baaSMarcel Moolenaar * To have the debugger select the right thread (LWP) as the initial 13761f7a1baaSMarcel Moolenaar * thread, we dump the state of the thread passed to us in td first. 13771f7a1baaSMarcel Moolenaar * This is the thread that causes the core dump and thus likely to 13781f7a1baaSMarcel Moolenaar * be the right thread one wants to have selected in the debugger. 13798c9b7b2cSMarcel Moolenaar */ 1380247aba24SMarcel Moolenaar thr = td; 1381247aba24SMarcel Moolenaar while (thr != NULL) { 13828c9b7b2cSMarcel Moolenaar if (dst != NULL) { 13838c9b7b2cSMarcel Moolenaar status->pr_version = PRSTATUS_VERSION; 138462919d78SPeter Wemm status->pr_statussz = sizeof(elf_prstatus_t); 138562919d78SPeter Wemm status->pr_gregsetsz = sizeof(elf_gregset_t); 138662919d78SPeter Wemm status->pr_fpregsetsz = sizeof(elf_fpregset_t); 13878c9b7b2cSMarcel Moolenaar status->pr_osreldate = osreldate; 13888c9b7b2cSMarcel Moolenaar status->pr_cursig = p->p_sig; 13891f7a1baaSMarcel Moolenaar status->pr_pid = thr->td_tid; 139062919d78SPeter Wemm #if defined(COMPAT_IA32) && __ELF_WORD_SIZE == 32 139162919d78SPeter Wemm fill_regs32(thr, &status->pr_reg); 139262919d78SPeter Wemm fill_fpregs32(thr, fpregset); 139362919d78SPeter Wemm #else 13948c9b7b2cSMarcel Moolenaar fill_regs(thr, &status->pr_reg); 13958c9b7b2cSMarcel Moolenaar fill_fpregs(thr, fpregset); 139662919d78SPeter Wemm #endif 13978c9b7b2cSMarcel Moolenaar } 13983ebc1248SPeter Wemm __elfN(putnote)(dst, off, "FreeBSD", NT_PRSTATUS, status, 13998c64af4fSJohn Polstra sizeof *status); 14003ebc1248SPeter Wemm __elfN(putnote)(dst, off, "FreeBSD", NT_FPREGSET, fpregset, 14018c64af4fSJohn Polstra sizeof *fpregset); 14024da47b2fSMarcel Moolenaar /* 14034da47b2fSMarcel Moolenaar * Allow for MD specific notes, as well as any MD 14044da47b2fSMarcel Moolenaar * specific preparations for writing MI notes. 14054da47b2fSMarcel Moolenaar */ 14064da47b2fSMarcel Moolenaar __elfN(dump_thread)(thr, dst, off); 1407247aba24SMarcel Moolenaar 1408247aba24SMarcel Moolenaar thr = (thr == td) ? TAILQ_FIRST(&p->p_threads) : 14098c9b7b2cSMarcel Moolenaar TAILQ_NEXT(thr, td_plist); 1410247aba24SMarcel Moolenaar if (thr == td) 14118c9b7b2cSMarcel Moolenaar thr = TAILQ_NEXT(thr, td_plist); 1412247aba24SMarcel Moolenaar } 14138c9b7b2cSMarcel Moolenaar 14148c64af4fSJohn Polstra notesz = *off - noteoff; 14158c64af4fSJohn Polstra 14168c9b7b2cSMarcel Moolenaar if (dst != NULL) 14178c9b7b2cSMarcel Moolenaar free(tempdata, M_TEMP); 14188c9b7b2cSMarcel Moolenaar 14190ff27d31SJohn Polstra /* Align up to a page boundary for the program segments. */ 14208c64af4fSJohn Polstra *off = round_page(*off); 14218c64af4fSJohn Polstra 14228c64af4fSJohn Polstra if (dst != NULL) { 14238c64af4fSJohn Polstra Elf_Ehdr *ehdr; 14248c64af4fSJohn Polstra Elf_Phdr *phdr; 14250ff27d31SJohn Polstra struct phdr_closure phc; 14268c64af4fSJohn Polstra 14278c64af4fSJohn Polstra /* 14288c64af4fSJohn Polstra * Fill in the ELF header. 14298c64af4fSJohn Polstra */ 14308c64af4fSJohn Polstra ehdr = (Elf_Ehdr *)((char *)dst + ehoff); 14318c64af4fSJohn Polstra ehdr->e_ident[EI_MAG0] = ELFMAG0; 14328c64af4fSJohn Polstra ehdr->e_ident[EI_MAG1] = ELFMAG1; 14338c64af4fSJohn Polstra ehdr->e_ident[EI_MAG2] = ELFMAG2; 14348c64af4fSJohn Polstra ehdr->e_ident[EI_MAG3] = ELFMAG3; 14358c64af4fSJohn Polstra ehdr->e_ident[EI_CLASS] = ELF_CLASS; 14368c64af4fSJohn Polstra ehdr->e_ident[EI_DATA] = ELF_DATA; 14378c64af4fSJohn Polstra ehdr->e_ident[EI_VERSION] = EV_CURRENT; 1438c815a20cSDavid E. O'Brien ehdr->e_ident[EI_OSABI] = ELFOSABI_FREEBSD; 1439c815a20cSDavid E. O'Brien ehdr->e_ident[EI_ABIVERSION] = 0; 14408c64af4fSJohn Polstra ehdr->e_ident[EI_PAD] = 0; 14418c64af4fSJohn Polstra ehdr->e_type = ET_CORE; 144262919d78SPeter Wemm #if defined(COMPAT_IA32) && __ELF_WORD_SIZE == 32 144362919d78SPeter Wemm ehdr->e_machine = EM_386; 144462919d78SPeter Wemm #else 14458c64af4fSJohn Polstra ehdr->e_machine = ELF_ARCH; 144662919d78SPeter Wemm #endif 14478c64af4fSJohn Polstra ehdr->e_version = EV_CURRENT; 14488c64af4fSJohn Polstra ehdr->e_entry = 0; 14498c64af4fSJohn Polstra ehdr->e_phoff = phoff; 14508c64af4fSJohn Polstra ehdr->e_flags = 0; 14518c64af4fSJohn Polstra ehdr->e_ehsize = sizeof(Elf_Ehdr); 14528c64af4fSJohn Polstra ehdr->e_phentsize = sizeof(Elf_Phdr); 14530ff27d31SJohn Polstra ehdr->e_phnum = numsegs + 1; 14548c64af4fSJohn Polstra ehdr->e_shentsize = sizeof(Elf_Shdr); 14558c64af4fSJohn Polstra ehdr->e_shnum = 0; 14568c64af4fSJohn Polstra ehdr->e_shstrndx = SHN_UNDEF; 14578c64af4fSJohn Polstra 14588c64af4fSJohn Polstra /* 14598c64af4fSJohn Polstra * Fill in the program header entries. 14608c64af4fSJohn Polstra */ 14618c64af4fSJohn Polstra phdr = (Elf_Phdr *)((char *)dst + phoff); 14628c64af4fSJohn Polstra 14638c64af4fSJohn Polstra /* The note segement. */ 14648c64af4fSJohn Polstra phdr->p_type = PT_NOTE; 14658c64af4fSJohn Polstra phdr->p_offset = noteoff; 14668c64af4fSJohn Polstra phdr->p_vaddr = 0; 14678c64af4fSJohn Polstra phdr->p_paddr = 0; 14688c64af4fSJohn Polstra phdr->p_filesz = notesz; 14698c64af4fSJohn Polstra phdr->p_memsz = 0; 14708c64af4fSJohn Polstra phdr->p_flags = 0; 14718c64af4fSJohn Polstra phdr->p_align = 0; 14728c64af4fSJohn Polstra phdr++; 14738c64af4fSJohn Polstra 14740ff27d31SJohn Polstra /* All the writable segments from the program. */ 14750ff27d31SJohn Polstra phc.phdr = phdr; 14760ff27d31SJohn Polstra phc.offset = *off; 1477247aba24SMarcel Moolenaar each_writable_segment(td, cb_put_phdr, &phc); 14788c64af4fSJohn Polstra } 14798c64af4fSJohn Polstra } 14808c64af4fSJohn Polstra 14818c64af4fSJohn Polstra static void 14823ebc1248SPeter Wemm __elfN(putnote)(void *dst, size_t *off, const char *name, int type, 14838c64af4fSJohn Polstra const void *desc, size_t descsz) 14848c64af4fSJohn Polstra { 14858c64af4fSJohn Polstra Elf_Note note; 14868c64af4fSJohn Polstra 14878c64af4fSJohn Polstra note.n_namesz = strlen(name) + 1; 14888c64af4fSJohn Polstra note.n_descsz = descsz; 14898c64af4fSJohn Polstra note.n_type = type; 14908c64af4fSJohn Polstra if (dst != NULL) 14918c64af4fSJohn Polstra bcopy(¬e, (char *)dst + *off, sizeof note); 14928c64af4fSJohn Polstra *off += sizeof note; 14938c64af4fSJohn Polstra if (dst != NULL) 14948c64af4fSJohn Polstra bcopy(name, (char *)dst + *off, note.n_namesz); 14958c64af4fSJohn Polstra *off += roundup2(note.n_namesz, sizeof(Elf_Size)); 14968c64af4fSJohn Polstra if (dst != NULL) 14978c64af4fSJohn Polstra bcopy(desc, (char *)dst + *off, note.n_descsz); 14988c64af4fSJohn Polstra *off += roundup2(note.n_descsz, sizeof(Elf_Size)); 14998c64af4fSJohn Polstra } 15008c64af4fSJohn Polstra 15018c64af4fSJohn Polstra /* 150232c01de2SDmitry Chagin * Try to find the appropriate ABI-note section for checknote, 150332c01de2SDmitry Chagin * fetch the osreldate for binary from the ELF OSABI-note. Only the 150432c01de2SDmitry Chagin * first page of the image is searched, the same as for headers. 150532c01de2SDmitry Chagin */ 150632c01de2SDmitry Chagin static boolean_t 150732c01de2SDmitry Chagin __elfN(check_note)(struct image_params *imgp, Elf_Brandnote *checknote, 150832c01de2SDmitry Chagin int32_t *osrel) 150932c01de2SDmitry Chagin { 1510267c52fcSKonstantin Belousov const Elf_Note *note, *note0, *note_end; 1511429f5a58SKonstantin Belousov const Elf_Phdr *phdr, *pnote; 1512429f5a58SKonstantin Belousov const Elf_Ehdr *hdr; 151332c01de2SDmitry Chagin const char *note_name; 151432c01de2SDmitry Chagin int i; 151532c01de2SDmitry Chagin 151632c01de2SDmitry Chagin pnote = NULL; 1517429f5a58SKonstantin Belousov hdr = (const Elf_Ehdr *)imgp->image_header; 1518429f5a58SKonstantin Belousov phdr = (const Elf_Phdr *)(imgp->image_header + hdr->e_phoff); 151932c01de2SDmitry Chagin 152032c01de2SDmitry Chagin for (i = 0; i < hdr->e_phnum; i++) { 152132c01de2SDmitry Chagin if (phdr[i].p_type == PT_NOTE) { 152232c01de2SDmitry Chagin pnote = &phdr[i]; 152332c01de2SDmitry Chagin break; 152432c01de2SDmitry Chagin } 152532c01de2SDmitry Chagin } 152632c01de2SDmitry Chagin 152732c01de2SDmitry Chagin if (pnote == NULL || pnote->p_offset >= PAGE_SIZE || 152832c01de2SDmitry Chagin pnote->p_offset + pnote->p_filesz >= PAGE_SIZE) 152932c01de2SDmitry Chagin return (FALSE); 153032c01de2SDmitry Chagin 1531267c52fcSKonstantin Belousov note = note0 = (const Elf_Note *)(imgp->image_header + pnote->p_offset); 153232c01de2SDmitry Chagin note_end = (const Elf_Note *)(imgp->image_header + 153332c01de2SDmitry Chagin pnote->p_offset + pnote->p_filesz); 1534267c52fcSKonstantin Belousov for (i = 0; i < 100 && note >= note0 && note < note_end; i++) { 1535267c52fcSKonstantin Belousov if (!aligned(note, Elf32_Addr)) 1536267c52fcSKonstantin Belousov return (FALSE); 153732c01de2SDmitry Chagin if (note->n_namesz != checknote->hdr.n_namesz || 153832c01de2SDmitry Chagin note->n_descsz != checknote->hdr.n_descsz || 153932c01de2SDmitry Chagin note->n_type != checknote->hdr.n_type) 154032c01de2SDmitry Chagin goto nextnote; 154132c01de2SDmitry Chagin note_name = (const char *)(note + 1); 154232c01de2SDmitry Chagin if (strncmp(checknote->vendor, note_name, 154332c01de2SDmitry Chagin checknote->hdr.n_namesz) != 0) 154432c01de2SDmitry Chagin goto nextnote; 154532c01de2SDmitry Chagin 154632c01de2SDmitry Chagin /* 154732c01de2SDmitry Chagin * Fetch the osreldate for binary 154832c01de2SDmitry Chagin * from the ELF OSABI-note if necessary. 154932c01de2SDmitry Chagin */ 155089ffc202SBjoern A. Zeeb if ((checknote->flags & BN_TRANSLATE_OSREL) != 0 && 155189ffc202SBjoern A. Zeeb checknote->trans_osrel != NULL) 155289ffc202SBjoern A. Zeeb return (checknote->trans_osrel(note, osrel)); 155332c01de2SDmitry Chagin return (TRUE); 155432c01de2SDmitry Chagin 155532c01de2SDmitry Chagin nextnote: 155632c01de2SDmitry Chagin note = (const Elf_Note *)((const char *)(note + 1) + 155732c01de2SDmitry Chagin roundup2(note->n_namesz, sizeof(Elf32_Addr)) + 155832c01de2SDmitry Chagin roundup2(note->n_descsz, sizeof(Elf32_Addr))); 155932c01de2SDmitry Chagin } 156032c01de2SDmitry Chagin 156132c01de2SDmitry Chagin return (FALSE); 156232c01de2SDmitry Chagin } 156332c01de2SDmitry Chagin 156432c01de2SDmitry Chagin /* 1565e1743d02SSøren Schmidt * Tell kern_execve.c about it, with a little help from the linker. 1566e1743d02SSøren Schmidt */ 1567a360a43dSJake Burkholder static struct execsw __elfN(execsw) = { 1568a360a43dSJake Burkholder __CONCAT(exec_, __elfN(imgact)), 1569a360a43dSJake Burkholder __XSTRING(__CONCAT(ELF, __ELF_WORD_SIZE)) 1570a360a43dSJake Burkholder }; 1571a360a43dSJake Burkholder EXEC_SET(__CONCAT(elf, __ELF_WORD_SIZE), __elfN(execsw)); 1572e7228204SAlfred Perlstein 1573e7228204SAlfred Perlstein #ifdef COMPRESS_USER_CORES 1574e7228204SAlfred Perlstein /* 1575e7228204SAlfred Perlstein * Compress and write out a core segment for a user process. 1576e7228204SAlfred Perlstein * 1577e7228204SAlfred Perlstein * 'inbuf' is the starting address of a VM segment in the process' address 1578e7228204SAlfred Perlstein * space that is to be compressed and written out to the core file. 'dest_buf' 1579e7228204SAlfred Perlstein * is a buffer in the kernel's address space. The segment is copied from 1580e7228204SAlfred Perlstein * 'inbuf' to 'dest_buf' first before being processed by the compression 1581e7228204SAlfred Perlstein * routine gzwrite(). This copying is necessary because the content of the VM 1582e7228204SAlfred Perlstein * segment may change between the compression pass and the crc-computation pass 1583e7228204SAlfred Perlstein * in gzwrite(). This is because realtime threads may preempt the UNIX kernel. 1584e7228204SAlfred Perlstein */ 1585e7228204SAlfred Perlstein static int 1586e7228204SAlfred Perlstein compress_core (gzFile file, char *inbuf, char *dest_buf, unsigned int len, 1587e7228204SAlfred Perlstein struct thread *td) 1588e7228204SAlfred Perlstein { 1589e7228204SAlfred Perlstein int len_compressed; 1590e7228204SAlfred Perlstein int error = 0; 1591e7228204SAlfred Perlstein unsigned int chunk_len; 1592e7228204SAlfred Perlstein 1593e7228204SAlfred Perlstein while (len) { 1594e7228204SAlfred Perlstein chunk_len = (len > CORE_BUF_SIZE) ? CORE_BUF_SIZE : len; 1595e7228204SAlfred Perlstein copyin(inbuf, dest_buf, chunk_len); 1596e7228204SAlfred Perlstein len_compressed = gzwrite(file, dest_buf, chunk_len); 1597e7228204SAlfred Perlstein 1598e7228204SAlfred Perlstein EVENTHANDLER_INVOKE(app_coredump_progress, td, len_compressed); 1599e7228204SAlfred Perlstein 1600e7228204SAlfred Perlstein if ((unsigned int)len_compressed != chunk_len) { 1601e7228204SAlfred Perlstein log(LOG_WARNING, 1602e7228204SAlfred Perlstein "compress_core: length mismatch (0x%x returned, " 1603e7228204SAlfred Perlstein "0x%x expected)\n", len_compressed, chunk_len); 1604e7228204SAlfred Perlstein EVENTHANDLER_INVOKE(app_coredump_error, td, 1605e7228204SAlfred Perlstein "compress_core: length mismatch %x -> %x", 1606e7228204SAlfred Perlstein chunk_len, len_compressed); 1607e7228204SAlfred Perlstein error = EFAULT; 1608e7228204SAlfred Perlstein break; 1609e7228204SAlfred Perlstein } 1610e7228204SAlfred Perlstein inbuf += chunk_len; 1611e7228204SAlfred Perlstein len -= chunk_len; 1612e7228204SAlfred Perlstein if (ticks - PCPU_GET(switchticks) >= hogticks) 1613e7228204SAlfred Perlstein uio_yield(); 1614e7228204SAlfred Perlstein } 1615e7228204SAlfred Perlstein 1616e7228204SAlfred Perlstein return (error); 1617e7228204SAlfred Perlstein } 1618e7228204SAlfred Perlstein #endif /* COMPRESS_USER_CORES */ 1619