1e1743d02SSøren Schmidt /*- 221a3ee0eSDavid E. O'Brien * Copyright (c) 2000 David O'Brien 39a14aa01SUlrich Spörlein * Copyright (c) 1995-1996 Søren Schmidt 4e1743d02SSøren Schmidt * Copyright (c) 1996 Peter Wemm 5e1743d02SSøren Schmidt * All rights reserved. 6e1743d02SSøren Schmidt * 7e1743d02SSøren Schmidt * Redistribution and use in source and binary forms, with or without 8e1743d02SSøren Schmidt * modification, are permitted provided that the following conditions 9e1743d02SSøren Schmidt * are met: 10e1743d02SSøren Schmidt * 1. Redistributions of source code must retain the above copyright 11e1743d02SSøren Schmidt * notice, this list of conditions and the following disclaimer 12e1743d02SSøren Schmidt * in this position and unchanged. 13e1743d02SSøren Schmidt * 2. Redistributions in binary form must reproduce the above copyright 14e1743d02SSøren Schmidt * notice, this list of conditions and the following disclaimer in the 15e1743d02SSøren Schmidt * documentation and/or other materials provided with the distribution. 16e1743d02SSøren Schmidt * 3. The name of the author may not be used to endorse or promote products 1721dc7d4fSJens Schweikhardt * derived from this software without specific prior written permission 18e1743d02SSøren Schmidt * 19e1743d02SSøren Schmidt * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 20e1743d02SSøren Schmidt * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 21e1743d02SSøren Schmidt * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 
22e1743d02SSøren Schmidt * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 23e1743d02SSøren Schmidt * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 24e1743d02SSøren Schmidt * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 25e1743d02SSøren Schmidt * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 26e1743d02SSøren Schmidt * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 27e1743d02SSøren Schmidt * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 28e1743d02SSøren Schmidt * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 29e1743d02SSøren Schmidt */ 30e1743d02SSøren Schmidt 31677b542eSDavid E. O'Brien #include <sys/cdefs.h> 32677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 33677b542eSDavid E. O'Brien 3412bc222eSJonathan Anderson #include "opt_capsicum.h" 3562919d78SPeter Wemm #include "opt_compat.h" 36aa14e9b7SMark Johnston #include "opt_gzio.h" 3762919d78SPeter Wemm 38e1743d02SSøren Schmidt #include <sys/param.h> 394a144410SRobert Watson #include <sys/capsicum.h> 40e1743d02SSøren Schmidt #include <sys/exec.h> 418c64af4fSJohn Polstra #include <sys/fcntl.h> 42aa14e9b7SMark Johnston #include <sys/gzio.h> 43e1743d02SSøren Schmidt #include <sys/imgact.h> 44e1743d02SSøren Schmidt #include <sys/imgact_elf.h> 45b96bd95bSIan Lepore #include <sys/jail.h> 46e1743d02SSøren Schmidt #include <sys/kernel.h> 47f34fa851SJohn Baldwin #include <sys/lock.h> 48e1743d02SSøren Schmidt #include <sys/malloc.h> 4968ff2a43SChristian S.J. 
Peron #include <sys/mount.h> 508c64af4fSJohn Polstra #include <sys/mman.h> 51a794e791SBruce Evans #include <sys/namei.h> 528c64af4fSJohn Polstra #include <sys/pioctl.h> 53a794e791SBruce Evans #include <sys/proc.h> 548c64af4fSJohn Polstra #include <sys/procfs.h> 551ba5ad42SEdward Tomasz Napierala #include <sys/racct.h> 568c64af4fSJohn Polstra #include <sys/resourcevar.h> 5789f6b863SAttilio Rao #include <sys/rwlock.h> 58bd390213SMikolaj Golub #include <sys/sbuf.h> 59da61b9a6SAlan Cox #include <sys/sf_buf.h> 60ee235befSKonstantin Belousov #include <sys/smp.h> 6136240ea5SDoug Rabson #include <sys/systm.h> 62e1743d02SSøren Schmidt #include <sys/signalvar.h> 638c64af4fSJohn Polstra #include <sys/stat.h> 641005a129SJohn Baldwin #include <sys/sx.h> 658c64af4fSJohn Polstra #include <sys/syscall.h> 66e1743d02SSøren Schmidt #include <sys/sysctl.h> 678c64af4fSJohn Polstra #include <sys/sysent.h> 68a794e791SBruce Evans #include <sys/vnode.h> 69e7228204SAlfred Perlstein #include <sys/syslog.h> 70e7228204SAlfred Perlstein #include <sys/eventhandler.h> 71f1fca82eSMikolaj Golub #include <sys/user.h> 72e7228204SAlfred Perlstein 73e1743d02SSøren Schmidt #include <vm/vm.h> 74e1743d02SSøren Schmidt #include <vm/vm_kern.h> 75e1743d02SSøren Schmidt #include <vm/vm_param.h> 76e1743d02SSøren Schmidt #include <vm/pmap.h> 77e1743d02SSøren Schmidt #include <vm/vm_map.h> 780ff27d31SJohn Polstra #include <vm/vm_object.h> 79e1743d02SSøren Schmidt #include <vm/vm_extern.h> 80e1743d02SSøren Schmidt 8152c24af7SPeter Wemm #include <machine/elf.h> 82e1743d02SSøren Schmidt #include <machine/md_var.h> 83e1743d02SSøren Schmidt 841b8388cdSMikolaj Golub #define ELF_NOTE_ROUNDSIZE 4 85c815a20cSDavid E. O'Brien #define OLD_EI_BRAND 8 86c815a20cSDavid E. 
O'Brien 873ebc1248SPeter Wemm static int __elfN(check_header)(const Elf_Ehdr *hdr); 8832c01de2SDmitry Chagin static Elf_Brandinfo *__elfN(get_brandinfo)(struct image_params *imgp, 89d1ae5c83SKonstantin Belousov const char *interp, int interp_name_len, int32_t *osrel); 903ebc1248SPeter Wemm static int __elfN(load_file)(struct proc *p, const char *file, u_long *addr, 913ebc1248SPeter Wemm u_long *entry, size_t pagesize); 92292177e6SAlan Cox static int __elfN(load_section)(struct image_params *imgp, vm_offset_t offset, 93292177e6SAlan Cox caddr_t vmaddr, size_t memsz, size_t filsz, vm_prot_t prot, 94292177e6SAlan Cox size_t pagesize); 953ebc1248SPeter Wemm static int __CONCAT(exec_, __elfN(imgact))(struct image_params *imgp); 9689ffc202SBjoern A. Zeeb static boolean_t __elfN(freebsd_trans_osrel)(const Elf_Note *note, 9789ffc202SBjoern A. Zeeb int32_t *osrel); 9889ffc202SBjoern A. Zeeb static boolean_t kfreebsd_trans_osrel(const Elf_Note *note, int32_t *osrel); 9932c01de2SDmitry Chagin static boolean_t __elfN(check_note)(struct image_params *imgp, 10032c01de2SDmitry Chagin Elf_Brandnote *checknote, int32_t *osrel); 101ed167eaaSKonstantin Belousov static vm_prot_t __elfN(trans_prot)(Elf_Word); 102ed167eaaSKonstantin Belousov static Elf_Word __elfN(untrans_prot)(vm_prot_t); 103e1743d02SSøren Schmidt 104a360a43dSJake Burkholder SYSCTL_NODE(_kern, OID_AUTO, __CONCAT(elf, __ELF_WORD_SIZE), CTLFLAG_RW, 0, 105a360a43dSJake Burkholder ""); 106a360a43dSJake Burkholder 107bd390213SMikolaj Golub #define CORE_BUF_SIZE (16 * 1024) 108e7228204SAlfred Perlstein 109e548a1d4SJake Burkholder int __elfN(fallback_brand) = -1; 110e548a1d4SJake Burkholder SYSCTL_INT(__CONCAT(_kern_elf, __ELF_WORD_SIZE), OID_AUTO, 111af3b2549SHans Petter Selasky fallback_brand, CTLFLAG_RWTUN, &__elfN(fallback_brand), 0, 112a360a43dSJake Burkholder __XSTRING(__CONCAT(ELF, __ELF_WORD_SIZE)) " brand of last resort"); 113a360a43dSJake Burkholder 114551d79e1SMarcel Moolenaar static int elf_legacy_coredump = 0; 
115a360a43dSJake Burkholder SYSCTL_INT(_debug, OID_AUTO, __elfN(legacy_coredump), CTLFLAG_RW, 1161cbb879dSEd Maste &elf_legacy_coredump, 0, 1171cbb879dSEd Maste "include all and only RW pages in core dumps"); 118e1743d02SSøren Schmidt 11962c625fdSKonstantin Belousov int __elfN(nxstack) = 1204d22d07aSKonstantin Belousov #if defined(__amd64__) || defined(__powerpc64__) /* both 64 and 32 bit */ || \ 1214d22d07aSKonstantin Belousov (defined(__arm__) && __ARM_ARCH >= 7) || defined(__aarch64__) 12262c625fdSKonstantin Belousov 1; 12362c625fdSKonstantin Belousov #else 12462c625fdSKonstantin Belousov 0; 12562c625fdSKonstantin Belousov #endif 126291c06a1SKonstantin Belousov SYSCTL_INT(__CONCAT(_kern_elf, __ELF_WORD_SIZE), OID_AUTO, 127291c06a1SKonstantin Belousov nxstack, CTLFLAG_RW, &__elfN(nxstack), 0, 128291c06a1SKonstantin Belousov __XSTRING(__CONCAT(ELF, __ELF_WORD_SIZE)) ": enable non-executable stack"); 129291c06a1SKonstantin Belousov 130126b36a2SKonstantin Belousov #if __ELF_WORD_SIZE == 32 131e7d939bdSMarcel Moolenaar #if defined(__amd64__) 132126b36a2SKonstantin Belousov int i386_read_exec = 0; 133126b36a2SKonstantin Belousov SYSCTL_INT(_kern_elf32, OID_AUTO, read_exec, CTLFLAG_RW, &i386_read_exec, 0, 134126b36a2SKonstantin Belousov "enable execution from readable segments"); 135126b36a2SKonstantin Belousov #endif 136126b36a2SKonstantin Belousov #endif 137126b36a2SKonstantin Belousov 1383ebc1248SPeter Wemm static Elf_Brandinfo *elf_brand_list[MAX_BRANDS]; 139e1743d02SSøren Schmidt 140d9c9c81cSPedro F. Giffuni #define trunc_page_ps(va, ps) rounddown2(va, ps) 141d9c9c81cSPedro F. 
Giffuni #define round_page_ps(va, ps) roundup2(va, ps) 14293d1c728SKonstantin Belousov #define aligned(a, t) (trunc_page_ps((u_long)(a), sizeof(t)) == (u_long)(a)) 14393d1c728SKonstantin Belousov 14432c01de2SDmitry Chagin static const char FREEBSD_ABI_VENDOR[] = "FreeBSD"; 14532c01de2SDmitry Chagin 14632c01de2SDmitry Chagin Elf_Brandnote __elfN(freebsd_brandnote) = { 14732c01de2SDmitry Chagin .hdr.n_namesz = sizeof(FREEBSD_ABI_VENDOR), 14832c01de2SDmitry Chagin .hdr.n_descsz = sizeof(int32_t), 1494c22b468SEd Maste .hdr.n_type = NT_FREEBSD_ABI_TAG, 15032c01de2SDmitry Chagin .vendor = FREEBSD_ABI_VENDOR, 15189ffc202SBjoern A. Zeeb .flags = BN_TRANSLATE_OSREL, 15289ffc202SBjoern A. Zeeb .trans_osrel = __elfN(freebsd_trans_osrel) 15332c01de2SDmitry Chagin }; 15432c01de2SDmitry Chagin 15589ffc202SBjoern A. Zeeb static boolean_t 15689ffc202SBjoern A. Zeeb __elfN(freebsd_trans_osrel)(const Elf_Note *note, int32_t *osrel) 15789ffc202SBjoern A. Zeeb { 15889ffc202SBjoern A. Zeeb uintptr_t p; 15989ffc202SBjoern A. Zeeb 16089ffc202SBjoern A. Zeeb p = (uintptr_t)(note + 1); 1611b8388cdSMikolaj Golub p += roundup2(note->n_namesz, ELF_NOTE_ROUNDSIZE); 16289ffc202SBjoern A. Zeeb *osrel = *(const int32_t *)(p); 16389ffc202SBjoern A. Zeeb 16489ffc202SBjoern A. Zeeb return (TRUE); 16589ffc202SBjoern A. Zeeb } 16689ffc202SBjoern A. Zeeb 16789ffc202SBjoern A. Zeeb static const char GNU_ABI_VENDOR[] = "GNU"; 16889ffc202SBjoern A. Zeeb static int GNU_KFREEBSD_ABI_DESC = 3; 16989ffc202SBjoern A. Zeeb 17089ffc202SBjoern A. Zeeb Elf_Brandnote __elfN(kfreebsd_brandnote) = { 17189ffc202SBjoern A. Zeeb .hdr.n_namesz = sizeof(GNU_ABI_VENDOR), 17289ffc202SBjoern A. Zeeb .hdr.n_descsz = 16, /* XXX at least 16 */ 17389ffc202SBjoern A. Zeeb .hdr.n_type = 1, 17489ffc202SBjoern A. Zeeb .vendor = GNU_ABI_VENDOR, 17589ffc202SBjoern A. Zeeb .flags = BN_TRANSLATE_OSREL, 17689ffc202SBjoern A. Zeeb .trans_osrel = kfreebsd_trans_osrel 17789ffc202SBjoern A. Zeeb }; 17889ffc202SBjoern A. 
Zeeb 17989ffc202SBjoern A. Zeeb static boolean_t 18089ffc202SBjoern A. Zeeb kfreebsd_trans_osrel(const Elf_Note *note, int32_t *osrel) 18189ffc202SBjoern A. Zeeb { 18289ffc202SBjoern A. Zeeb const Elf32_Word *desc; 18389ffc202SBjoern A. Zeeb uintptr_t p; 18489ffc202SBjoern A. Zeeb 18589ffc202SBjoern A. Zeeb p = (uintptr_t)(note + 1); 1861b8388cdSMikolaj Golub p += roundup2(note->n_namesz, ELF_NOTE_ROUNDSIZE); 18789ffc202SBjoern A. Zeeb 18889ffc202SBjoern A. Zeeb desc = (const Elf32_Word *)p; 18989ffc202SBjoern A. Zeeb if (desc[0] != GNU_KFREEBSD_ABI_DESC) 19089ffc202SBjoern A. Zeeb return (FALSE); 19189ffc202SBjoern A. Zeeb 19289ffc202SBjoern A. Zeeb /* 19389ffc202SBjoern A. Zeeb * Debian GNU/kFreeBSD embed the earliest compatible kernel version 19489ffc202SBjoern A. Zeeb * (__FreeBSD_version: <major><two digit minor>Rxx) in the LSB way. 19589ffc202SBjoern A. Zeeb */ 19689ffc202SBjoern A. Zeeb *osrel = desc[1] * 100000 + desc[2] * 1000 + desc[3]; 19789ffc202SBjoern A. Zeeb 19889ffc202SBjoern A. Zeeb return (TRUE); 19989ffc202SBjoern A. Zeeb } 20089ffc202SBjoern A. Zeeb 201e1743d02SSøren Schmidt int 2023ebc1248SPeter Wemm __elfN(insert_brand_entry)(Elf_Brandinfo *entry) 203e1743d02SSøren Schmidt { 204e1743d02SSøren Schmidt int i; 205e1743d02SSøren Schmidt 2063ebc1248SPeter Wemm for (i = 0; i < MAX_BRANDS; i++) { 207ea5a2b2eSSøren Schmidt if (elf_brand_list[i] == NULL) { 208ea5a2b2eSSøren Schmidt elf_brand_list[i] = entry; 209e1743d02SSøren Schmidt break; 210e1743d02SSøren Schmidt } 211e1743d02SSøren Schmidt } 212925c8b5bSBjoern A. Zeeb if (i == MAX_BRANDS) { 213925c8b5bSBjoern A. Zeeb printf("WARNING: %s: could not insert brandinfo entry: %p\n", 214925c8b5bSBjoern A. Zeeb __func__, entry); 215a7cddfedSJake Burkholder return (-1); 216925c8b5bSBjoern A. 
Zeeb } 217a7cddfedSJake Burkholder return (0); 218e1743d02SSøren Schmidt } 219e1743d02SSøren Schmidt 220e1743d02SSøren Schmidt int 2213ebc1248SPeter Wemm __elfN(remove_brand_entry)(Elf_Brandinfo *entry) 222e1743d02SSøren Schmidt { 223e1743d02SSøren Schmidt int i; 224e1743d02SSøren Schmidt 2253ebc1248SPeter Wemm for (i = 0; i < MAX_BRANDS; i++) { 226ea5a2b2eSSøren Schmidt if (elf_brand_list[i] == entry) { 227ea5a2b2eSSøren Schmidt elf_brand_list[i] = NULL; 228e1743d02SSøren Schmidt break; 229e1743d02SSøren Schmidt } 230e1743d02SSøren Schmidt } 231ea5a2b2eSSøren Schmidt if (i == MAX_BRANDS) 232a7cddfedSJake Burkholder return (-1); 233a7cddfedSJake Burkholder return (0); 234e1743d02SSøren Schmidt } 235e1743d02SSøren Schmidt 236096977faSMark Newton int 2373ebc1248SPeter Wemm __elfN(brand_inuse)(Elf_Brandinfo *entry) 238096977faSMark Newton { 239096977faSMark Newton struct proc *p; 240553629ebSJake Burkholder int rval = FALSE; 241096977faSMark Newton 2421005a129SJohn Baldwin sx_slock(&allproc_lock); 2434f506694SXin LI FOREACH_PROC_IN_SYSTEM(p) { 244553629ebSJake Burkholder if (p->p_sysent == entry->sysvec) { 245553629ebSJake Burkholder rval = TRUE; 246553629ebSJake Burkholder break; 247096977faSMark Newton } 248553629ebSJake Burkholder } 2491005a129SJohn Baldwin sx_sunlock(&allproc_lock); 250096977faSMark Newton 251553629ebSJake Burkholder return (rval); 252096977faSMark Newton } 253096977faSMark Newton 2545fe3ed62SJake Burkholder static Elf_Brandinfo * 25532c01de2SDmitry Chagin __elfN(get_brandinfo)(struct image_params *imgp, const char *interp, 256d1ae5c83SKonstantin Belousov int interp_name_len, int32_t *osrel) 2575fe3ed62SJake Burkholder { 25832c01de2SDmitry Chagin const Elf_Ehdr *hdr = (const Elf_Ehdr *)imgp->image_header; 259af582aaeSKonstantin Belousov Elf_Brandinfo *bi, *bi_m; 26032c01de2SDmitry Chagin boolean_t ret; 2615fe3ed62SJake Burkholder int i; 2625fe3ed62SJake Burkholder 2635fe3ed62SJake Burkholder /* 26432c01de2SDmitry Chagin * We support four types of 
branding -- (1) the ELF EI_OSABI field 2655fe3ed62SJake Burkholder * that SCO added to the ELF spec, (2) FreeBSD 3.x's traditional string 26632c01de2SDmitry Chagin * branding w/in the ELF header, (3) path of the `interp_path' 26732c01de2SDmitry Chagin * field, and (4) the ".note.ABI-tag" ELF section. 2685fe3ed62SJake Burkholder */ 2695fe3ed62SJake Burkholder 27032c01de2SDmitry Chagin /* Look for an ".note.ABI-tag" ELF section */ 271af582aaeSKonstantin Belousov bi_m = NULL; 27232c01de2SDmitry Chagin for (i = 0; i < MAX_BRANDS; i++) { 27332c01de2SDmitry Chagin bi = elf_brand_list[i]; 274ecc2fda8SBjoern A. Zeeb if (bi == NULL) 275ecc2fda8SBjoern A. Zeeb continue; 276ecc2fda8SBjoern A. Zeeb if (hdr->e_machine == bi->machine && (bi->flags & 277ecc2fda8SBjoern A. Zeeb (BI_BRAND_NOTE|BI_BRAND_NOTE_MANDATORY)) != 0) { 27832c01de2SDmitry Chagin ret = __elfN(check_note)(imgp, bi->brand_note, osrel); 279f19d421aSNathan Whitehorn /* Give brand a chance to veto check_note's guess */ 280f19d421aSNathan Whitehorn if (ret && bi->header_supported) 281f19d421aSNathan Whitehorn ret = bi->header_supported(imgp); 282af582aaeSKonstantin Belousov /* 283af582aaeSKonstantin Belousov * If note checker claimed the binary, but the 284af582aaeSKonstantin Belousov * interpreter path in the image does not 285af582aaeSKonstantin Belousov * match default one for the brand, try to 286af582aaeSKonstantin Belousov * search for other brands with the same 287af582aaeSKonstantin Belousov * interpreter. Either there is better brand 288af582aaeSKonstantin Belousov * with the right interpreter, or, failing 289af582aaeSKonstantin Belousov * this, we return first brand which accepted 290af582aaeSKonstantin Belousov * our note and, optionally, header. 
291af582aaeSKonstantin Belousov */ 292af582aaeSKonstantin Belousov if (ret && bi_m == NULL && (strlen(bi->interp_path) + 293af582aaeSKonstantin Belousov 1 != interp_name_len || strncmp(interp, 294af582aaeSKonstantin Belousov bi->interp_path, interp_name_len) != 0)) { 295af582aaeSKonstantin Belousov bi_m = bi; 296af582aaeSKonstantin Belousov ret = 0; 297af582aaeSKonstantin Belousov } 29832c01de2SDmitry Chagin if (ret) 29932c01de2SDmitry Chagin return (bi); 30032c01de2SDmitry Chagin } 30132c01de2SDmitry Chagin } 302af582aaeSKonstantin Belousov if (bi_m != NULL) 303af582aaeSKonstantin Belousov return (bi_m); 30432c01de2SDmitry Chagin 3055fe3ed62SJake Burkholder /* If the executable has a brand, search for it in the brand list. */ 3065fe3ed62SJake Burkholder for (i = 0; i < MAX_BRANDS; i++) { 3075fe3ed62SJake Burkholder bi = elf_brand_list[i]; 308ecc2fda8SBjoern A. Zeeb if (bi == NULL || bi->flags & BI_BRAND_NOTE_MANDATORY) 309ecc2fda8SBjoern A. Zeeb continue; 310ecc2fda8SBjoern A. Zeeb if (hdr->e_machine == bi->machine && 3115fe3ed62SJake Burkholder (hdr->e_ident[EI_OSABI] == bi->brand || 3125fe3ed62SJake Burkholder strncmp((const char *)&hdr->e_ident[OLD_EI_BRAND], 313686d2f31SNathan Whitehorn bi->compat_3_brand, strlen(bi->compat_3_brand)) == 0)) { 314686d2f31SNathan Whitehorn /* Looks good, but give brand a chance to veto */ 315686d2f31SNathan Whitehorn if (!bi->header_supported || bi->header_supported(imgp)) 3165fe3ed62SJake Burkholder return (bi); 3175fe3ed62SJake Burkholder } 318686d2f31SNathan Whitehorn } 3195fe3ed62SJake Burkholder 320817dc004SWarner Losh /* No known brand, see if the header is recognized by any brand */ 321817dc004SWarner Losh for (i = 0; i < MAX_BRANDS; i++) { 322817dc004SWarner Losh bi = elf_brand_list[i]; 323817dc004SWarner Losh if (bi == NULL || bi->flags & BI_BRAND_NOTE_MANDATORY || 324817dc004SWarner Losh bi->header_supported == NULL) 325817dc004SWarner Losh continue; 326817dc004SWarner Losh if (hdr->e_machine == bi->machine) { 
327817dc004SWarner Losh ret = bi->header_supported(imgp); 328817dc004SWarner Losh if (ret) 329817dc004SWarner Losh return (bi); 330817dc004SWarner Losh } 331817dc004SWarner Losh } 332817dc004SWarner Losh 3335fe3ed62SJake Burkholder /* Lacking a known brand, search for a recognized interpreter. */ 3345fe3ed62SJake Burkholder if (interp != NULL) { 3355fe3ed62SJake Burkholder for (i = 0; i < MAX_BRANDS; i++) { 3365fe3ed62SJake Burkholder bi = elf_brand_list[i]; 337ecc2fda8SBjoern A. Zeeb if (bi == NULL || bi->flags & BI_BRAND_NOTE_MANDATORY) 338ecc2fda8SBjoern A. Zeeb continue; 339ecc2fda8SBjoern A. Zeeb if (hdr->e_machine == bi->machine && 340d1ae5c83SKonstantin Belousov /* ELF image p_filesz includes terminating zero */ 341d1ae5c83SKonstantin Belousov strlen(bi->interp_path) + 1 == interp_name_len && 342d1ae5c83SKonstantin Belousov strncmp(interp, bi->interp_path, interp_name_len) 343d1ae5c83SKonstantin Belousov == 0) 3445fe3ed62SJake Burkholder return (bi); 3455fe3ed62SJake Burkholder } 3465fe3ed62SJake Burkholder } 3475fe3ed62SJake Burkholder 3485fe3ed62SJake Burkholder /* Lacking a recognized interpreter, try the default brand */ 3495fe3ed62SJake Burkholder for (i = 0; i < MAX_BRANDS; i++) { 3505fe3ed62SJake Burkholder bi = elf_brand_list[i]; 351ecc2fda8SBjoern A. Zeeb if (bi == NULL || bi->flags & BI_BRAND_NOTE_MANDATORY) 352ecc2fda8SBjoern A. Zeeb continue; 353ecc2fda8SBjoern A. 
Zeeb if (hdr->e_machine == bi->machine && 354e548a1d4SJake Burkholder __elfN(fallback_brand) == bi->brand) 3555fe3ed62SJake Burkholder return (bi); 3565fe3ed62SJake Burkholder } 3575fe3ed62SJake Burkholder return (NULL); 3585fe3ed62SJake Burkholder } 3595fe3ed62SJake Burkholder 360e1743d02SSøren Schmidt static int 3613ebc1248SPeter Wemm __elfN(check_header)(const Elf_Ehdr *hdr) 362e1743d02SSøren Schmidt { 363d0ca7c29SPeter Wemm Elf_Brandinfo *bi; 3643ebc1248SPeter Wemm int i; 3653ebc1248SPeter Wemm 36652c24af7SPeter Wemm if (!IS_ELF(*hdr) || 36752c24af7SPeter Wemm hdr->e_ident[EI_CLASS] != ELF_TARG_CLASS || 36852c24af7SPeter Wemm hdr->e_ident[EI_DATA] != ELF_TARG_DATA || 3693dc19c46SJacques Vidrine hdr->e_ident[EI_VERSION] != EV_CURRENT || 3703dc19c46SJacques Vidrine hdr->e_phentsize != sizeof(Elf_Phdr) || 3713dc19c46SJacques Vidrine hdr->e_version != ELF_TARG_VER) 372a7cddfedSJake Burkholder return (ENOEXEC); 373e1743d02SSøren Schmidt 3743ebc1248SPeter Wemm /* 3753ebc1248SPeter Wemm * Make sure we have at least one brand for this machine. 
3763ebc1248SPeter Wemm */ 3773ebc1248SPeter Wemm 3783ebc1248SPeter Wemm for (i = 0; i < MAX_BRANDS; i++) { 379d0ca7c29SPeter Wemm bi = elf_brand_list[i]; 380d0ca7c29SPeter Wemm if (bi != NULL && bi->machine == hdr->e_machine) 3813ebc1248SPeter Wemm break; 3823ebc1248SPeter Wemm } 3833ebc1248SPeter Wemm if (i == MAX_BRANDS) 384a7cddfedSJake Burkholder return (ENOEXEC); 385e1743d02SSøren Schmidt 386a7cddfedSJake Burkholder return (0); 387e1743d02SSøren Schmidt } 388e1743d02SSøren Schmidt 389e1743d02SSøren Schmidt static int 3903ebc1248SPeter Wemm __elfN(map_partial)(vm_map_t map, vm_object_t object, vm_ooffset_t offset, 391ff6f03c7SAlan Cox vm_offset_t start, vm_offset_t end, vm_prot_t prot) 3923ebc1248SPeter Wemm { 393da61b9a6SAlan Cox struct sf_buf *sf; 394da61b9a6SAlan Cox int error; 3953ebc1248SPeter Wemm vm_offset_t off; 3963ebc1248SPeter Wemm 3973ebc1248SPeter Wemm /* 3983ebc1248SPeter Wemm * Create the page if it doesn't exist yet. Ignore errors. 3993ebc1248SPeter Wemm */ 4003ebc1248SPeter Wemm vm_map_lock(map); 401ff6f03c7SAlan Cox vm_map_insert(map, NULL, 0, trunc_page(start), round_page(end), 402ff6f03c7SAlan Cox VM_PROT_ALL, VM_PROT_ALL, 0); 4033ebc1248SPeter Wemm vm_map_unlock(map); 4043ebc1248SPeter Wemm 4053ebc1248SPeter Wemm /* 4063ebc1248SPeter Wemm * Find the page from the underlying object. 
4073ebc1248SPeter Wemm */ 408*28e8da65SAlan Cox if (object != NULL) { 409da61b9a6SAlan Cox sf = vm_imgact_map_page(object, offset); 410da61b9a6SAlan Cox if (sf == NULL) 411da61b9a6SAlan Cox return (KERN_FAILURE); 4123ebc1248SPeter Wemm off = offset - trunc_page(offset); 413da61b9a6SAlan Cox error = copyout((caddr_t)sf_buf_kva(sf) + off, (caddr_t)start, 414ca0387efSJake Burkholder end - start); 415be996836SAttilio Rao vm_imgact_unmap_page(sf); 416fe0a8a39SKonstantin Belousov if (error != 0) 417a7cddfedSJake Burkholder return (KERN_FAILURE); 4183ebc1248SPeter Wemm } 4193ebc1248SPeter Wemm 420a7cddfedSJake Burkholder return (KERN_SUCCESS); 4213ebc1248SPeter Wemm } 4223ebc1248SPeter Wemm 4233ebc1248SPeter Wemm static int 424e3d8f8feSKonstantin Belousov __elfN(map_insert)(struct image_params *imgp, vm_map_t map, vm_object_t object, 425e3d8f8feSKonstantin Belousov vm_ooffset_t offset, vm_offset_t start, vm_offset_t end, vm_prot_t prot, 426e3d8f8feSKonstantin Belousov int cow) 4273ebc1248SPeter Wemm { 428da61b9a6SAlan Cox struct sf_buf *sf; 429da61b9a6SAlan Cox vm_offset_t off; 430a063facbSMarcel Moolenaar vm_size_t sz; 431e3d8f8feSKonstantin Belousov int error, locked, rv; 4323ebc1248SPeter Wemm 4333ebc1248SPeter Wemm if (start != trunc_page(start)) { 43481f223caSJake Burkholder rv = __elfN(map_partial)(map, object, offset, start, 435ff6f03c7SAlan Cox round_page(start), prot); 436*28e8da65SAlan Cox if (rv != KERN_SUCCESS) 437a7cddfedSJake Burkholder return (rv); 4383ebc1248SPeter Wemm offset += round_page(start) - start; 4393ebc1248SPeter Wemm start = round_page(start); 4403ebc1248SPeter Wemm } 4413ebc1248SPeter Wemm if (end != round_page(end)) { 44281f223caSJake Burkholder rv = __elfN(map_partial)(map, object, offset + 443ff6f03c7SAlan Cox trunc_page(end) - start, trunc_page(end), end, prot); 444*28e8da65SAlan Cox if (rv != KERN_SUCCESS) 445a7cddfedSJake Burkholder return (rv); 4463ebc1248SPeter Wemm end = trunc_page(end); 4473ebc1248SPeter Wemm } 4483ebc1248SPeter Wemm 
if (end > start) { 4493ebc1248SPeter Wemm if (offset & PAGE_MASK) { 4503ebc1248SPeter Wemm /* 4513ebc1248SPeter Wemm * The mapping is not page aligned. This means we have 4523ebc1248SPeter Wemm * to copy the data. Sigh. 4533ebc1248SPeter Wemm */ 45455b985b4SKonstantin Belousov vm_map_lock(map); 45555b985b4SKonstantin Belousov rv = vm_map_insert(map, NULL, 0, start, end, 45655b985b4SKonstantin Belousov prot | VM_PROT_WRITE, VM_PROT_ALL, 0); 45755b985b4SKonstantin Belousov vm_map_unlock(map); 4585420f76bSKonstantin Belousov if (rv != KERN_SUCCESS) 459a7cddfedSJake Burkholder return (rv); 460da61b9a6SAlan Cox if (object == NULL) 461da61b9a6SAlan Cox return (KERN_SUCCESS); 462da61b9a6SAlan Cox for (; start < end; start += sz) { 463da61b9a6SAlan Cox sf = vm_imgact_map_page(object, offset); 464da61b9a6SAlan Cox if (sf == NULL) 465da61b9a6SAlan Cox return (KERN_FAILURE); 4663ebc1248SPeter Wemm off = offset - trunc_page(offset); 4673ebc1248SPeter Wemm sz = end - start; 468da61b9a6SAlan Cox if (sz > PAGE_SIZE - off) 469da61b9a6SAlan Cox sz = PAGE_SIZE - off; 470da61b9a6SAlan Cox error = copyout((caddr_t)sf_buf_kva(sf) + off, 4713ebc1248SPeter Wemm (caddr_t)start, sz); 472be996836SAttilio Rao vm_imgact_unmap_page(sf); 4735420f76bSKonstantin Belousov if (error != 0) 474a7cddfedSJake Burkholder return (KERN_FAILURE); 475da61b9a6SAlan Cox offset += sz; 4763ebc1248SPeter Wemm } 4773ebc1248SPeter Wemm rv = KERN_SUCCESS; 4783ebc1248SPeter Wemm } else { 479e5e6093bSAlan Cox vm_object_reference(object); 4803ebc1248SPeter Wemm vm_map_lock(map); 4813ebc1248SPeter Wemm rv = vm_map_insert(map, object, offset, start, end, 482ff6f03c7SAlan Cox prot, VM_PROT_ALL, cow); 4833ebc1248SPeter Wemm vm_map_unlock(map); 484e3d8f8feSKonstantin Belousov if (rv != KERN_SUCCESS) { 485e3d8f8feSKonstantin Belousov locked = VOP_ISLOCKED(imgp->vp); 486e3d8f8feSKonstantin Belousov VOP_UNLOCK(imgp->vp, 0); 487e5e6093bSAlan Cox vm_object_deallocate(object); 488e3d8f8feSKonstantin Belousov vn_lock(imgp->vp, 
locked | LK_RETRY); 489e3d8f8feSKonstantin Belousov } 4903ebc1248SPeter Wemm } 491a7cddfedSJake Burkholder return (rv); 4923ebc1248SPeter Wemm } else { 493a7cddfedSJake Burkholder return (KERN_SUCCESS); 4943ebc1248SPeter Wemm } 4953ebc1248SPeter Wemm } 4963ebc1248SPeter Wemm 4973ebc1248SPeter Wemm static int 498292177e6SAlan Cox __elfN(load_section)(struct image_params *imgp, vm_offset_t offset, 4993ebc1248SPeter Wemm caddr_t vmaddr, size_t memsz, size_t filsz, vm_prot_t prot, 5003ebc1248SPeter Wemm size_t pagesize) 501e1743d02SSøren Schmidt { 502da61b9a6SAlan Cox struct sf_buf *sf; 503e1743d02SSøren Schmidt size_t map_len; 504292177e6SAlan Cox vm_map_t map; 505292177e6SAlan Cox vm_object_t object; 506e1743d02SSøren Schmidt vm_offset_t map_addr; 507fa7dd9c5SMatthew Dillon int error, rv, cow; 508e1743d02SSøren Schmidt size_t copy_len; 50952c24af7SPeter Wemm vm_offset_t file_addr; 51052c24af7SPeter Wemm 51125ead034SBrian Feldman /* 51225ead034SBrian Feldman * It's necessary to fail if the filsz + offset taken from the 51325ead034SBrian Feldman * header is greater than the actual file pager object's size. 51425ead034SBrian Feldman * If we were to allow this, then the vm_map_find() below would 51525ead034SBrian Feldman * walk right off the end of the file object and into the ether. 51625ead034SBrian Feldman * 51725ead034SBrian Feldman * While I'm here, might as well check for something else that 51825ead034SBrian Feldman * is invalid: filsz cannot be greater than memsz. 
51925ead034SBrian Feldman */ 520292177e6SAlan Cox if ((off_t)filsz + offset > imgp->attr->va_size || filsz > memsz) { 52125ead034SBrian Feldman uprintf("elf_load_section: truncated ELF file\n"); 52225ead034SBrian Feldman return (ENOEXEC); 52325ead034SBrian Feldman } 52425ead034SBrian Feldman 525292177e6SAlan Cox object = imgp->object; 526292177e6SAlan Cox map = &imgp->proc->p_vmspace->vm_map; 5273ebc1248SPeter Wemm map_addr = trunc_page_ps((vm_offset_t)vmaddr, pagesize); 5283ebc1248SPeter Wemm file_addr = trunc_page_ps(offset, pagesize); 529e1743d02SSøren Schmidt 530e1743d02SSøren Schmidt /* 53152c24af7SPeter Wemm * We have two choices. We can either clear the data in the last page 53252c24af7SPeter Wemm * of an oversized mapping, or we can start the anon mapping a page 53352c24af7SPeter Wemm * early and copy the initialized data into that first page. We 534*28e8da65SAlan Cox * choose the second. 53552c24af7SPeter Wemm */ 53652c24af7SPeter Wemm if (memsz > filsz) 5373ebc1248SPeter Wemm map_len = trunc_page_ps(offset + filsz, pagesize) - file_addr; 53852c24af7SPeter Wemm else 5393ebc1248SPeter Wemm map_len = round_page_ps(offset + filsz, pagesize) - file_addr; 54052c24af7SPeter Wemm 54152c24af7SPeter Wemm if (map_len != 0) { 542fa7dd9c5SMatthew Dillon /* cow flags: don't dump readonly sections in core */ 543fa7dd9c5SMatthew Dillon cow = MAP_COPY_ON_WRITE | MAP_PREFAULT | 544fa7dd9c5SMatthew Dillon (prot & VM_PROT_WRITE ? 
0 : MAP_DISABLE_COREDUMP); 545fa7dd9c5SMatthew Dillon 546e3d8f8feSKonstantin Belousov rv = __elfN(map_insert)(imgp, map, 54752c24af7SPeter Wemm object, 54852c24af7SPeter Wemm file_addr, /* file offset */ 54952c24af7SPeter Wemm map_addr, /* virtual start */ 55052c24af7SPeter Wemm map_addr + map_len,/* virtual end */ 55152c24af7SPeter Wemm prot, 552fa7dd9c5SMatthew Dillon cow); 553e5e6093bSAlan Cox if (rv != KERN_SUCCESS) 554a7cddfedSJake Burkholder return (EINVAL); 55552c24af7SPeter Wemm 55652c24af7SPeter Wemm /* we can stop now if we've covered it all */ 55723955314SAlfred Perlstein if (memsz == filsz) { 558a7cddfedSJake Burkholder return (0); 55952c24af7SPeter Wemm } 56023955314SAlfred Perlstein } 56152c24af7SPeter Wemm 56252c24af7SPeter Wemm 56352c24af7SPeter Wemm /* 56452c24af7SPeter Wemm * We have to get the remaining bit of the file into the first part 56552c24af7SPeter Wemm * of the oversized map segment. This is normally because the .data 56652c24af7SPeter Wemm * segment in the file is extended to provide bss. It's a neat idea 56752c24af7SPeter Wemm * to try and save a page, but it's a pain in the behind to implement. 568e1743d02SSøren Schmidt */ 5693ebc1248SPeter Wemm copy_len = (offset + filsz) - trunc_page_ps(offset + filsz, pagesize); 5703ebc1248SPeter Wemm map_addr = trunc_page_ps((vm_offset_t)vmaddr + filsz, pagesize); 571ca0387efSJake Burkholder map_len = round_page_ps((vm_offset_t)vmaddr + memsz, pagesize) - 572ca0387efSJake Burkholder map_addr; 573e1743d02SSøren Schmidt 57452c24af7SPeter Wemm /* This had damn well better be true! 
*/ 5758191d577SPeter Wemm if (map_len != 0) { 576e3d8f8feSKonstantin Belousov rv = __elfN(map_insert)(imgp, map, NULL, 0, map_addr, 577e3d8f8feSKonstantin Belousov map_addr + map_len, VM_PROT_ALL, 0); 57823955314SAlfred Perlstein if (rv != KERN_SUCCESS) { 579a7cddfedSJake Burkholder return (EINVAL); 5808191d577SPeter Wemm } 58123955314SAlfred Perlstein } 582e1743d02SSøren Schmidt 58352c24af7SPeter Wemm if (copy_len != 0) { 5843ebc1248SPeter Wemm vm_offset_t off; 585da61b9a6SAlan Cox 586da61b9a6SAlan Cox sf = vm_imgact_map_page(object, offset + filsz); 587da61b9a6SAlan Cox if (sf == NULL) 588da61b9a6SAlan Cox return (EIO); 589e1743d02SSøren Schmidt 59052c24af7SPeter Wemm /* send the page fragment to user space */ 59181f223caSJake Burkholder off = trunc_page_ps(offset + filsz, pagesize) - 59281f223caSJake Burkholder trunc_page(offset + filsz); 593da61b9a6SAlan Cox error = copyout((caddr_t)sf_buf_kva(sf) + off, 594da61b9a6SAlan Cox (caddr_t)map_addr, copy_len); 595be996836SAttilio Rao vm_imgact_unmap_page(sf); 59623955314SAlfred Perlstein if (error) { 59752c24af7SPeter Wemm return (error); 59852c24af7SPeter Wemm } 59923955314SAlfred Perlstein } 600e1743d02SSøren Schmidt 601e1743d02SSøren Schmidt /* 6023ebc1248SPeter Wemm * set it to the specified protection. 6033ebc1248SPeter Wemm * XXX had better undo the damage from pasting over the cracks here! 604e1743d02SSøren Schmidt */ 605292177e6SAlan Cox vm_map_protect(map, trunc_page(map_addr), round_page(map_addr + 606292177e6SAlan Cox map_len), prot, FALSE); 6078191d577SPeter Wemm 608ff6f03c7SAlan Cox return (0); 609e1743d02SSøren Schmidt } 610e1743d02SSøren Schmidt 611c33fe779SJohn Polstra /* 612c33fe779SJohn Polstra * Load the file "file" into memory. It may be either a shared object 613c33fe779SJohn Polstra * or an executable. 614c33fe779SJohn Polstra * 615c33fe779SJohn Polstra * The "addr" reference parameter is in/out. 
On entry, it specifies 616c33fe779SJohn Polstra * the address where a shared object should be loaded. If the file is 617c33fe779SJohn Polstra * an executable, this value is ignored. On exit, "addr" specifies 618c33fe779SJohn Polstra * where the file was actually loaded. 619c33fe779SJohn Polstra * 620c33fe779SJohn Polstra * The "entry" reference parameter is out only. On exit, it specifies 621c33fe779SJohn Polstra * the entry point for the loaded file. 622c33fe779SJohn Polstra */ 623e1743d02SSøren Schmidt static int 6243ebc1248SPeter Wemm __elfN(load_file)(struct proc *p, const char *file, u_long *addr, 6253ebc1248SPeter Wemm u_long *entry, size_t pagesize) 626e1743d02SSøren Schmidt { 627911c2be0SMark Peek struct { 628911c2be0SMark Peek struct nameidata nd; 629911c2be0SMark Peek struct vattr attr; 630911c2be0SMark Peek struct image_params image_params; 631911c2be0SMark Peek } *tempdata; 632d254af07SMatthew Dillon const Elf_Ehdr *hdr = NULL; 633d254af07SMatthew Dillon const Elf_Phdr *phdr = NULL; 634911c2be0SMark Peek struct nameidata *nd; 635911c2be0SMark Peek struct vattr *attr; 636911c2be0SMark Peek struct image_params *imgp; 63752c24af7SPeter Wemm vm_prot_t prot; 638c33fe779SJohn Polstra u_long rbase; 639c33fe779SJohn Polstra u_long base_addr = 0; 6405050aa86SKonstantin Belousov int error, i, numsegs; 641e1743d02SSøren Schmidt 64212bc222eSJonathan Anderson #ifdef CAPABILITY_MODE 64312bc222eSJonathan Anderson /* 64412bc222eSJonathan Anderson * XXXJA: This check can go away once we are sufficiently confident 64512bc222eSJonathan Anderson * that the checks in namei() are correct. 
64612bc222eSJonathan Anderson */ 64712bc222eSJonathan Anderson if (IN_CAPABILITY_MODE(curthread)) 64812bc222eSJonathan Anderson return (ECAPMODE); 64912bc222eSJonathan Anderson #endif 65012bc222eSJonathan Anderson 651a163d034SWarner Losh tempdata = malloc(sizeof(*tempdata), M_TEMP, M_WAITOK); 652911c2be0SMark Peek nd = &tempdata->nd; 653911c2be0SMark Peek attr = &tempdata->attr; 654911c2be0SMark Peek imgp = &tempdata->image_params; 655911c2be0SMark Peek 656c8a79999SPeter Wemm /* 657c8a79999SPeter Wemm * Initialize part of the common data 658c8a79999SPeter Wemm */ 659c8a79999SPeter Wemm imgp->proc = p; 660911c2be0SMark Peek imgp->attr = attr; 661c8a79999SPeter Wemm imgp->firstpage = NULL; 66259c8bc40SAlan Cox imgp->image_header = NULL; 6630b2ed1aeSJeff Roberson imgp->object = NULL; 6646d7bdc8dSRobert Watson imgp->execlabel = NULL; 665c8a79999SPeter Wemm 6665050aa86SKonstantin Belousov NDINIT(nd, LOOKUP, LOCKLEAF | FOLLOW, UIO_SYSSPACE, file, curthread); 667911c2be0SMark Peek if ((error = namei(nd)) != 0) { 668911c2be0SMark Peek nd->ni_vp = NULL; 669e1743d02SSøren Schmidt goto fail; 670e1743d02SSøren Schmidt } 671911c2be0SMark Peek NDFREE(nd, NDF_ONLY_PNBUF); 672911c2be0SMark Peek imgp->vp = nd->ni_vp; 673c8a79999SPeter Wemm 674e1743d02SSøren Schmidt /* 675e1743d02SSøren Schmidt * Check permissions, modes, uid, etc on the file, and "open" it. 676e1743d02SSøren Schmidt */ 677c8a79999SPeter Wemm error = exec_check_permissions(imgp); 678373d1a3fSAlan Cox if (error) 679c8a79999SPeter Wemm goto fail; 680e1743d02SSøren Schmidt 681c8a79999SPeter Wemm error = exec_map_first_page(imgp); 682373d1a3fSAlan Cox if (error) 683373d1a3fSAlan Cox goto fail; 684373d1a3fSAlan Cox 68525ead034SBrian Feldman /* 68625ead034SBrian Feldman * Also make certain that the interpreter stays the same, so set 687e6e370a7SJeff Roberson * its VV_TEXT flag, too. 
68825ead034SBrian Feldman */ 689877d24acSKonstantin Belousov VOP_SET_TEXT(nd->ni_vp); 690e6e370a7SJeff Roberson 6918516dd18SPoul-Henning Kamp imgp->object = nd->ni_vp->v_object; 692e1743d02SSøren Schmidt 693d254af07SMatthew Dillon hdr = (const Elf_Ehdr *)imgp->image_header; 6943ebc1248SPeter Wemm if ((error = __elfN(check_header)(hdr)) != 0) 695e1743d02SSøren Schmidt goto fail; 696c33fe779SJohn Polstra if (hdr->e_type == ET_DYN) 697c33fe779SJohn Polstra rbase = *addr; 698c33fe779SJohn Polstra else if (hdr->e_type == ET_EXEC) 699c33fe779SJohn Polstra rbase = 0; 700c33fe779SJohn Polstra else { 701c33fe779SJohn Polstra error = ENOEXEC; 702c33fe779SJohn Polstra goto fail; 703c33fe779SJohn Polstra } 704e1743d02SSøren Schmidt 705c8a79999SPeter Wemm /* Only support headers that fit within first page for now */ 70652c24af7SPeter Wemm if ((hdr->e_phoff > PAGE_SIZE) || 707d19d5bf4STijl Coosemans (u_int)hdr->e_phentsize * hdr->e_phnum > PAGE_SIZE - hdr->e_phoff) { 708c8a79999SPeter Wemm error = ENOEXEC; 709e1743d02SSøren Schmidt goto fail; 710c8a79999SPeter Wemm } 711c8a79999SPeter Wemm 712d254af07SMatthew Dillon phdr = (const Elf_Phdr *)(imgp->image_header + hdr->e_phoff); 71393d1c728SKonstantin Belousov if (!aligned(phdr, Elf_Addr)) { 71493d1c728SKonstantin Belousov error = ENOEXEC; 71593d1c728SKonstantin Belousov goto fail; 71693d1c728SKonstantin Belousov } 717e1743d02SSøren Schmidt 718c33fe779SJohn Polstra for (i = 0, numsegs = 0; i < hdr->e_phnum; i++) { 7195b33842aSKonstantin Belousov if (phdr[i].p_type == PT_LOAD && phdr[i].p_memsz != 0) { 7205b33842aSKonstantin Belousov /* Loadable segment */ 721ed167eaaSKonstantin Belousov prot = __elfN(trans_prot)(phdr[i].p_flags); 722292177e6SAlan Cox error = __elfN(load_section)(imgp, phdr[i].p_offset, 72381f223caSJake Burkholder (caddr_t)(uintptr_t)phdr[i].p_vaddr + rbase, 724292177e6SAlan Cox phdr[i].p_memsz, phdr[i].p_filesz, prot, pagesize); 725292177e6SAlan Cox if (error != 0) 726e1743d02SSøren Schmidt goto fail; 
727e1743d02SSøren Schmidt /* 728c33fe779SJohn Polstra * Establish the base address if this is the 729c33fe779SJohn Polstra * first segment. 730e1743d02SSøren Schmidt */ 731c33fe779SJohn Polstra if (numsegs == 0) 732ca0387efSJake Burkholder base_addr = trunc_page(phdr[i].p_vaddr + 733ca0387efSJake Burkholder rbase); 734c33fe779SJohn Polstra numsegs++; 735e1743d02SSøren Schmidt } 736e1743d02SSøren Schmidt } 737c33fe779SJohn Polstra *addr = base_addr; 738c33fe779SJohn Polstra *entry = (unsigned long)hdr->e_entry + rbase; 739e1743d02SSøren Schmidt 740e1743d02SSøren Schmidt fail: 741c8a79999SPeter Wemm if (imgp->firstpage) 742c8a79999SPeter Wemm exec_unmap_first_page(imgp); 7430b2ed1aeSJeff Roberson 744911c2be0SMark Peek if (nd->ni_vp) 745373d1a3fSAlan Cox vput(nd->ni_vp); 746911c2be0SMark Peek 747911c2be0SMark Peek free(tempdata, M_TEMP); 748e1743d02SSøren Schmidt 749a7cddfedSJake Burkholder return (error); 750e1743d02SSøren Schmidt } 751e1743d02SSøren Schmidt 752303b270bSEivind Eklund static int 7533ebc1248SPeter Wemm __CONCAT(exec_, __elfN(imgact))(struct image_params *imgp) 754e1743d02SSøren Schmidt { 7556c775eb6SKonstantin Belousov struct thread *td; 7566c775eb6SKonstantin Belousov const Elf_Ehdr *hdr; 75732c01de2SDmitry Chagin const Elf_Phdr *phdr; 758e5e6093bSAlan Cox Elf_Auxargs *elf_auxargs; 7595856e12eSJohn Dyson struct vmspace *vmspace; 7606c775eb6SKonstantin Belousov const char *err_str, *newinterp; 7616c775eb6SKonstantin Belousov char *interp, *interp_buf, *path; 762d1dbc694SJohn Polstra Elf_Brandinfo *brand_info; 7635fe3ed62SJake Burkholder struct sysentvec *sv; 7646c775eb6SKonstantin Belousov vm_prot_t prot; 7656c775eb6SKonstantin Belousov u_long text_size, data_size, total_size, text_addr, data_addr; 7666c775eb6SKonstantin Belousov u_long seg_size, seg_addr, addr, baddr, et_dyn_addr, entry, proghdr; 7676c775eb6SKonstantin Belousov int32_t osrel; 7686c775eb6SKonstantin Belousov int error, i, n, interp_name_len, have_interp; 7696c775eb6SKonstantin Belousov 
7706c775eb6SKonstantin Belousov hdr = (const Elf_Ehdr *)imgp->image_header; 771e1743d02SSøren Schmidt 772e1743d02SSøren Schmidt /* 773e1743d02SSøren Schmidt * Do we have a valid ELF header ? 774900b28f9SMaxim Sobolev * 775900b28f9SMaxim Sobolev * Only allow ET_EXEC & ET_DYN here, reject ET_DYN later 776900b28f9SMaxim Sobolev * if particular brand doesn't support it. 777e1743d02SSøren Schmidt */ 778900b28f9SMaxim Sobolev if (__elfN(check_header)(hdr) != 0 || 779900b28f9SMaxim Sobolev (hdr->e_type != ET_EXEC && hdr->e_type != ET_DYN)) 780a7cddfedSJake Burkholder return (-1); 781e1743d02SSøren Schmidt 782e1743d02SSøren Schmidt /* 783e1743d02SSøren Schmidt * From here on down, we return an errno, not -1, as we've 784e1743d02SSøren Schmidt * detected an ELF file. 785e1743d02SSøren Schmidt */ 786e1743d02SSøren Schmidt 787e1743d02SSøren Schmidt if ((hdr->e_phoff > PAGE_SIZE) || 788d19d5bf4STijl Coosemans (u_int)hdr->e_phentsize * hdr->e_phnum > PAGE_SIZE - hdr->e_phoff) { 789c8a79999SPeter Wemm /* Only support headers in first page for now */ 7906b16d664SEd Maste uprintf("Program headers not in the first page\n"); 791a7cddfedSJake Burkholder return (ENOEXEC); 792e1743d02SSøren Schmidt } 79352c24af7SPeter Wemm phdr = (const Elf_Phdr *)(imgp->image_header + hdr->e_phoff); 7946b16d664SEd Maste if (!aligned(phdr, Elf_Addr)) { 7956b16d664SEd Maste uprintf("Unaligned program headers\n"); 79693d1c728SKonstantin Belousov return (ENOEXEC); 7976b16d664SEd Maste } 7986c775eb6SKonstantin Belousov 7996c775eb6SKonstantin Belousov n = error = 0; 8007564c4adSKonstantin Belousov baddr = 0; 8016c775eb6SKonstantin Belousov osrel = 0; 8026c775eb6SKonstantin Belousov text_size = data_size = total_size = text_addr = data_addr = 0; 8036c775eb6SKonstantin Belousov entry = proghdr = 0; 8046c775eb6SKonstantin Belousov interp_name_len = 0; 8056c775eb6SKonstantin Belousov err_str = newinterp = NULL; 8066c775eb6SKonstantin Belousov interp = interp_buf = NULL; 8076c775eb6SKonstantin Belousov td = 
curthread; 8086c775eb6SKonstantin Belousov 8095fe3ed62SJake Burkholder for (i = 0; i < hdr->e_phnum; i++) { 810291c06a1SKonstantin Belousov switch (phdr[i].p_type) { 811291c06a1SKonstantin Belousov case PT_LOAD: 8127564c4adSKonstantin Belousov if (n == 0) 8137564c4adSKonstantin Belousov baddr = phdr[i].p_vaddr; 8147564c4adSKonstantin Belousov n++; 815291c06a1SKonstantin Belousov break; 816291c06a1SKonstantin Belousov case PT_INTERP: 817e5e6093bSAlan Cox /* Path to interpreter */ 8186c775eb6SKonstantin Belousov if (phdr[i].p_filesz > MAXPATHLEN) { 8196b16d664SEd Maste uprintf("Invalid PT_INTERP\n"); 8206c775eb6SKonstantin Belousov error = ENOEXEC; 8216c775eb6SKonstantin Belousov goto ret; 8226b16d664SEd Maste } 823d3ee0a15SJonathan T. Looney if (interp != NULL) { 824d3ee0a15SJonathan T. Looney uprintf("Multiple PT_INTERP headers\n"); 825d3ee0a15SJonathan T. Looney error = ENOEXEC; 826d3ee0a15SJonathan T. Looney goto ret; 827d3ee0a15SJonathan T. Looney } 828d1ae5c83SKonstantin Belousov interp_name_len = phdr[i].p_filesz; 8296c775eb6SKonstantin Belousov if (phdr[i].p_offset > PAGE_SIZE || 8306c775eb6SKonstantin Belousov interp_name_len > PAGE_SIZE - phdr[i].p_offset) { 8316c775eb6SKonstantin Belousov VOP_UNLOCK(imgp->vp, 0); 8326c775eb6SKonstantin Belousov interp_buf = malloc(interp_name_len + 1, M_TEMP, 8336c775eb6SKonstantin Belousov M_WAITOK); 8346c775eb6SKonstantin Belousov vn_lock(imgp->vp, LK_EXCLUSIVE | LK_RETRY); 8356c775eb6SKonstantin Belousov error = vn_rdwr(UIO_READ, imgp->vp, interp_buf, 8366c775eb6SKonstantin Belousov interp_name_len, phdr[i].p_offset, 8376c775eb6SKonstantin Belousov UIO_SYSSPACE, IO_NODELOCKED, td->td_ucred, 8386c775eb6SKonstantin Belousov NOCRED, NULL, td); 8396c775eb6SKonstantin Belousov if (error != 0) { 8406c775eb6SKonstantin Belousov uprintf("i/o error PT_INTERP\n"); 8416c775eb6SKonstantin Belousov goto ret; 8426c775eb6SKonstantin Belousov } 8436c775eb6SKonstantin Belousov interp_buf[interp_name_len] = '\0'; 8446c775eb6SKonstantin 
Belousov interp = interp_buf; 8456c775eb6SKonstantin Belousov } else { 8466c775eb6SKonstantin Belousov interp = __DECONST(char *, imgp->image_header) + 8476c775eb6SKonstantin Belousov phdr[i].p_offset; 8486c775eb6SKonstantin Belousov } 849291c06a1SKonstantin Belousov break; 850291c06a1SKonstantin Belousov case PT_GNU_STACK: 851291c06a1SKonstantin Belousov if (__elfN(nxstack)) 852291c06a1SKonstantin Belousov imgp->stack_prot = 853291c06a1SKonstantin Belousov __elfN(trans_prot)(phdr[i].p_flags); 854316b3843SKonstantin Belousov imgp->stack_sz = phdr[i].p_memsz; 855291c06a1SKonstantin Belousov break; 8563ebc1248SPeter Wemm } 8573ebc1248SPeter Wemm } 8583ebc1248SPeter Wemm 859d1ae5c83SKonstantin Belousov brand_info = __elfN(get_brandinfo)(imgp, interp, interp_name_len, 860d1ae5c83SKonstantin Belousov &osrel); 8615fe3ed62SJake Burkholder if (brand_info == NULL) { 8625fe3ed62SJake Burkholder uprintf("ELF binary type \"%u\" not known.\n", 8635fe3ed62SJake Burkholder hdr->e_ident[EI_OSABI]); 8646c775eb6SKonstantin Belousov error = ENOEXEC; 8656c775eb6SKonstantin Belousov goto ret; 8663ebc1248SPeter Wemm } 86777ebe276SEd Maste et_dyn_addr = 0; 868ab02d85fSKonstantin Belousov if (hdr->e_type == ET_DYN) { 8696b16d664SEd Maste if ((brand_info->flags & BI_CAN_EXEC_DYN) == 0) { 8706b16d664SEd Maste uprintf("Cannot execute shared object\n"); 8716c775eb6SKonstantin Belousov error = ENOEXEC; 8726c775eb6SKonstantin Belousov goto ret; 8736b16d664SEd Maste } 8747564c4adSKonstantin Belousov /* 8757564c4adSKonstantin Belousov * Honour the base load address from the dso if it is 8767564c4adSKonstantin Belousov * non-zero for some reason. 
8777564c4adSKonstantin Belousov */ 8787564c4adSKonstantin Belousov if (baddr == 0) 879ab02d85fSKonstantin Belousov et_dyn_addr = ET_DYN_LOAD_ADDR; 88077ebe276SEd Maste } 8815fe3ed62SJake Burkholder sv = brand_info->sysvec; 8829b68618dSPeter Wemm if (interp != NULL && brand_info->interp_newpath != NULL) 8834113f8d7SPeter Wemm newinterp = brand_info->interp_newpath; 8843ebc1248SPeter Wemm 88560bb3943SAlan Cox /* 88660bb3943SAlan Cox * Avoid a possible deadlock if the current address space is destroyed 88760bb3943SAlan Cox * and that address space maps the locked vnode. In the common case, 88860bb3943SAlan Cox * the locked vnode's v_usecount is decremented but remains greater 88960bb3943SAlan Cox * than zero. Consequently, the vnode lock is not needed by vrele(). 89060bb3943SAlan Cox * However, in cases where the vnode lock is external, such as nullfs, 89160bb3943SAlan Cox * v_usecount may become zero. 8921dfab802SAlan Cox * 8931dfab802SAlan Cox * The VV_TEXT flag prevents modifications to the executable while 8941dfab802SAlan Cox * the vnode is unlocked. 
89560bb3943SAlan Cox */ 89622db15c0SAttilio Rao VOP_UNLOCK(imgp->vp, 0); 89760bb3943SAlan Cox 89889b57fcfSKonstantin Belousov error = exec_new_vmspace(imgp, sv); 89919059a13SJohn Baldwin imgp->proc->p_sysent = sv; 900e1743d02SSøren Schmidt 901cb05b60aSAttilio Rao vn_lock(imgp->vp, LK_EXCLUSIVE | LK_RETRY); 9026c775eb6SKonstantin Belousov if (error != 0) 9036c775eb6SKonstantin Belousov goto ret; 90460bb3943SAlan Cox 905e1743d02SSøren Schmidt for (i = 0; i < hdr->e_phnum; i++) { 906e1743d02SSøren Schmidt switch (phdr[i].p_type) { 907e1743d02SSøren Schmidt case PT_LOAD: /* Loadable segment */ 9085b33842aSKonstantin Belousov if (phdr[i].p_memsz == 0) 9095b33842aSKonstantin Belousov break; 910ed167eaaSKonstantin Belousov prot = __elfN(trans_prot)(phdr[i].p_flags); 911292177e6SAlan Cox error = __elfN(load_section)(imgp, phdr[i].p_offset, 912ab02d85fSKonstantin Belousov (caddr_t)(uintptr_t)phdr[i].p_vaddr + et_dyn_addr, 91381f223caSJake Burkholder phdr[i].p_memsz, phdr[i].p_filesz, prot, 914292177e6SAlan Cox sv->sv_pagesize); 915292177e6SAlan Cox if (error != 0) 9166c775eb6SKonstantin Belousov goto ret; 917e1743d02SSøren Schmidt 918cfaf7e60SDoug Rabson /* 919cfaf7e60SDoug Rabson * If this segment contains the program headers, 920cfaf7e60SDoug Rabson * remember their virtual address for the AT_PHDR 921cfaf7e60SDoug Rabson * aux entry. Static binaries don't usually include 922cfaf7e60SDoug Rabson * a PT_PHDR entry. 
923cfaf7e60SDoug Rabson */ 924cfaf7e60SDoug Rabson if (phdr[i].p_offset == 0 && 925cfaf7e60SDoug Rabson hdr->e_phoff + hdr->e_phnum * hdr->e_phentsize 926cfaf7e60SDoug Rabson <= phdr[i].p_filesz) 927ab02d85fSKonstantin Belousov proghdr = phdr[i].p_vaddr + hdr->e_phoff + 928ab02d85fSKonstantin Belousov et_dyn_addr; 929cfaf7e60SDoug Rabson 930ab02d85fSKonstantin Belousov seg_addr = trunc_page(phdr[i].p_vaddr + et_dyn_addr); 931cac45152SMatthew Dillon seg_size = round_page(phdr[i].p_memsz + 932ab02d85fSKonstantin Belousov phdr[i].p_vaddr + et_dyn_addr - seg_addr); 933cac45152SMatthew Dillon 934e1743d02SSøren Schmidt /* 935920acedbSNathan Whitehorn * Make the largest executable segment the official 936920acedbSNathan Whitehorn * text segment and all others data. 93721c2d047SMatthew Dillon * 93821c2d047SMatthew Dillon * Note that obreak() assumes that data_addr + 93921c2d047SMatthew Dillon * data_size == end of data load area, and the ELF 94021c2d047SMatthew Dillon * file format expects segments to be sorted by 94121c2d047SMatthew Dillon * address. If multiple data segments exist, the 94221c2d047SMatthew Dillon * last one will be used. 
943e1743d02SSøren Schmidt */ 944920acedbSNathan Whitehorn 945920acedbSNathan Whitehorn if (phdr[i].p_flags & PF_X && text_size < seg_size) { 9469782ecbaSPeter Wemm text_size = seg_size; 9479782ecbaSPeter Wemm text_addr = seg_addr; 9489782ecbaSPeter Wemm } else { 94921c2d047SMatthew Dillon data_size = seg_size; 950cac45152SMatthew Dillon data_addr = seg_addr; 951cac45152SMatthew Dillon } 95221c2d047SMatthew Dillon total_size += seg_size; 95396725dd0SAlexander Kabaev break; 95496725dd0SAlexander Kabaev case PT_PHDR: /* Program header table info */ 955ab02d85fSKonstantin Belousov proghdr = phdr[i].p_vaddr + et_dyn_addr; 95696725dd0SAlexander Kabaev break; 95796725dd0SAlexander Kabaev default: 95896725dd0SAlexander Kabaev break; 95996725dd0SAlexander Kabaev } 96096725dd0SAlexander Kabaev } 96196725dd0SAlexander Kabaev 96296725dd0SAlexander Kabaev if (data_addr == 0 && data_size == 0) { 96396725dd0SAlexander Kabaev data_addr = text_addr; 96496725dd0SAlexander Kabaev data_size = text_size; 96596725dd0SAlexander Kabaev } 966cac45152SMatthew Dillon 967920acedbSNathan Whitehorn entry = (u_long)hdr->e_entry + et_dyn_addr; 968920acedbSNathan Whitehorn 969cac45152SMatthew Dillon /* 970cac45152SMatthew Dillon * Check limits. It should be safe to check the 97196725dd0SAlexander Kabaev * limits after loading the segments since we do 97296725dd0SAlexander Kabaev * not actually fault in all the segments pages. 
973cac45152SMatthew Dillon */ 97491d5354aSJohn Baldwin PROC_LOCK(imgp->proc); 975f6f6d240SMateusz Guzik if (data_size > lim_cur_proc(imgp->proc, RLIMIT_DATA)) 9766b16d664SEd Maste err_str = "Data segment size exceeds process limit"; 9776b16d664SEd Maste else if (text_size > maxtsiz) 9786b16d664SEd Maste err_str = "Text segment size exceeds system limit"; 979f6f6d240SMateusz Guzik else if (total_size > lim_cur_proc(imgp->proc, RLIMIT_VMEM)) 9806b16d664SEd Maste err_str = "Total segment size exceeds process limit"; 9816b16d664SEd Maste else if (racct_set(imgp->proc, RACCT_DATA, data_size) != 0) 9826b16d664SEd Maste err_str = "Data segment size exceeds resource limit"; 9836b16d664SEd Maste else if (racct_set(imgp->proc, RACCT_VMEM, total_size) != 0) 9846b16d664SEd Maste err_str = "Total segment size exceeds resource limit"; 9856b16d664SEd Maste if (err_str != NULL) { 98691d5354aSJohn Baldwin PROC_UNLOCK(imgp->proc); 9876b16d664SEd Maste uprintf("%s\n", err_str); 9886c775eb6SKonstantin Belousov error = ENOMEM; 9896c775eb6SKonstantin Belousov goto ret; 990cac45152SMatthew Dillon } 991e1743d02SSøren Schmidt 992292177e6SAlan Cox vmspace = imgp->proc->p_vmspace; 993e1743d02SSøren Schmidt vmspace->vm_tsize = text_size >> PAGE_SHIFT; 9947cd99438SBruce Evans vmspace->vm_taddr = (caddr_t)(uintptr_t)text_addr; 995e1743d02SSøren Schmidt vmspace->vm_dsize = data_size >> PAGE_SHIFT; 9967cd99438SBruce Evans vmspace->vm_daddr = (caddr_t)(uintptr_t)data_addr; 997e1743d02SSøren Schmidt 998c460ac3aSPeter Wemm /* 999c460ac3aSPeter Wemm * We load the dynamic linker where a userland call 1000c460ac3aSPeter Wemm * to mmap(0, ...) would put it. The rationale behind this 1001c460ac3aSPeter Wemm * calculation is that it leaves room for the heap to grow to 1002c460ac3aSPeter Wemm * its maximum allowed size. 
1003c460ac3aSPeter Wemm */ 10046c775eb6SKonstantin Belousov addr = round_page((vm_offset_t)vmspace->vm_daddr + lim_max(td, 1005292177e6SAlan Cox RLIMIT_DATA)); 100691d5354aSJohn Baldwin PROC_UNLOCK(imgp->proc); 1007e1743d02SSøren Schmidt 1008ea5a2b2eSSøren Schmidt imgp->entry_addr = entry; 1009ea5a2b2eSSøren Schmidt 101060bb3943SAlan Cox if (interp != NULL) { 10116c775eb6SKonstantin Belousov have_interp = FALSE; 101222db15c0SAttilio Rao VOP_UNLOCK(imgp->vp, 0); 101360bb3943SAlan Cox if (brand_info->emul_path != NULL && 10149b68618dSPeter Wemm brand_info->emul_path[0] != '\0') { 1015a163d034SWarner Losh path = malloc(MAXPATHLEN, M_TEMP, M_WAITOK); 101660bb3943SAlan Cox snprintf(path, MAXPATHLEN, "%s%s", 101760bb3943SAlan Cox brand_info->emul_path, interp); 10189b68618dSPeter Wemm error = __elfN(load_file)(imgp->proc, path, &addr, 10199b68618dSPeter Wemm &imgp->entry_addr, sv->sv_pagesize); 1020911c2be0SMark Peek free(path, M_TEMP); 10219b68618dSPeter Wemm if (error == 0) 10224113f8d7SPeter Wemm have_interp = TRUE; 10239b68618dSPeter Wemm } 102418995077SKonstantin Belousov if (!have_interp && newinterp != NULL && 102518995077SKonstantin Belousov (brand_info->interp_path == NULL || 102618995077SKonstantin Belousov strcmp(interp, brand_info->interp_path) == 0)) { 10274113f8d7SPeter Wemm error = __elfN(load_file)(imgp->proc, newinterp, &addr, 10284113f8d7SPeter Wemm &imgp->entry_addr, sv->sv_pagesize); 1029387ad998SKonstantin Belousov if (error == 0) 10304113f8d7SPeter Wemm have_interp = TRUE; 10314113f8d7SPeter Wemm } 10324113f8d7SPeter Wemm if (!have_interp) { 10339b68618dSPeter Wemm error = __elfN(load_file)(imgp->proc, interp, &addr, 10349b68618dSPeter Wemm &imgp->entry_addr, sv->sv_pagesize); 103560bb3943SAlan Cox } 1036cb05b60aSAttilio Rao vn_lock(imgp->vp, LK_EXCLUSIVE | LK_RETRY); 10379b68618dSPeter Wemm if (error != 0) { 1038d943fa35SKonstantin Belousov uprintf("ELF interpreter %s not found, error %d\n", 1039d943fa35SKonstantin Belousov interp, error); 
10406c775eb6SKonstantin Belousov goto ret; 1041e1743d02SSøren Schmidt } 104295c807cfSRobert Watson } else 10437564c4adSKonstantin Belousov addr = et_dyn_addr; 1044ea5a2b2eSSøren Schmidt 1045e1743d02SSøren Schmidt /* 1046e1743d02SSøren Schmidt * Construct auxargs table (used by the fixup routine) 1047e1743d02SSøren Schmidt */ 1048a163d034SWarner Losh elf_auxargs = malloc(sizeof(Elf_Auxargs), M_TEMP, M_WAITOK); 1049e1743d02SSøren Schmidt elf_auxargs->execfd = -1; 1050e1743d02SSøren Schmidt elf_auxargs->phdr = proghdr; 1051e1743d02SSøren Schmidt elf_auxargs->phent = hdr->e_phentsize; 1052e1743d02SSøren Schmidt elf_auxargs->phnum = hdr->e_phnum; 1053e1743d02SSøren Schmidt elf_auxargs->pagesz = PAGE_SIZE; 1054e1743d02SSøren Schmidt elf_auxargs->base = addr; 1055e1743d02SSøren Schmidt elf_auxargs->flags = 0; 1056e1743d02SSøren Schmidt elf_auxargs->entry = entry; 1057d36eec69SWarner Losh elf_auxargs->hdr_eflags = hdr->e_flags; 1058e1743d02SSøren Schmidt 1059e1743d02SSøren Schmidt imgp->auxargs = elf_auxargs; 1060e1743d02SSøren Schmidt imgp->interpreted = 0; 1061a0ea661fSNathan Whitehorn imgp->reloc_base = addr; 106232c01de2SDmitry Chagin imgp->proc->p_osrel = osrel; 1063885f13dcSJohn Baldwin imgp->proc->p_elf_machine = hdr->e_machine; 1064885f13dcSJohn Baldwin imgp->proc->p_elf_flags = hdr->e_flags; 1065f231de47SKonstantin Belousov 10666c775eb6SKonstantin Belousov ret: 10676c775eb6SKonstantin Belousov free(interp_buf, M_TEMP); 1068a7cddfedSJake Burkholder return (error); 1069e1743d02SSøren Schmidt } 1070e1743d02SSøren Schmidt 1071a360a43dSJake Burkholder #define suword __CONCAT(suword, __ELF_WORD_SIZE) 10723ebc1248SPeter Wemm 10733ebc1248SPeter Wemm int 10743ebc1248SPeter Wemm __elfN(freebsd_fixup)(register_t **stack_base, struct image_params *imgp) 1075e1743d02SSøren Schmidt { 1076ecbb00a2SDoug Rabson Elf_Auxargs *args = (Elf_Auxargs *)imgp->auxargs; 1077a360a43dSJake Burkholder Elf_Addr *base; 1078a360a43dSJake Burkholder Elf_Addr *pos; 1079e1743d02SSøren Schmidt 
1080a360a43dSJake Burkholder base = (Elf_Addr *)*stack_base; 1081610ecfe0SMaxim Sobolev pos = base + (imgp->args->argc + imgp->args->envc + 2); 1082e1743d02SSøren Schmidt 108335c2a5a8SWarner Losh if (args->execfd != -1) 1084e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_EXECFD, args->execfd); 1085e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PHDR, args->phdr); 1086e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PHENT, args->phent); 1087e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PHNUM, args->phnum); 1088e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_PAGESZ, args->pagesz); 1089e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_FLAGS, args->flags); 1090e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_ENTRY, args->entry); 1091e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_BASE, args->base); 1092ee960398SWarner Losh #ifdef AT_EHDRFLAGS 1093d36eec69SWarner Losh AUXARGS_ENTRY(pos, AT_EHDRFLAGS, args->hdr_eflags); 1094d36eec69SWarner Losh #endif 10953ff06357SKonstantin Belousov if (imgp->execpathp != 0) 10963ff06357SKonstantin Belousov AUXARGS_ENTRY(pos, AT_EXECPATH, imgp->execpathp); 1097b96bd95bSIan Lepore AUXARGS_ENTRY(pos, AT_OSRELDATE, 1098b96bd95bSIan Lepore imgp->proc->p_ucred->cr_prison->pr_osreldate); 1099ee235befSKonstantin Belousov if (imgp->canary != 0) { 1100ee235befSKonstantin Belousov AUXARGS_ENTRY(pos, AT_CANARY, imgp->canary); 1101ee235befSKonstantin Belousov AUXARGS_ENTRY(pos, AT_CANARYLEN, imgp->canarylen); 1102ee235befSKonstantin Belousov } 1103ee235befSKonstantin Belousov AUXARGS_ENTRY(pos, AT_NCPUS, mp_ncpus); 1104ee235befSKonstantin Belousov if (imgp->pagesizes != 0) { 1105ee235befSKonstantin Belousov AUXARGS_ENTRY(pos, AT_PAGESIZES, imgp->pagesizes); 1106ee235befSKonstantin Belousov AUXARGS_ENTRY(pos, AT_PAGESIZESLEN, imgp->pagesizeslen); 1107ee235befSKonstantin Belousov } 1108aea81038SKonstantin Belousov if (imgp->sysent->sv_timekeep_base != 0) { 1109aea81038SKonstantin Belousov AUXARGS_ENTRY(pos, AT_TIMEKEEP, 1110aea81038SKonstantin Belousov 
imgp->sysent->sv_timekeep_base); 1111aea81038SKonstantin Belousov } 111226d8f3e1SKonstantin Belousov AUXARGS_ENTRY(pos, AT_STACKPROT, imgp->sysent->sv_shared_page_obj 111326d8f3e1SKonstantin Belousov != NULL && imgp->stack_prot != 0 ? imgp->stack_prot : 111426d8f3e1SKonstantin Belousov imgp->sysent->sv_stackprot); 1115e1743d02SSøren Schmidt AUXARGS_ENTRY(pos, AT_NULL, 0); 1116e1743d02SSøren Schmidt 1117e1743d02SSøren Schmidt free(imgp->auxargs, M_TEMP); 1118e1743d02SSøren Schmidt imgp->auxargs = NULL; 1119e1743d02SSøren Schmidt 11203ebc1248SPeter Wemm base--; 1121610ecfe0SMaxim Sobolev suword(base, (long)imgp->args->argc); 11223ebc1248SPeter Wemm *stack_base = (register_t *)base; 1123a7cddfedSJake Burkholder return (0); 1124e1743d02SSøren Schmidt } 1125e1743d02SSøren Schmidt 1126e1743d02SSøren Schmidt /* 11278c64af4fSJohn Polstra * Code for generating ELF core dumps. 11288c64af4fSJohn Polstra */ 11298c64af4fSJohn Polstra 11304d77a549SAlfred Perlstein typedef void (*segment_callback)(vm_map_entry_t, void *); 11310ff27d31SJohn Polstra 11320ff27d31SJohn Polstra /* Closure for cb_put_phdr(). */ 11330ff27d31SJohn Polstra struct phdr_closure { 11340ff27d31SJohn Polstra Elf_Phdr *phdr; /* Program header to fill in */ 11350ff27d31SJohn Polstra Elf_Off offset; /* Offset of segment in core file */ 11360ff27d31SJohn Polstra }; 11370ff27d31SJohn Polstra 11380ff27d31SJohn Polstra /* Closure for cb_size_segment(). */ 11390ff27d31SJohn Polstra struct sseg_closure { 11400ff27d31SJohn Polstra int count; /* Count of writable segments. */ 11410ff27d31SJohn Polstra size_t size; /* Total size of all writable segments. */ 11420ff27d31SJohn Polstra }; 11430ff27d31SJohn Polstra 1144bd390213SMikolaj Golub typedef void (*outfunc_t)(void *, struct sbuf *, size_t *); 1145bd390213SMikolaj Golub 1146bd390213SMikolaj Golub struct note_info { 1147bd390213SMikolaj Golub int type; /* Note type. */ 1148bd390213SMikolaj Golub outfunc_t outfunc; /* Output function. 
/*
 * Code for generating ELF core dumps.
 */

/* Callback type taking a map entry and an opaque closure pointer. */
typedef void (*segment_callback)(vm_map_entry_t, void *);

/* Closure for cb_put_phdr(). */
struct phdr_closure {
	Elf_Phdr *phdr;		/* Program header to fill in */
	Elf_Off offset;		/* Offset of segment in core file */
};

/* Closure for cb_size_segment(). */
struct sseg_closure {
	int count;		/* Count of writable segments. */
	size_t size;		/* Total size of all writable segments. */
};

/* Note output routine: (argument, destination sbuf, size in/out). */
typedef void (*outfunc_t)(void *, struct sbuf *, size_t *);

/* One note queued for the core file; kept on a note_info_list. */
struct note_info {
	int		type;		/* Note type. */
	outfunc_t	outfunc;	/* Output function. */
	void		*outarg;	/* Argument for the output function. */
	size_t		outsize;	/* Output size. */
	TAILQ_ENTRY(note_info) link;	/* Link to the next note info. */
};

TAILQ_HEAD(note_info_list, note_info);

/* Coredump output parameters. */
struct coredump_params {
	off_t		offset;		/* File offset for the next sbuf drain;
					   advanced by each drained chunk. */
	struct ucred	*active_cred;	/* Active credential passed to the
					   vnode write. */
	struct ucred	*file_cred;	/* File credential passed to the
					   vnode write. */
	struct thread	*td;		/* Thread performing the dump. */
	struct vnode	*vp;		/* Vnode the core is written to. */
	struct gzio_stream *gzs;	/* Compression stream; when non-NULL,
					   output goes through gzio_write(). */
};

static void cb_put_phdr(vm_map_entry_t, void *);
static void cb_size_segment(vm_map_entry_t, void *);
static int core_write(struct coredump_params *, const void *, size_t, off_t,
    enum uio_seg);
static void each_dumpable_segment(struct thread *, segment_callback, void *);
static int __elfN(corehdr)(struct coredump_params *, int, void *, size_t,
    struct note_info_list *, size_t);
static void __elfN(prepare_notes)(struct thread *, struct note_info_list *,
    size_t *);
static void __elfN(puthdr)(struct thread *, void *, size_t, int, size_t);
static void __elfN(putnote)(struct note_info *, struct sbuf *);
static size_t register_note(struct note_info_list *, int, outfunc_t, void *);
static int sbuf_drain_core_output(void *, const char *, int);
static int sbuf_drain_count(void *arg, const char *data, int len);

/* Note output routines; all share the outfunc_t signature. */
static void __elfN(note_fpregset)(void *, struct sbuf *, size_t *);
static void __elfN(note_prpsinfo)(void *, struct sbuf *, size_t *);
static void __elfN(note_prstatus)(void *, struct sbuf *, size_t *);
static void __elfN(note_threadmd)(void *, struct sbuf *, size_t *);
static void __elfN(note_thrmisc)(void *, struct sbuf *, size_t *);
static void __elfN(note_procstat_auxv)(void *, struct sbuf *, size_t *);
static void __elfN(note_procstat_proc)(void *, struct sbuf *, size_t *);
static void __elfN(note_procstat_psstrings)(void *, struct sbuf *, size_t *);
static void note_procstat_files(void *, struct sbuf *, size_t *);
static void note_procstat_groups(void *, struct sbuf *, size_t *);
static void note_procstat_osrel(void *, struct sbuf *, size_t *);
static void note_procstat_rlimit(void *, struct sbuf *, size_t *);
static void note_procstat_umask(void *, struct sbuf *, size_t *);
static void note_procstat_vmmap(void *, struct sbuf *, size_t *);

1201aa14e9b7SMark Johnston */ 1202e7228204SAlfred Perlstein static int 1203aa14e9b7SMark Johnston compress_chunk(struct coredump_params *p, char *base, char *buf, u_int len) 1204aa14e9b7SMark Johnston { 1205aa14e9b7SMark Johnston u_int chunk_len; 1206e7228204SAlfred Perlstein int error; 1207aa14e9b7SMark Johnston 1208aa14e9b7SMark Johnston while (len > 0) { 1209aa14e9b7SMark Johnston chunk_len = MIN(len, CORE_BUF_SIZE); 1210c468ff88SAndriy Gapon 1211c468ff88SAndriy Gapon /* 1212c468ff88SAndriy Gapon * We can get EFAULT error here. 1213c468ff88SAndriy Gapon * In that case zero out the current chunk of the segment. 1214c468ff88SAndriy Gapon */ 1215c468ff88SAndriy Gapon error = copyin(base, buf, chunk_len); 1216c468ff88SAndriy Gapon if (error != 0) 1217c468ff88SAndriy Gapon bzero(buf, chunk_len); 1218aa14e9b7SMark Johnston error = gzio_write(p->gzs, buf, chunk_len); 1219aa14e9b7SMark Johnston if (error != 0) 1220aa14e9b7SMark Johnston break; 1221aa14e9b7SMark Johnston base += chunk_len; 1222aa14e9b7SMark Johnston len -= chunk_len; 1223e7228204SAlfred Perlstein } 1224e7228204SAlfred Perlstein return (error); 1225e7228204SAlfred Perlstein } 1226e7228204SAlfred Perlstein 1227aa14e9b7SMark Johnston static int 1228aa14e9b7SMark Johnston core_gz_write(void *base, size_t len, off_t offset, void *arg) 1229aa14e9b7SMark Johnston { 1230aa14e9b7SMark Johnston 1231aa14e9b7SMark Johnston return (core_write((struct coredump_params *)arg, base, len, offset, 1232aa14e9b7SMark Johnston UIO_SYSSPACE)); 1233aa14e9b7SMark Johnston } 1234aa14e9b7SMark Johnston #endif /* GZIO */ 1235aa14e9b7SMark Johnston 1236aa14e9b7SMark Johnston static int 1237c468ff88SAndriy Gapon core_write(struct coredump_params *p, const void *base, size_t len, 1238c468ff88SAndriy Gapon off_t offset, enum uio_seg seg) 1239aa14e9b7SMark Johnston { 1240aa14e9b7SMark Johnston 1241c468ff88SAndriy Gapon return (vn_rdwr_inchunks(UIO_WRITE, p->vp, __DECONST(void *, base), 1242c468ff88SAndriy Gapon len, offset, seg, IO_UNIT 
| IO_DIRECT | IO_RANGELOCKED, 1243aa14e9b7SMark Johnston p->active_cred, p->file_cred, NULL, p->td)); 1244aa14e9b7SMark Johnston } 1245aa14e9b7SMark Johnston 1246aa14e9b7SMark Johnston static int 1247aa14e9b7SMark Johnston core_output(void *base, size_t len, off_t offset, struct coredump_params *p, 1248aa14e9b7SMark Johnston void *tmpbuf) 1249aa14e9b7SMark Johnston { 1250c468ff88SAndriy Gapon int error; 1251aa14e9b7SMark Johnston 1252aa14e9b7SMark Johnston #ifdef GZIO 1253aa14e9b7SMark Johnston if (p->gzs != NULL) 1254aa14e9b7SMark Johnston return (compress_chunk(p, base, tmpbuf, len)); 1255bd390213SMikolaj Golub #endif 1256c468ff88SAndriy Gapon /* 1257c468ff88SAndriy Gapon * EFAULT is a non-fatal error that we can get, for example, 1258c468ff88SAndriy Gapon * if the segment is backed by a file but extends beyond its 1259c468ff88SAndriy Gapon * end. 1260c468ff88SAndriy Gapon */ 1261c468ff88SAndriy Gapon error = core_write(p, base, len, offset, UIO_USERSPACE); 1262c468ff88SAndriy Gapon if (error == EFAULT) { 1263c468ff88SAndriy Gapon log(LOG_WARNING, "Failed to fully fault in a core file segment " 1264c468ff88SAndriy Gapon "at VA %p with size 0x%zx to be written at offset 0x%jx " 1265c468ff88SAndriy Gapon "for process %s\n", base, len, offset, curproc->p_comm); 1266c468ff88SAndriy Gapon 1267c468ff88SAndriy Gapon /* 1268c468ff88SAndriy Gapon * Write a "real" zero byte at the end of the target region 1269c468ff88SAndriy Gapon * in the case this is the last segment. 1270c468ff88SAndriy Gapon * The intermediate space will be implicitly zero-filled. 1271c468ff88SAndriy Gapon */ 1272c468ff88SAndriy Gapon error = core_write(p, zero_region, 1, offset + len - 1, 1273c468ff88SAndriy Gapon UIO_SYSSPACE); 1274c468ff88SAndriy Gapon } 1275c468ff88SAndriy Gapon return (error); 1276aa14e9b7SMark Johnston } 1277bd390213SMikolaj Golub 1278bd390213SMikolaj Golub /* 1279bd390213SMikolaj Golub * Drain into a core file. 
1280bd390213SMikolaj Golub */ 1281bd390213SMikolaj Golub static int 1282bd390213SMikolaj Golub sbuf_drain_core_output(void *arg, const char *data, int len) 1283bd390213SMikolaj Golub { 1284aa14e9b7SMark Johnston struct coredump_params *p; 1285f1fca82eSMikolaj Golub int error, locked; 1286bd390213SMikolaj Golub 1287aa14e9b7SMark Johnston p = (struct coredump_params *)arg; 1288f1fca82eSMikolaj Golub 1289f1fca82eSMikolaj Golub /* 1290f1fca82eSMikolaj Golub * Some kern_proc out routines that print to this sbuf may 1291f1fca82eSMikolaj Golub * call us with the process lock held. Draining with the 1292f1fca82eSMikolaj Golub * non-sleepable lock held is unsafe. The lock is needed for 1293f1fca82eSMikolaj Golub * those routines when dumping a live process. In our case we 1294f1fca82eSMikolaj Golub * can safely release the lock before draining and acquire 1295f1fca82eSMikolaj Golub * again after. 1296f1fca82eSMikolaj Golub */ 1297f1fca82eSMikolaj Golub locked = PROC_LOCKED(p->td->td_proc); 1298f1fca82eSMikolaj Golub if (locked) 1299f1fca82eSMikolaj Golub PROC_UNLOCK(p->td->td_proc); 1300aa14e9b7SMark Johnston #ifdef GZIO 1301aa14e9b7SMark Johnston if (p->gzs != NULL) 1302aa14e9b7SMark Johnston error = gzio_write(p->gzs, __DECONST(char *, data), len); 1303bd390213SMikolaj Golub else 1304bd390213SMikolaj Golub #endif 1305aa14e9b7SMark Johnston error = core_write(p, __DECONST(void *, data), len, p->offset, 1306aa14e9b7SMark Johnston UIO_SYSSPACE); 1307f1fca82eSMikolaj Golub if (locked) 1308f1fca82eSMikolaj Golub PROC_LOCK(p->td->td_proc); 1309bd390213SMikolaj Golub if (error != 0) 1310bd390213SMikolaj Golub return (-error); 1311bd390213SMikolaj Golub p->offset += len; 1312bd390213SMikolaj Golub return (len); 1313bd390213SMikolaj Golub } 1314bd390213SMikolaj Golub 1315f1fca82eSMikolaj Golub /* 1316f1fca82eSMikolaj Golub * Drain into a counter. 
1317f1fca82eSMikolaj Golub */ 1318f1fca82eSMikolaj Golub static int 1319f1fca82eSMikolaj Golub sbuf_drain_count(void *arg, const char *data __unused, int len) 1320f1fca82eSMikolaj Golub { 1321f1fca82eSMikolaj Golub size_t *sizep; 1322f1fca82eSMikolaj Golub 1323f1fca82eSMikolaj Golub sizep = (size_t *)arg; 1324f1fca82eSMikolaj Golub *sizep += len; 1325f1fca82eSMikolaj Golub return (len); 1326f1fca82eSMikolaj Golub } 1327f1fca82eSMikolaj Golub 13288c64af4fSJohn Polstra int 1329e7228204SAlfred Perlstein __elfN(coredump)(struct thread *td, struct vnode *vp, off_t limit, int flags) 1330fca666a1SJulian Elischer { 1331247aba24SMarcel Moolenaar struct ucred *cred = td->td_ucred; 1332fca666a1SJulian Elischer int error = 0; 13330ff27d31SJohn Polstra struct sseg_closure seginfo; 1334bd390213SMikolaj Golub struct note_info_list notelst; 1335aa14e9b7SMark Johnston struct coredump_params params; 1336bd390213SMikolaj Golub struct note_info *ninfo; 1337aa14e9b7SMark Johnston void *hdr, *tmpbuf; 1338bd390213SMikolaj Golub size_t hdrsize, notesz, coresize; 13399a12e282SEnji Cooper #ifdef GZIO 1340aa14e9b7SMark Johnston boolean_t compress; 13418c64af4fSJohn Polstra 1342aa14e9b7SMark Johnston compress = (flags & IMGACT_CORE_COMPRESS) != 0; 13439a12e282SEnji Cooper #endif 1344e7228204SAlfred Perlstein hdr = NULL; 134502d131adSMark Johnston tmpbuf = NULL; 1346bd390213SMikolaj Golub TAILQ_INIT(¬elst); 1347e7228204SAlfred Perlstein 13480ff27d31SJohn Polstra /* Size the program segments. */ 13490ff27d31SJohn Polstra seginfo.count = 0; 13500ff27d31SJohn Polstra seginfo.size = 0; 13511005d8afSConrad Meyer each_dumpable_segment(td, cb_size_segment, &seginfo); 13520ff27d31SJohn Polstra 13530ff27d31SJohn Polstra /* 1354bd390213SMikolaj Golub * Collect info about the core file header area. 
13550ff27d31SJohn Polstra */ 1356bd390213SMikolaj Golub hdrsize = sizeof(Elf_Ehdr) + sizeof(Elf_Phdr) * (1 + seginfo.count); 1357c17b0bd2SConrad Meyer if (seginfo.count + 1 >= PN_XNUM) 1358c17b0bd2SConrad Meyer hdrsize += sizeof(Elf_Shdr); 1359bd390213SMikolaj Golub __elfN(prepare_notes)(td, ¬elst, ¬esz); 1360bd390213SMikolaj Golub coresize = round_page(hdrsize + notesz) + seginfo.size; 13610ff27d31SJohn Polstra 136202d131adSMark Johnston /* Set up core dump parameters. */ 136302d131adSMark Johnston params.offset = 0; 136402d131adSMark Johnston params.active_cred = cred; 136502d131adSMark Johnston params.file_cred = NOCRED; 136602d131adSMark Johnston params.td = td; 136702d131adSMark Johnston params.vp = vp; 136802d131adSMark Johnston params.gzs = NULL; 136902d131adSMark Johnston 1370afcc55f3SEdward Tomasz Napierala #ifdef RACCT 13714b5c9cf6SEdward Tomasz Napierala if (racct_enable) { 13721ba5ad42SEdward Tomasz Napierala PROC_LOCK(td->td_proc); 1373bd390213SMikolaj Golub error = racct_add(td->td_proc, RACCT_CORE, coresize); 13741ba5ad42SEdward Tomasz Napierala PROC_UNLOCK(td->td_proc); 13751ba5ad42SEdward Tomasz Napierala if (error != 0) { 13761ba5ad42SEdward Tomasz Napierala error = EFAULT; 13771ba5ad42SEdward Tomasz Napierala goto done; 13781ba5ad42SEdward Tomasz Napierala } 13794b5c9cf6SEdward Tomasz Napierala } 1380afcc55f3SEdward Tomasz Napierala #endif 1381bd390213SMikolaj Golub if (coresize >= limit) { 1382fba6b1afSAlfred Perlstein error = EFAULT; 1383fba6b1afSAlfred Perlstein goto done; 1384fba6b1afSAlfred Perlstein } 13850ff27d31SJohn Polstra 1386aa14e9b7SMark Johnston #ifdef GZIO 1387aa14e9b7SMark Johnston /* Create a compression stream if necessary. 
*/ 1388aa14e9b7SMark Johnston if (compress) { 1389aa14e9b7SMark Johnston params.gzs = gzio_init(core_gz_write, GZIO_DEFLATE, 1390aa14e9b7SMark Johnston CORE_BUF_SIZE, compress_user_cores_gzlevel, ¶ms); 1391aa14e9b7SMark Johnston if (params.gzs == NULL) { 1392aa14e9b7SMark Johnston error = EFAULT; 1393aa14e9b7SMark Johnston goto done; 1394aa14e9b7SMark Johnston } 1395aa14e9b7SMark Johnston tmpbuf = malloc(CORE_BUF_SIZE, M_TEMP, M_WAITOK | M_ZERO); 1396aa14e9b7SMark Johnston } 1397aa14e9b7SMark Johnston #endif 1398aa14e9b7SMark Johnston 13990ff27d31SJohn Polstra /* 14000ff27d31SJohn Polstra * Allocate memory for building the header, fill it up, 1401bd390213SMikolaj Golub * and write it out following the notes. 14020ff27d31SJohn Polstra */ 1403a163d034SWarner Losh hdr = malloc(hdrsize, M_TEMP, M_WAITOK); 1404aa14e9b7SMark Johnston error = __elfN(corehdr)(¶ms, seginfo.count, hdr, hdrsize, ¬elst, 1405aa14e9b7SMark Johnston notesz); 14060ff27d31SJohn Polstra 14070ff27d31SJohn Polstra /* Write the contents of all of the writable segments. */ 14080ff27d31SJohn Polstra if (error == 0) { 14090ff27d31SJohn Polstra Elf_Phdr *php; 14102b471bc6STim J. Robbins off_t offset; 14110ff27d31SJohn Polstra int i; 14120ff27d31SJohn Polstra 14130ff27d31SJohn Polstra php = (Elf_Phdr *)((char *)hdr + sizeof(Elf_Ehdr)) + 1; 1414bd390213SMikolaj Golub offset = round_page(hdrsize + notesz); 14150ff27d31SJohn Polstra for (i = 0; i < seginfo.count; i++) { 1416aa14e9b7SMark Johnston error = core_output((caddr_t)(uintptr_t)php->p_vaddr, 1417aa14e9b7SMark Johnston php->p_filesz, offset, ¶ms, tmpbuf); 14180ff27d31SJohn Polstra if (error != 0) 14192b471bc6STim J. 
Robbins break; 14200ff27d31SJohn Polstra offset += php->p_filesz; 14210ff27d31SJohn Polstra php++; 14220ff27d31SJohn Polstra } 1423aa14e9b7SMark Johnston #ifdef GZIO 1424aa14e9b7SMark Johnston if (error == 0 && compress) 1425aa14e9b7SMark Johnston error = gzio_flush(params.gzs); 1426aa14e9b7SMark Johnston #endif 14270ff27d31SJohn Polstra } 1428e7228204SAlfred Perlstein if (error) { 1429e7228204SAlfred Perlstein log(LOG_WARNING, 1430e7228204SAlfred Perlstein "Failed to write core file for process %s (error %d)\n", 1431e7228204SAlfred Perlstein curproc->p_comm, error); 1432e7228204SAlfred Perlstein } 1433e7228204SAlfred Perlstein 1434e7228204SAlfred Perlstein done: 1435aa14e9b7SMark Johnston #ifdef GZIO 1436aa14e9b7SMark Johnston if (compress) { 1437aa14e9b7SMark Johnston free(tmpbuf, M_TEMP); 143802d131adSMark Johnston if (params.gzs != NULL) 1439aa14e9b7SMark Johnston gzio_fini(params.gzs); 1440aa14e9b7SMark Johnston } 14418b325009SAlfred Perlstein #endif 1442bd390213SMikolaj Golub while ((ninfo = TAILQ_FIRST(¬elst)) != NULL) { 1443bd390213SMikolaj Golub TAILQ_REMOVE(¬elst, ninfo, link); 1444bd390213SMikolaj Golub free(ninfo, M_TEMP); 1445bd390213SMikolaj Golub } 1446bd390213SMikolaj Golub if (hdr != NULL) 14470ff27d31SJohn Polstra free(hdr, M_TEMP); 14480ff27d31SJohn Polstra 1449a7cddfedSJake Burkholder return (error); 14508c64af4fSJohn Polstra } 14518c64af4fSJohn Polstra 14520ff27d31SJohn Polstra /* 14531005d8afSConrad Meyer * A callback for each_dumpable_segment() to write out the segment's 14540ff27d31SJohn Polstra * program header entry. 
14550ff27d31SJohn Polstra */ 14560ff27d31SJohn Polstra static void 14570ff27d31SJohn Polstra cb_put_phdr(entry, closure) 14580ff27d31SJohn Polstra vm_map_entry_t entry; 14590ff27d31SJohn Polstra void *closure; 14600ff27d31SJohn Polstra { 14610ff27d31SJohn Polstra struct phdr_closure *phc = (struct phdr_closure *)closure; 14620ff27d31SJohn Polstra Elf_Phdr *phdr = phc->phdr; 14630ff27d31SJohn Polstra 14640ff27d31SJohn Polstra phc->offset = round_page(phc->offset); 14650ff27d31SJohn Polstra 14660ff27d31SJohn Polstra phdr->p_type = PT_LOAD; 14670ff27d31SJohn Polstra phdr->p_offset = phc->offset; 14680ff27d31SJohn Polstra phdr->p_vaddr = entry->start; 14690ff27d31SJohn Polstra phdr->p_paddr = 0; 14700ff27d31SJohn Polstra phdr->p_filesz = phdr->p_memsz = entry->end - entry->start; 14710ff27d31SJohn Polstra phdr->p_align = PAGE_SIZE; 1472ed167eaaSKonstantin Belousov phdr->p_flags = __elfN(untrans_prot)(entry->protection); 14730ff27d31SJohn Polstra 14740ff27d31SJohn Polstra phc->offset += phdr->p_filesz; 14750ff27d31SJohn Polstra phc->phdr++; 14760ff27d31SJohn Polstra } 14770ff27d31SJohn Polstra 14780ff27d31SJohn Polstra /* 14791005d8afSConrad Meyer * A callback for each_dumpable_segment() to gather information about 14800ff27d31SJohn Polstra * the number of segments and their total size. 
14810ff27d31SJohn Polstra */ 14820ff27d31SJohn Polstra static void 1483f3325003SConrad Meyer cb_size_segment(vm_map_entry_t entry, void *closure) 14840ff27d31SJohn Polstra { 14850ff27d31SJohn Polstra struct sseg_closure *ssc = (struct sseg_closure *)closure; 14860ff27d31SJohn Polstra 14870ff27d31SJohn Polstra ssc->count++; 14880ff27d31SJohn Polstra ssc->size += entry->end - entry->start; 14890ff27d31SJohn Polstra } 14900ff27d31SJohn Polstra 14910ff27d31SJohn Polstra /* 14920ff27d31SJohn Polstra * For each writable segment in the process's memory map, call the given 14930ff27d31SJohn Polstra * function with a pointer to the map entry and some arbitrary 14940ff27d31SJohn Polstra * caller-supplied data. 14950ff27d31SJohn Polstra */ 14960ff27d31SJohn Polstra static void 14971005d8afSConrad Meyer each_dumpable_segment(struct thread *td, segment_callback func, void *closure) 14980ff27d31SJohn Polstra { 1499247aba24SMarcel Moolenaar struct proc *p = td->td_proc; 15000ff27d31SJohn Polstra vm_map_t map = &p->p_vmspace->vm_map; 15010ff27d31SJohn Polstra vm_map_entry_t entry; 1502976a87a2SAlan Cox vm_object_t backing_object, object; 1503976a87a2SAlan Cox boolean_t ignore_entry; 15040ff27d31SJohn Polstra 1505976a87a2SAlan Cox vm_map_lock_read(map); 15060ff27d31SJohn Polstra for (entry = map->header.next; entry != &map->header; 15070ff27d31SJohn Polstra entry = entry->next) { 1508fa7dd9c5SMatthew Dillon /* 1509fa7dd9c5SMatthew Dillon * Don't dump inaccessible mappings, deal with legacy 1510fa7dd9c5SMatthew Dillon * coredump mode. 1511fa7dd9c5SMatthew Dillon * 1512fa7dd9c5SMatthew Dillon * Note that read-only segments related to the elf binary 1513fa7dd9c5SMatthew Dillon * are marked MAP_ENTRY_NOCOREDUMP now so we no longer 1514fa7dd9c5SMatthew Dillon * need to arbitrarily ignore such segments. 
1515fa7dd9c5SMatthew Dillon */ 1516fa7dd9c5SMatthew Dillon if (elf_legacy_coredump) { 1517fa7dd9c5SMatthew Dillon if ((entry->protection & VM_PROT_RW) != VM_PROT_RW) 15180ff27d31SJohn Polstra continue; 1519fa7dd9c5SMatthew Dillon } else { 1520fa7dd9c5SMatthew Dillon if ((entry->protection & VM_PROT_ALL) == 0) 1521fa7dd9c5SMatthew Dillon continue; 1522fa7dd9c5SMatthew Dillon } 15230ff27d31SJohn Polstra 15249730a5daSPaul Saab /* 1525fa7dd9c5SMatthew Dillon * Dont include memory segment in the coredump if 1526fa7dd9c5SMatthew Dillon * MAP_NOCORE is set in mmap(2) or MADV_NOCORE in 1527fa7dd9c5SMatthew Dillon * madvise(2). Do not dump submaps (i.e. parts of the 1528fa7dd9c5SMatthew Dillon * kernel map). 15299730a5daSPaul Saab */ 1530fa7dd9c5SMatthew Dillon if (entry->eflags & (MAP_ENTRY_NOCOREDUMP|MAP_ENTRY_IS_SUB_MAP)) 15319730a5daSPaul Saab continue; 15329730a5daSPaul Saab 1533976a87a2SAlan Cox if ((object = entry->object.vm_object) == NULL) 15340ff27d31SJohn Polstra continue; 15350ff27d31SJohn Polstra 15360ff27d31SJohn Polstra /* Ignore memory-mapped devices and such things. 
*/ 1537bc403f03SAttilio Rao VM_OBJECT_RLOCK(object); 1538976a87a2SAlan Cox while ((backing_object = object->backing_object) != NULL) { 1539bc403f03SAttilio Rao VM_OBJECT_RLOCK(backing_object); 1540bc403f03SAttilio Rao VM_OBJECT_RUNLOCK(object); 1541976a87a2SAlan Cox object = backing_object; 1542976a87a2SAlan Cox } 1543976a87a2SAlan Cox ignore_entry = object->type != OBJT_DEFAULT && 1544bc411bc2SJohn Baldwin object->type != OBJT_SWAP && object->type != OBJT_VNODE && 1545bc411bc2SJohn Baldwin object->type != OBJT_PHYS; 1546bc403f03SAttilio Rao VM_OBJECT_RUNLOCK(object); 1547976a87a2SAlan Cox if (ignore_entry) 15480ff27d31SJohn Polstra continue; 15490ff27d31SJohn Polstra 15500ff27d31SJohn Polstra (*func)(entry, closure); 15510ff27d31SJohn Polstra } 1552976a87a2SAlan Cox vm_map_unlock_read(map); 15530ff27d31SJohn Polstra } 15540ff27d31SJohn Polstra 15550ff27d31SJohn Polstra /* 15560ff27d31SJohn Polstra * Write the core file header to the file, including padding up to 15570ff27d31SJohn Polstra * the page boundary. 15580ff27d31SJohn Polstra */ 15598c64af4fSJohn Polstra static int 1560aa14e9b7SMark Johnston __elfN(corehdr)(struct coredump_params *p, int numsegs, void *hdr, 1561aa14e9b7SMark Johnston size_t hdrsize, struct note_info_list *notelst, size_t notesz) 15628c64af4fSJohn Polstra { 1563bd390213SMikolaj Golub struct note_info *ninfo; 1564bd390213SMikolaj Golub struct sbuf *sb; 1565bd390213SMikolaj Golub int error; 15668c64af4fSJohn Polstra 15678c64af4fSJohn Polstra /* Fill in the header. 
*/ 15680ff27d31SJohn Polstra bzero(hdr, hdrsize); 1569aa14e9b7SMark Johnston __elfN(puthdr)(p->td, hdr, hdrsize, numsegs, notesz); 15708c64af4fSJohn Polstra 1571bd390213SMikolaj Golub sb = sbuf_new(NULL, NULL, CORE_BUF_SIZE, SBUF_FIXEDLEN); 1572aa14e9b7SMark Johnston sbuf_set_drain(sb, sbuf_drain_core_output, p); 1573bd390213SMikolaj Golub sbuf_start_section(sb, NULL); 1574bd390213SMikolaj Golub sbuf_bcat(sb, hdr, hdrsize); 1575bd390213SMikolaj Golub TAILQ_FOREACH(ninfo, notelst, link) 1576bd390213SMikolaj Golub __elfN(putnote)(ninfo, sb); 1577bd390213SMikolaj Golub /* Align up to a page boundary for the program segments. */ 1578bd390213SMikolaj Golub sbuf_end_section(sb, -1, PAGE_SIZE, 0); 1579bd390213SMikolaj Golub error = sbuf_finish(sb); 1580bd390213SMikolaj Golub sbuf_delete(sb); 1581bd390213SMikolaj Golub 1582bd390213SMikolaj Golub return (error); 1583e7228204SAlfred Perlstein } 1584bd390213SMikolaj Golub 1585bd390213SMikolaj Golub static void 1586bd390213SMikolaj Golub __elfN(prepare_notes)(struct thread *td, struct note_info_list *list, 1587bd390213SMikolaj Golub size_t *sizep) 1588bd390213SMikolaj Golub { 1589bd390213SMikolaj Golub struct proc *p; 1590bd390213SMikolaj Golub struct thread *thr; 1591bd390213SMikolaj Golub size_t size; 1592bd390213SMikolaj Golub 1593bd390213SMikolaj Golub p = td->td_proc; 1594bd390213SMikolaj Golub size = 0; 1595bd390213SMikolaj Golub 1596bd390213SMikolaj Golub size += register_note(list, NT_PRPSINFO, __elfN(note_prpsinfo), p); 1597bd390213SMikolaj Golub 1598bd390213SMikolaj Golub /* 1599bd390213SMikolaj Golub * To have the debugger select the right thread (LWP) as the initial 1600bd390213SMikolaj Golub * thread, we dump the state of the thread passed to us in td first. 1601bd390213SMikolaj Golub * This is the thread that causes the core dump and thus likely to 1602bd390213SMikolaj Golub * be the right thread one wants to have selected in the debugger. 
1603bd390213SMikolaj Golub */ 1604bd390213SMikolaj Golub thr = td; 1605bd390213SMikolaj Golub while (thr != NULL) { 1606bd390213SMikolaj Golub size += register_note(list, NT_PRSTATUS, 1607bd390213SMikolaj Golub __elfN(note_prstatus), thr); 1608bd390213SMikolaj Golub size += register_note(list, NT_FPREGSET, 1609bd390213SMikolaj Golub __elfN(note_fpregset), thr); 1610bd390213SMikolaj Golub size += register_note(list, NT_THRMISC, 1611bd390213SMikolaj Golub __elfN(note_thrmisc), thr); 1612bd390213SMikolaj Golub size += register_note(list, -1, 1613bd390213SMikolaj Golub __elfN(note_threadmd), thr); 1614bd390213SMikolaj Golub 1615bd390213SMikolaj Golub thr = (thr == td) ? TAILQ_FIRST(&p->p_threads) : 1616bd390213SMikolaj Golub TAILQ_NEXT(thr, td_plist); 1617bd390213SMikolaj Golub if (thr == td) 1618bd390213SMikolaj Golub thr = TAILQ_NEXT(thr, td_plist); 1619dada0278SJohn Polstra } 1620dada0278SJohn Polstra 1621f1fca82eSMikolaj Golub size += register_note(list, NT_PROCSTAT_PROC, 1622f1fca82eSMikolaj Golub __elfN(note_procstat_proc), p); 1623f1fca82eSMikolaj Golub size += register_note(list, NT_PROCSTAT_FILES, 1624f1fca82eSMikolaj Golub note_procstat_files, p); 1625f1fca82eSMikolaj Golub size += register_note(list, NT_PROCSTAT_VMMAP, 1626f1fca82eSMikolaj Golub note_procstat_vmmap, p); 1627f1fca82eSMikolaj Golub size += register_note(list, NT_PROCSTAT_GROUPS, 1628f1fca82eSMikolaj Golub note_procstat_groups, p); 1629f1fca82eSMikolaj Golub size += register_note(list, NT_PROCSTAT_UMASK, 1630f1fca82eSMikolaj Golub note_procstat_umask, p); 1631f1fca82eSMikolaj Golub size += register_note(list, NT_PROCSTAT_RLIMIT, 1632f1fca82eSMikolaj Golub note_procstat_rlimit, p); 1633f1fca82eSMikolaj Golub size += register_note(list, NT_PROCSTAT_OSREL, 1634f1fca82eSMikolaj Golub note_procstat_osrel, p); 1635f1fca82eSMikolaj Golub size += register_note(list, NT_PROCSTAT_PSSTRINGS, 1636f1fca82eSMikolaj Golub __elfN(note_procstat_psstrings), p); 1637f1fca82eSMikolaj Golub size += 
register_note(list, NT_PROCSTAT_AUXV, 1638f1fca82eSMikolaj Golub __elfN(note_procstat_auxv), p); 1639f1fca82eSMikolaj Golub 1640bd390213SMikolaj Golub *sizep = size; 1641bd390213SMikolaj Golub } 1642bd390213SMikolaj Golub 1643bd390213SMikolaj Golub static void 1644bd390213SMikolaj Golub __elfN(puthdr)(struct thread *td, void *hdr, size_t hdrsize, int numsegs, 1645bd390213SMikolaj Golub size_t notesz) 1646bd390213SMikolaj Golub { 1647bd390213SMikolaj Golub Elf_Ehdr *ehdr; 1648bd390213SMikolaj Golub Elf_Phdr *phdr; 1649c17b0bd2SConrad Meyer Elf_Shdr *shdr; 1650bd390213SMikolaj Golub struct phdr_closure phc; 1651bd390213SMikolaj Golub 1652bd390213SMikolaj Golub ehdr = (Elf_Ehdr *)hdr; 1653bd390213SMikolaj Golub 1654bd390213SMikolaj Golub ehdr->e_ident[EI_MAG0] = ELFMAG0; 1655bd390213SMikolaj Golub ehdr->e_ident[EI_MAG1] = ELFMAG1; 1656bd390213SMikolaj Golub ehdr->e_ident[EI_MAG2] = ELFMAG2; 1657bd390213SMikolaj Golub ehdr->e_ident[EI_MAG3] = ELFMAG3; 1658bd390213SMikolaj Golub ehdr->e_ident[EI_CLASS] = ELF_CLASS; 1659bd390213SMikolaj Golub ehdr->e_ident[EI_DATA] = ELF_DATA; 1660bd390213SMikolaj Golub ehdr->e_ident[EI_VERSION] = EV_CURRENT; 1661bd390213SMikolaj Golub ehdr->e_ident[EI_OSABI] = ELFOSABI_FREEBSD; 1662bd390213SMikolaj Golub ehdr->e_ident[EI_ABIVERSION] = 0; 1663bd390213SMikolaj Golub ehdr->e_ident[EI_PAD] = 0; 1664bd390213SMikolaj Golub ehdr->e_type = ET_CORE; 1665885f13dcSJohn Baldwin ehdr->e_machine = td->td_proc->p_elf_machine; 1666bd390213SMikolaj Golub ehdr->e_version = EV_CURRENT; 1667bd390213SMikolaj Golub ehdr->e_entry = 0; 1668bd390213SMikolaj Golub ehdr->e_phoff = sizeof(Elf_Ehdr); 1669885f13dcSJohn Baldwin ehdr->e_flags = td->td_proc->p_elf_flags; 1670bd390213SMikolaj Golub ehdr->e_ehsize = sizeof(Elf_Ehdr); 1671bd390213SMikolaj Golub ehdr->e_phentsize = sizeof(Elf_Phdr); 1672bd390213SMikolaj Golub ehdr->e_shentsize = sizeof(Elf_Shdr); 1673bd390213SMikolaj Golub ehdr->e_shstrndx = SHN_UNDEF; 1674c17b0bd2SConrad Meyer if (numsegs + 1 < PN_XNUM) { 
1675c17b0bd2SConrad Meyer ehdr->e_phnum = numsegs + 1; 1676c17b0bd2SConrad Meyer ehdr->e_shnum = 0; 1677c17b0bd2SConrad Meyer } else { 1678c17b0bd2SConrad Meyer ehdr->e_phnum = PN_XNUM; 1679c17b0bd2SConrad Meyer ehdr->e_shnum = 1; 1680c17b0bd2SConrad Meyer 1681c17b0bd2SConrad Meyer ehdr->e_shoff = ehdr->e_phoff + 1682c17b0bd2SConrad Meyer (numsegs + 1) * ehdr->e_phentsize; 1683c17b0bd2SConrad Meyer KASSERT(ehdr->e_shoff == hdrsize - sizeof(Elf_Shdr), 1684c17b0bd2SConrad Meyer ("e_shoff: %zu, hdrsize - shdr: %zu", 168507f825e8SConrad Meyer (size_t)ehdr->e_shoff, hdrsize - sizeof(Elf_Shdr))); 1686c17b0bd2SConrad Meyer 1687c17b0bd2SConrad Meyer shdr = (Elf_Shdr *)((char *)hdr + ehdr->e_shoff); 1688c17b0bd2SConrad Meyer memset(shdr, 0, sizeof(*shdr)); 1689c17b0bd2SConrad Meyer /* 1690c17b0bd2SConrad Meyer * A special first section is used to hold large segment and 1691c17b0bd2SConrad Meyer * section counts. This was proposed by Sun Microsystems in 1692c17b0bd2SConrad Meyer * Solaris and has been adopted by Linux; the standard ELF 1693c17b0bd2SConrad Meyer * tools are already familiar with the technique. 1694c17b0bd2SConrad Meyer * 1695c17b0bd2SConrad Meyer * See table 7-7 of the Solaris "Linker and Libraries Guide" 1696c17b0bd2SConrad Meyer * (or 12-7 depending on the version of the document) for more 1697c17b0bd2SConrad Meyer * details. 1698c17b0bd2SConrad Meyer */ 1699c17b0bd2SConrad Meyer shdr->sh_type = SHT_NULL; 1700c17b0bd2SConrad Meyer shdr->sh_size = ehdr->e_shnum; 1701c17b0bd2SConrad Meyer shdr->sh_link = ehdr->e_shstrndx; 1702c17b0bd2SConrad Meyer shdr->sh_info = numsegs + 1; 1703c17b0bd2SConrad Meyer } 1704bd390213SMikolaj Golub 1705bd390213SMikolaj Golub /* 1706bd390213SMikolaj Golub * Fill in the program header entries. 1707bd390213SMikolaj Golub */ 1708c17b0bd2SConrad Meyer phdr = (Elf_Phdr *)((char *)hdr + ehdr->e_phoff); 1709bd390213SMikolaj Golub 1710bd390213SMikolaj Golub /* The note segement. 
*/ 1711bd390213SMikolaj Golub phdr->p_type = PT_NOTE; 1712bd390213SMikolaj Golub phdr->p_offset = hdrsize; 1713bd390213SMikolaj Golub phdr->p_vaddr = 0; 1714bd390213SMikolaj Golub phdr->p_paddr = 0; 1715bd390213SMikolaj Golub phdr->p_filesz = notesz; 1716bd390213SMikolaj Golub phdr->p_memsz = 0; 1717bd390213SMikolaj Golub phdr->p_flags = PF_R; 17181b8388cdSMikolaj Golub phdr->p_align = ELF_NOTE_ROUNDSIZE; 1719bd390213SMikolaj Golub phdr++; 1720bd390213SMikolaj Golub 1721bd390213SMikolaj Golub /* All the writable segments from the program. */ 1722bd390213SMikolaj Golub phc.phdr = phdr; 1723bd390213SMikolaj Golub phc.offset = round_page(hdrsize + notesz); 17241005d8afSConrad Meyer each_dumpable_segment(td, cb_put_phdr, &phc); 1725bd390213SMikolaj Golub } 1726bd390213SMikolaj Golub 1727bd390213SMikolaj Golub static size_t 1728bd390213SMikolaj Golub register_note(struct note_info_list *list, int type, outfunc_t out, void *arg) 1729bd390213SMikolaj Golub { 1730bd390213SMikolaj Golub struct note_info *ninfo; 1731bd390213SMikolaj Golub size_t size, notesize; 1732bd390213SMikolaj Golub 1733bd390213SMikolaj Golub size = 0; 1734bd390213SMikolaj Golub out(arg, NULL, &size); 1735bd390213SMikolaj Golub ninfo = malloc(sizeof(*ninfo), M_TEMP, M_ZERO | M_WAITOK); 1736bd390213SMikolaj Golub ninfo->type = type; 1737bd390213SMikolaj Golub ninfo->outfunc = out; 1738bd390213SMikolaj Golub ninfo->outarg = arg; 1739bd390213SMikolaj Golub ninfo->outsize = size; 1740bd390213SMikolaj Golub TAILQ_INSERT_TAIL(list, ninfo, link); 1741bd390213SMikolaj Golub 1742bd390213SMikolaj Golub if (type == -1) 1743bd390213SMikolaj Golub return (size); 1744bd390213SMikolaj Golub 1745bd390213SMikolaj Golub notesize = sizeof(Elf_Note) + /* note header */ 1746180e57e5SJohn Baldwin roundup2(sizeof(FREEBSD_ABI_VENDOR), ELF_NOTE_ROUNDSIZE) + 1747180e57e5SJohn Baldwin /* note name */ 1748180e57e5SJohn Baldwin roundup2(size, ELF_NOTE_ROUNDSIZE); /* note description */ 1749180e57e5SJohn Baldwin 1750180e57e5SJohn 
Baldwin return (notesize); 1751180e57e5SJohn Baldwin } 1752180e57e5SJohn Baldwin 1753180e57e5SJohn Baldwin static size_t 1754180e57e5SJohn Baldwin append_note_data(const void *src, void *dst, size_t len) 1755180e57e5SJohn Baldwin { 1756180e57e5SJohn Baldwin size_t padded_len; 1757180e57e5SJohn Baldwin 1758180e57e5SJohn Baldwin padded_len = roundup2(len, ELF_NOTE_ROUNDSIZE); 1759180e57e5SJohn Baldwin if (dst != NULL) { 1760180e57e5SJohn Baldwin bcopy(src, dst, len); 1761180e57e5SJohn Baldwin bzero((char *)dst + len, padded_len - len); 1762180e57e5SJohn Baldwin } 1763180e57e5SJohn Baldwin return (padded_len); 1764180e57e5SJohn Baldwin } 1765180e57e5SJohn Baldwin 1766180e57e5SJohn Baldwin size_t 1767180e57e5SJohn Baldwin __elfN(populate_note)(int type, void *src, void *dst, size_t size, void **descp) 1768180e57e5SJohn Baldwin { 1769180e57e5SJohn Baldwin Elf_Note *note; 1770180e57e5SJohn Baldwin char *buf; 1771180e57e5SJohn Baldwin size_t notesize; 1772180e57e5SJohn Baldwin 1773180e57e5SJohn Baldwin buf = dst; 1774180e57e5SJohn Baldwin if (buf != NULL) { 1775180e57e5SJohn Baldwin note = (Elf_Note *)buf; 1776180e57e5SJohn Baldwin note->n_namesz = sizeof(FREEBSD_ABI_VENDOR); 1777180e57e5SJohn Baldwin note->n_descsz = size; 1778180e57e5SJohn Baldwin note->n_type = type; 1779180e57e5SJohn Baldwin buf += sizeof(*note); 1780180e57e5SJohn Baldwin buf += append_note_data(FREEBSD_ABI_VENDOR, buf, 1781180e57e5SJohn Baldwin sizeof(FREEBSD_ABI_VENDOR)); 1782180e57e5SJohn Baldwin append_note_data(src, buf, size); 1783180e57e5SJohn Baldwin if (descp != NULL) 1784180e57e5SJohn Baldwin *descp = buf; 1785180e57e5SJohn Baldwin } 1786180e57e5SJohn Baldwin 1787180e57e5SJohn Baldwin notesize = sizeof(Elf_Note) + /* note header */ 1788180e57e5SJohn Baldwin roundup2(sizeof(FREEBSD_ABI_VENDOR), ELF_NOTE_ROUNDSIZE) + 1789180e57e5SJohn Baldwin /* note name */ 17901b8388cdSMikolaj Golub roundup2(size, ELF_NOTE_ROUNDSIZE); /* note description */ 1791bd390213SMikolaj Golub 1792bd390213SMikolaj 
Golub return (notesize); 1793bd390213SMikolaj Golub } 1794bd390213SMikolaj Golub 1795bd390213SMikolaj Golub static void 1796bd390213SMikolaj Golub __elfN(putnote)(struct note_info *ninfo, struct sbuf *sb) 1797bd390213SMikolaj Golub { 1798bd390213SMikolaj Golub Elf_Note note; 179914bdbaf2SConrad Meyer ssize_t old_len, sect_len; 180014bdbaf2SConrad Meyer size_t new_len, descsz, i; 1801bd390213SMikolaj Golub 1802bd390213SMikolaj Golub if (ninfo->type == -1) { 1803bd390213SMikolaj Golub ninfo->outfunc(ninfo->outarg, sb, &ninfo->outsize); 1804bd390213SMikolaj Golub return; 1805bd390213SMikolaj Golub } 1806bd390213SMikolaj Golub 1807180e57e5SJohn Baldwin note.n_namesz = sizeof(FREEBSD_ABI_VENDOR); 1808bd390213SMikolaj Golub note.n_descsz = ninfo->outsize; 1809bd390213SMikolaj Golub note.n_type = ninfo->type; 1810bd390213SMikolaj Golub 1811bd390213SMikolaj Golub sbuf_bcat(sb, ¬e, sizeof(note)); 1812bd390213SMikolaj Golub sbuf_start_section(sb, &old_len); 1813180e57e5SJohn Baldwin sbuf_bcat(sb, FREEBSD_ABI_VENDOR, sizeof(FREEBSD_ABI_VENDOR)); 18141b8388cdSMikolaj Golub sbuf_end_section(sb, old_len, ELF_NOTE_ROUNDSIZE, 0); 1815bd390213SMikolaj Golub if (note.n_descsz == 0) 1816bd390213SMikolaj Golub return; 1817bd390213SMikolaj Golub sbuf_start_section(sb, &old_len); 1818bd390213SMikolaj Golub ninfo->outfunc(ninfo->outarg, sb, &ninfo->outsize); 181914bdbaf2SConrad Meyer sect_len = sbuf_end_section(sb, old_len, ELF_NOTE_ROUNDSIZE, 0); 182014bdbaf2SConrad Meyer if (sect_len < 0) 182114bdbaf2SConrad Meyer return; 182214bdbaf2SConrad Meyer 182314bdbaf2SConrad Meyer new_len = (size_t)sect_len; 182414bdbaf2SConrad Meyer descsz = roundup(note.n_descsz, ELF_NOTE_ROUNDSIZE); 182514bdbaf2SConrad Meyer if (new_len < descsz) { 182614bdbaf2SConrad Meyer /* 182714bdbaf2SConrad Meyer * It is expected that individual note emitters will correctly 182814bdbaf2SConrad Meyer * predict their expected output size and fill up to that size 182914bdbaf2SConrad Meyer * themselves, padding in a 
format-specific way if needed. 183014bdbaf2SConrad Meyer * However, in case they don't, just do it here with zeros. 183114bdbaf2SConrad Meyer */ 183214bdbaf2SConrad Meyer for (i = 0; i < descsz - new_len; i++) 183314bdbaf2SConrad Meyer sbuf_putc(sb, 0); 183414bdbaf2SConrad Meyer } else if (new_len > descsz) { 183514bdbaf2SConrad Meyer /* 183614bdbaf2SConrad Meyer * We can't always truncate sb -- we may have drained some 183714bdbaf2SConrad Meyer * of it already. 183814bdbaf2SConrad Meyer */ 183914bdbaf2SConrad Meyer KASSERT(new_len == descsz, ("%s: Note type %u changed as we " 184014bdbaf2SConrad Meyer "read it (%zu > %zu). Since it is longer than " 184114bdbaf2SConrad Meyer "expected, this coredump's notes are corrupt. THIS " 184214bdbaf2SConrad Meyer "IS A BUG in the note_procstat routine for type %u.\n", 184314bdbaf2SConrad Meyer __func__, (unsigned)note.n_type, new_len, descsz, 184414bdbaf2SConrad Meyer (unsigned)note.n_type)); 184514bdbaf2SConrad Meyer } 1846bd390213SMikolaj Golub } 1847bd390213SMikolaj Golub 1848bd390213SMikolaj Golub /* 1849bd390213SMikolaj Golub * Miscellaneous note out functions. 
1850bd390213SMikolaj Golub */ 1851bd390213SMikolaj Golub 1852841c0c7eSNathan Whitehorn #if defined(COMPAT_FREEBSD32) && __ELF_WORD_SIZE == 32 1853841c0c7eSNathan Whitehorn #include <compat/freebsd32/freebsd32.h> 1854841c0c7eSNathan Whitehorn 185562919d78SPeter Wemm typedef struct prstatus32 elf_prstatus_t; 185662919d78SPeter Wemm typedef struct prpsinfo32 elf_prpsinfo_t; 185762919d78SPeter Wemm typedef struct fpreg32 elf_prfpregset_t; 185862919d78SPeter Wemm typedef struct fpreg32 elf_fpregset_t; 185962919d78SPeter Wemm typedef struct reg32 elf_gregset_t; 18607f08176eSAttilio Rao typedef struct thrmisc32 elf_thrmisc_t; 1861f1fca82eSMikolaj Golub #define ELF_KERN_PROC_MASK KERN_PROC_MASK32 1862f1fca82eSMikolaj Golub typedef struct kinfo_proc32 elf_kinfo_proc_t; 1863f1fca82eSMikolaj Golub typedef uint32_t elf_ps_strings_t; 186462919d78SPeter Wemm #else 186562919d78SPeter Wemm typedef prstatus_t elf_prstatus_t; 186662919d78SPeter Wemm typedef prpsinfo_t elf_prpsinfo_t; 186762919d78SPeter Wemm typedef prfpregset_t elf_prfpregset_t; 186862919d78SPeter Wemm typedef prfpregset_t elf_fpregset_t; 186962919d78SPeter Wemm typedef gregset_t elf_gregset_t; 18707f08176eSAttilio Rao typedef thrmisc_t elf_thrmisc_t; 1871f1fca82eSMikolaj Golub #define ELF_KERN_PROC_MASK 0 1872f1fca82eSMikolaj Golub typedef struct kinfo_proc elf_kinfo_proc_t; 1873f1fca82eSMikolaj Golub typedef vm_offset_t elf_ps_strings_t; 187462919d78SPeter Wemm #endif 187562919d78SPeter Wemm 18768c64af4fSJohn Polstra static void 1877bd390213SMikolaj Golub __elfN(note_prpsinfo)(void *arg, struct sbuf *sb, size_t *sizep) 18788c64af4fSJohn Polstra { 1879c77547d2SJohn Baldwin struct sbuf sbarg; 1880c77547d2SJohn Baldwin size_t len; 1881c77547d2SJohn Baldwin char *cp, *end; 1882247aba24SMarcel Moolenaar struct proc *p; 1883bd390213SMikolaj Golub elf_prpsinfo_t *psinfo; 1884c77547d2SJohn Baldwin int error; 18858c64af4fSJohn Polstra 1886bd390213SMikolaj Golub p = (struct proc *)arg; 1887bd390213SMikolaj Golub if (sb != 
NULL) { 1888bd390213SMikolaj Golub KASSERT(*sizep == sizeof(*psinfo), ("invalid size")); 1889bd390213SMikolaj Golub psinfo = malloc(sizeof(*psinfo), M_TEMP, M_ZERO | M_WAITOK); 18908c9b7b2cSMarcel Moolenaar psinfo->pr_version = PRPSINFO_VERSION; 189162919d78SPeter Wemm psinfo->pr_psinfosz = sizeof(elf_prpsinfo_t); 1892ccd3953eSJohn Baldwin strlcpy(psinfo->pr_fname, p->p_comm, sizeof(psinfo->pr_fname)); 1893c77547d2SJohn Baldwin PROC_LOCK(p); 1894c77547d2SJohn Baldwin if (p->p_args != NULL) { 1895c77547d2SJohn Baldwin len = sizeof(psinfo->pr_psargs) - 1; 1896c77547d2SJohn Baldwin if (len > p->p_args->ar_length) 1897c77547d2SJohn Baldwin len = p->p_args->ar_length; 1898c77547d2SJohn Baldwin memcpy(psinfo->pr_psargs, p->p_args->ar_args, len); 1899c77547d2SJohn Baldwin PROC_UNLOCK(p); 1900c77547d2SJohn Baldwin error = 0; 1901c77547d2SJohn Baldwin } else { 1902c77547d2SJohn Baldwin _PHOLD(p); 1903c77547d2SJohn Baldwin PROC_UNLOCK(p); 1904c77547d2SJohn Baldwin sbuf_new(&sbarg, psinfo->pr_psargs, 1905c77547d2SJohn Baldwin sizeof(psinfo->pr_psargs), SBUF_FIXEDLEN); 1906c77547d2SJohn Baldwin error = proc_getargv(curthread, p, &sbarg); 1907c77547d2SJohn Baldwin PRELE(p); 1908c77547d2SJohn Baldwin if (sbuf_finish(&sbarg) == 0) 1909c77547d2SJohn Baldwin len = sbuf_len(&sbarg) - 1; 1910c77547d2SJohn Baldwin else 1911c77547d2SJohn Baldwin len = sizeof(psinfo->pr_psargs) - 1; 1912c77547d2SJohn Baldwin sbuf_delete(&sbarg); 1913c77547d2SJohn Baldwin } 1914c77547d2SJohn Baldwin if (error || len == 0) 1915ccd3953eSJohn Baldwin strlcpy(psinfo->pr_psargs, p->p_comm, 19168c9b7b2cSMarcel Moolenaar sizeof(psinfo->pr_psargs)); 1917c77547d2SJohn Baldwin else { 1918c77547d2SJohn Baldwin KASSERT(len < sizeof(psinfo->pr_psargs), 1919c77547d2SJohn Baldwin ("len is too long: %zu vs %zu", len, 1920c77547d2SJohn Baldwin sizeof(psinfo->pr_psargs))); 1921c77547d2SJohn Baldwin cp = psinfo->pr_psargs; 1922c77547d2SJohn Baldwin end = cp + len - 1; 1923c77547d2SJohn Baldwin for (;;) { 1924c77547d2SJohn 
Baldwin cp = memchr(cp, '\0', end - cp); 1925c77547d2SJohn Baldwin if (cp == NULL) 1926c77547d2SJohn Baldwin break; 1927c77547d2SJohn Baldwin *cp = ' '; 1928c77547d2SJohn Baldwin } 1929c77547d2SJohn Baldwin } 1930ccb83afdSJohn Baldwin psinfo->pr_pid = p->p_pid; 1931bd390213SMikolaj Golub sbuf_bcat(sb, psinfo, sizeof(*psinfo)); 1932bd390213SMikolaj Golub free(psinfo, M_TEMP); 1933bd390213SMikolaj Golub } 1934bd390213SMikolaj Golub *sizep = sizeof(*psinfo); 1935bd390213SMikolaj Golub } 1936bd390213SMikolaj Golub 1937bd390213SMikolaj Golub static void 1938bd390213SMikolaj Golub __elfN(note_prstatus)(void *arg, struct sbuf *sb, size_t *sizep) 1939bd390213SMikolaj Golub { 1940bd390213SMikolaj Golub struct thread *td; 1941bd390213SMikolaj Golub elf_prstatus_t *status; 1942bd390213SMikolaj Golub 1943bd390213SMikolaj Golub td = (struct thread *)arg; 1944bd390213SMikolaj Golub if (sb != NULL) { 1945bd390213SMikolaj Golub KASSERT(*sizep == sizeof(*status), ("invalid size")); 1946bd390213SMikolaj Golub status = malloc(sizeof(*status), M_TEMP, M_ZERO | M_WAITOK); 19478c9b7b2cSMarcel Moolenaar status->pr_version = PRSTATUS_VERSION; 194862919d78SPeter Wemm status->pr_statussz = sizeof(elf_prstatus_t); 194962919d78SPeter Wemm status->pr_gregsetsz = sizeof(elf_gregset_t); 195062919d78SPeter Wemm status->pr_fpregsetsz = sizeof(elf_fpregset_t); 19518c9b7b2cSMarcel Moolenaar status->pr_osreldate = osreldate; 1952bd390213SMikolaj Golub status->pr_cursig = td->td_proc->p_sig; 1953bd390213SMikolaj Golub status->pr_pid = td->td_tid; 1954841c0c7eSNathan Whitehorn #if defined(COMPAT_FREEBSD32) && __ELF_WORD_SIZE == 32 1955bd390213SMikolaj Golub fill_regs32(td, &status->pr_reg); 195662919d78SPeter Wemm #else 1957bd390213SMikolaj Golub fill_regs(td, &status->pr_reg); 195862919d78SPeter Wemm #endif 1959bd390213SMikolaj Golub sbuf_bcat(sb, status, sizeof(*status)); 1960bd390213SMikolaj Golub free(status, M_TEMP); 19618c9b7b2cSMarcel Moolenaar } 1962bd390213SMikolaj Golub *sizep = 
sizeof(*status); 1963bd390213SMikolaj Golub } 1964bd390213SMikolaj Golub 1965bd390213SMikolaj Golub static void 1966bd390213SMikolaj Golub __elfN(note_fpregset)(void *arg, struct sbuf *sb, size_t *sizep) 1967bd390213SMikolaj Golub { 1968bd390213SMikolaj Golub struct thread *td; 1969bd390213SMikolaj Golub elf_prfpregset_t *fpregset; 1970bd390213SMikolaj Golub 1971bd390213SMikolaj Golub td = (struct thread *)arg; 1972bd390213SMikolaj Golub if (sb != NULL) { 1973bd390213SMikolaj Golub KASSERT(*sizep == sizeof(*fpregset), ("invalid size")); 1974bd390213SMikolaj Golub fpregset = malloc(sizeof(*fpregset), M_TEMP, M_ZERO | M_WAITOK); 1975bd390213SMikolaj Golub #if defined(COMPAT_FREEBSD32) && __ELF_WORD_SIZE == 32 1976bd390213SMikolaj Golub fill_fpregs32(td, fpregset); 1977bd390213SMikolaj Golub #else 1978bd390213SMikolaj Golub fill_fpregs(td, fpregset); 1979bd390213SMikolaj Golub #endif 1980bd390213SMikolaj Golub sbuf_bcat(sb, fpregset, sizeof(*fpregset)); 1981bd390213SMikolaj Golub free(fpregset, M_TEMP); 1982bd390213SMikolaj Golub } 1983bd390213SMikolaj Golub *sizep = sizeof(*fpregset); 1984bd390213SMikolaj Golub } 1985bd390213SMikolaj Golub 1986bd390213SMikolaj Golub static void 1987bd390213SMikolaj Golub __elfN(note_thrmisc)(void *arg, struct sbuf *sb, size_t *sizep) 1988bd390213SMikolaj Golub { 1989bd390213SMikolaj Golub struct thread *td; 1990bd390213SMikolaj Golub elf_thrmisc_t thrmisc; 1991bd390213SMikolaj Golub 1992bd390213SMikolaj Golub td = (struct thread *)arg; 1993bd390213SMikolaj Golub if (sb != NULL) { 1994bd390213SMikolaj Golub KASSERT(*sizep == sizeof(thrmisc), ("invalid size")); 1995bd390213SMikolaj Golub bzero(&thrmisc._pad, sizeof(thrmisc._pad)); 1996bd390213SMikolaj Golub strcpy(thrmisc.pr_tname, td->td_name); 1997bd390213SMikolaj Golub sbuf_bcat(sb, &thrmisc, sizeof(thrmisc)); 1998bd390213SMikolaj Golub } 1999bd390213SMikolaj Golub *sizep = sizeof(thrmisc); 2000bd390213SMikolaj Golub } 2001bd390213SMikolaj Golub 20024da47b2fSMarcel Moolenaar /* 
20034da47b2fSMarcel Moolenaar * Allow for MD specific notes, as well as any MD 20044da47b2fSMarcel Moolenaar * specific preparations for writing MI notes. 20054da47b2fSMarcel Moolenaar */ 20068c64af4fSJohn Polstra static void 2007bd390213SMikolaj Golub __elfN(note_threadmd)(void *arg, struct sbuf *sb, size_t *sizep) 20088c64af4fSJohn Polstra { 2009bd390213SMikolaj Golub struct thread *td; 2010bd390213SMikolaj Golub void *buf; 2011bd390213SMikolaj Golub size_t size; 20128c64af4fSJohn Polstra 2013bd390213SMikolaj Golub td = (struct thread *)arg; 2014bd390213SMikolaj Golub size = *sizep; 2015bd390213SMikolaj Golub if (size != 0 && sb != NULL) 2016bd390213SMikolaj Golub buf = malloc(size, M_TEMP, M_ZERO | M_WAITOK); 201783a396ceSChristian Brueffer else 201883a396ceSChristian Brueffer buf = NULL; 2019bd390213SMikolaj Golub size = 0; 2020bd390213SMikolaj Golub __elfN(dump_thread)(td, buf, &size); 202164779280SKonstantin Belousov KASSERT(sb == NULL || *sizep == size, ("invalid size")); 202283a396ceSChristian Brueffer if (size != 0 && sb != NULL) 2023bd390213SMikolaj Golub sbuf_bcat(sb, buf, size); 2024a1761d73SChristian Brueffer free(buf, M_TEMP); 2025bd390213SMikolaj Golub *sizep = size; 20268c64af4fSJohn Polstra } 20278c64af4fSJohn Polstra 2028f1fca82eSMikolaj Golub #ifdef KINFO_PROC_SIZE 2029f1fca82eSMikolaj Golub CTASSERT(sizeof(struct kinfo_proc) == KINFO_PROC_SIZE); 2030f1fca82eSMikolaj Golub #endif 2031f1fca82eSMikolaj Golub 2032f1fca82eSMikolaj Golub static void 2033f1fca82eSMikolaj Golub __elfN(note_procstat_proc)(void *arg, struct sbuf *sb, size_t *sizep) 2034f1fca82eSMikolaj Golub { 2035f1fca82eSMikolaj Golub struct proc *p; 2036f1fca82eSMikolaj Golub size_t size; 2037f1fca82eSMikolaj Golub int structsize; 2038f1fca82eSMikolaj Golub 2039f1fca82eSMikolaj Golub p = (struct proc *)arg; 2040f1fca82eSMikolaj Golub size = sizeof(structsize) + p->p_numthreads * 2041f1fca82eSMikolaj Golub sizeof(elf_kinfo_proc_t); 2042f1fca82eSMikolaj Golub 2043f1fca82eSMikolaj Golub 
if (sb != NULL) { 2044f1fca82eSMikolaj Golub KASSERT(*sizep == size, ("invalid size")); 2045f1fca82eSMikolaj Golub structsize = sizeof(elf_kinfo_proc_t); 2046f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 20476662ce5aSMateusz Guzik sx_slock(&proctree_lock); 2048f1fca82eSMikolaj Golub PROC_LOCK(p); 2049f1fca82eSMikolaj Golub kern_proc_out(p, sb, ELF_KERN_PROC_MASK); 20506662ce5aSMateusz Guzik sx_sunlock(&proctree_lock); 2051f1fca82eSMikolaj Golub } 2052f1fca82eSMikolaj Golub *sizep = size; 2053f1fca82eSMikolaj Golub } 2054f1fca82eSMikolaj Golub 2055f1fca82eSMikolaj Golub #ifdef KINFO_FILE_SIZE 2056f1fca82eSMikolaj Golub CTASSERT(sizeof(struct kinfo_file) == KINFO_FILE_SIZE); 2057f1fca82eSMikolaj Golub #endif 2058f1fca82eSMikolaj Golub 2059f1fca82eSMikolaj Golub static void 2060f1fca82eSMikolaj Golub note_procstat_files(void *arg, struct sbuf *sb, size_t *sizep) 2061f1fca82eSMikolaj Golub { 2062f1fca82eSMikolaj Golub struct proc *p; 206314bdbaf2SConrad Meyer size_t size, sect_sz, i; 206414bdbaf2SConrad Meyer ssize_t start_len, sect_len; 206514bdbaf2SConrad Meyer int structsize, filedesc_flags; 206614bdbaf2SConrad Meyer 2067bcb60d52SConrad Meyer if (coredump_pack_fileinfo) 206814bdbaf2SConrad Meyer filedesc_flags = KERN_FILEDESC_PACK_KINFO; 206914bdbaf2SConrad Meyer else 207014bdbaf2SConrad Meyer filedesc_flags = 0; 2071f1fca82eSMikolaj Golub 2072f1fca82eSMikolaj Golub p = (struct proc *)arg; 207314bdbaf2SConrad Meyer structsize = sizeof(struct kinfo_file); 2074f1fca82eSMikolaj Golub if (sb == NULL) { 2075f1fca82eSMikolaj Golub size = 0; 2076f1fca82eSMikolaj Golub sb = sbuf_new(NULL, NULL, 128, SBUF_FIXEDLEN); 2077f1fca82eSMikolaj Golub sbuf_set_drain(sb, sbuf_drain_count, &size); 2078f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2079f1fca82eSMikolaj Golub PROC_LOCK(p); 208014bdbaf2SConrad Meyer kern_proc_filedesc_out(p, sb, -1, filedesc_flags); 2081f1fca82eSMikolaj Golub sbuf_finish(sb); 2082f1fca82eSMikolaj Golub 
sbuf_delete(sb); 2083f1fca82eSMikolaj Golub *sizep = size; 2084f1fca82eSMikolaj Golub } else { 208514bdbaf2SConrad Meyer sbuf_start_section(sb, &start_len); 208614bdbaf2SConrad Meyer 2087f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2088f1fca82eSMikolaj Golub PROC_LOCK(p); 208914bdbaf2SConrad Meyer kern_proc_filedesc_out(p, sb, *sizep - sizeof(structsize), 209014bdbaf2SConrad Meyer filedesc_flags); 209114bdbaf2SConrad Meyer 209214bdbaf2SConrad Meyer sect_len = sbuf_end_section(sb, start_len, 0, 0); 209314bdbaf2SConrad Meyer if (sect_len < 0) 209414bdbaf2SConrad Meyer return; 209514bdbaf2SConrad Meyer sect_sz = sect_len; 209614bdbaf2SConrad Meyer 209714bdbaf2SConrad Meyer KASSERT(sect_sz <= *sizep, 209814bdbaf2SConrad Meyer ("kern_proc_filedesc_out did not respect maxlen; " 209914bdbaf2SConrad Meyer "requested %zu, got %zu", *sizep - sizeof(structsize), 210014bdbaf2SConrad Meyer sect_sz - sizeof(structsize))); 210114bdbaf2SConrad Meyer 210214bdbaf2SConrad Meyer for (i = 0; i < *sizep - sect_sz && sb->s_error == 0; i++) 210314bdbaf2SConrad Meyer sbuf_putc(sb, 0); 2104f1fca82eSMikolaj Golub } 2105f1fca82eSMikolaj Golub } 2106f1fca82eSMikolaj Golub 2107f1fca82eSMikolaj Golub #ifdef KINFO_VMENTRY_SIZE 2108f1fca82eSMikolaj Golub CTASSERT(sizeof(struct kinfo_vmentry) == KINFO_VMENTRY_SIZE); 2109f1fca82eSMikolaj Golub #endif 2110f1fca82eSMikolaj Golub 2111f1fca82eSMikolaj Golub static void 2112f1fca82eSMikolaj Golub note_procstat_vmmap(void *arg, struct sbuf *sb, size_t *sizep) 2113f1fca82eSMikolaj Golub { 2114f1fca82eSMikolaj Golub struct proc *p; 2115f1fca82eSMikolaj Golub size_t size; 2116e6b95927SConrad Meyer int structsize, vmmap_flags; 2117e6b95927SConrad Meyer 2118e6b95927SConrad Meyer if (coredump_pack_vmmapinfo) 2119e6b95927SConrad Meyer vmmap_flags = KERN_VMMAP_PACK_KINFO; 2120e6b95927SConrad Meyer else 2121e6b95927SConrad Meyer vmmap_flags = 0; 2122f1fca82eSMikolaj Golub 2123f1fca82eSMikolaj Golub p = (struct proc *)arg; 
2124e6b95927SConrad Meyer structsize = sizeof(struct kinfo_vmentry); 2125f1fca82eSMikolaj Golub if (sb == NULL) { 2126f1fca82eSMikolaj Golub size = 0; 2127f1fca82eSMikolaj Golub sb = sbuf_new(NULL, NULL, 128, SBUF_FIXEDLEN); 2128f1fca82eSMikolaj Golub sbuf_set_drain(sb, sbuf_drain_count, &size); 2129f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2130f1fca82eSMikolaj Golub PROC_LOCK(p); 2131e6b95927SConrad Meyer kern_proc_vmmap_out(p, sb, -1, vmmap_flags); 2132f1fca82eSMikolaj Golub sbuf_finish(sb); 2133f1fca82eSMikolaj Golub sbuf_delete(sb); 2134f1fca82eSMikolaj Golub *sizep = size; 2135f1fca82eSMikolaj Golub } else { 2136f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2137f1fca82eSMikolaj Golub PROC_LOCK(p); 2138e6b95927SConrad Meyer kern_proc_vmmap_out(p, sb, *sizep - sizeof(structsize), 2139e6b95927SConrad Meyer vmmap_flags); 2140f1fca82eSMikolaj Golub } 2141f1fca82eSMikolaj Golub } 2142f1fca82eSMikolaj Golub 2143f1fca82eSMikolaj Golub static void 2144f1fca82eSMikolaj Golub note_procstat_groups(void *arg, struct sbuf *sb, size_t *sizep) 2145f1fca82eSMikolaj Golub { 2146f1fca82eSMikolaj Golub struct proc *p; 2147f1fca82eSMikolaj Golub size_t size; 2148f1fca82eSMikolaj Golub int structsize; 2149f1fca82eSMikolaj Golub 2150f1fca82eSMikolaj Golub p = (struct proc *)arg; 2151f1fca82eSMikolaj Golub size = sizeof(structsize) + p->p_ucred->cr_ngroups * sizeof(gid_t); 2152f1fca82eSMikolaj Golub if (sb != NULL) { 2153f1fca82eSMikolaj Golub KASSERT(*sizep == size, ("invalid size")); 2154f1fca82eSMikolaj Golub structsize = sizeof(gid_t); 2155f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2156f1fca82eSMikolaj Golub sbuf_bcat(sb, p->p_ucred->cr_groups, p->p_ucred->cr_ngroups * 2157f1fca82eSMikolaj Golub sizeof(gid_t)); 2158f1fca82eSMikolaj Golub } 2159f1fca82eSMikolaj Golub *sizep = size; 2160f1fca82eSMikolaj Golub } 2161f1fca82eSMikolaj Golub 2162f1fca82eSMikolaj Golub static void 2163f1fca82eSMikolaj 
Golub note_procstat_umask(void *arg, struct sbuf *sb, size_t *sizep) 2164f1fca82eSMikolaj Golub { 2165f1fca82eSMikolaj Golub struct proc *p; 2166f1fca82eSMikolaj Golub size_t size; 2167f1fca82eSMikolaj Golub int structsize; 2168f1fca82eSMikolaj Golub 2169f1fca82eSMikolaj Golub p = (struct proc *)arg; 2170f1fca82eSMikolaj Golub size = sizeof(structsize) + sizeof(p->p_fd->fd_cmask); 2171f1fca82eSMikolaj Golub if (sb != NULL) { 2172f1fca82eSMikolaj Golub KASSERT(*sizep == size, ("invalid size")); 2173f1fca82eSMikolaj Golub structsize = sizeof(p->p_fd->fd_cmask); 2174f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2175f1fca82eSMikolaj Golub sbuf_bcat(sb, &p->p_fd->fd_cmask, sizeof(p->p_fd->fd_cmask)); 2176f1fca82eSMikolaj Golub } 2177f1fca82eSMikolaj Golub *sizep = size; 2178f1fca82eSMikolaj Golub } 2179f1fca82eSMikolaj Golub 2180f1fca82eSMikolaj Golub static void 2181f1fca82eSMikolaj Golub note_procstat_rlimit(void *arg, struct sbuf *sb, size_t *sizep) 2182f1fca82eSMikolaj Golub { 2183f1fca82eSMikolaj Golub struct proc *p; 2184f1fca82eSMikolaj Golub struct rlimit rlim[RLIM_NLIMITS]; 2185f1fca82eSMikolaj Golub size_t size; 2186f1fca82eSMikolaj Golub int structsize, i; 2187f1fca82eSMikolaj Golub 2188f1fca82eSMikolaj Golub p = (struct proc *)arg; 2189f1fca82eSMikolaj Golub size = sizeof(structsize) + sizeof(rlim); 2190f1fca82eSMikolaj Golub if (sb != NULL) { 2191f1fca82eSMikolaj Golub KASSERT(*sizep == size, ("invalid size")); 2192f1fca82eSMikolaj Golub structsize = sizeof(rlim); 2193f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2194f1fca82eSMikolaj Golub PROC_LOCK(p); 2195f1fca82eSMikolaj Golub for (i = 0; i < RLIM_NLIMITS; i++) 2196f6f6d240SMateusz Guzik lim_rlimit_proc(p, i, &rlim[i]); 2197f1fca82eSMikolaj Golub PROC_UNLOCK(p); 2198f1fca82eSMikolaj Golub sbuf_bcat(sb, rlim, sizeof(rlim)); 2199f1fca82eSMikolaj Golub } 2200f1fca82eSMikolaj Golub *sizep = size; 2201f1fca82eSMikolaj Golub } 2202f1fca82eSMikolaj Golub 
2203f1fca82eSMikolaj Golub static void 2204f1fca82eSMikolaj Golub note_procstat_osrel(void *arg, struct sbuf *sb, size_t *sizep) 2205f1fca82eSMikolaj Golub { 2206f1fca82eSMikolaj Golub struct proc *p; 2207f1fca82eSMikolaj Golub size_t size; 2208f1fca82eSMikolaj Golub int structsize; 2209f1fca82eSMikolaj Golub 2210f1fca82eSMikolaj Golub p = (struct proc *)arg; 2211f1fca82eSMikolaj Golub size = sizeof(structsize) + sizeof(p->p_osrel); 2212f1fca82eSMikolaj Golub if (sb != NULL) { 2213f1fca82eSMikolaj Golub KASSERT(*sizep == size, ("invalid size")); 2214f1fca82eSMikolaj Golub structsize = sizeof(p->p_osrel); 2215f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2216f1fca82eSMikolaj Golub sbuf_bcat(sb, &p->p_osrel, sizeof(p->p_osrel)); 2217f1fca82eSMikolaj Golub } 2218f1fca82eSMikolaj Golub *sizep = size; 2219f1fca82eSMikolaj Golub } 2220f1fca82eSMikolaj Golub 2221f1fca82eSMikolaj Golub static void 2222f1fca82eSMikolaj Golub __elfN(note_procstat_psstrings)(void *arg, struct sbuf *sb, size_t *sizep) 2223f1fca82eSMikolaj Golub { 2224f1fca82eSMikolaj Golub struct proc *p; 2225f1fca82eSMikolaj Golub elf_ps_strings_t ps_strings; 2226f1fca82eSMikolaj Golub size_t size; 2227f1fca82eSMikolaj Golub int structsize; 2228f1fca82eSMikolaj Golub 2229f1fca82eSMikolaj Golub p = (struct proc *)arg; 2230f1fca82eSMikolaj Golub size = sizeof(structsize) + sizeof(ps_strings); 2231f1fca82eSMikolaj Golub if (sb != NULL) { 2232f1fca82eSMikolaj Golub KASSERT(*sizep == size, ("invalid size")); 2233f1fca82eSMikolaj Golub structsize = sizeof(ps_strings); 2234f1fca82eSMikolaj Golub #if defined(COMPAT_FREEBSD32) && __ELF_WORD_SIZE == 32 2235f1fca82eSMikolaj Golub ps_strings = PTROUT(p->p_sysent->sv_psstrings); 2236f1fca82eSMikolaj Golub #else 2237f1fca82eSMikolaj Golub ps_strings = p->p_sysent->sv_psstrings; 2238f1fca82eSMikolaj Golub #endif 2239f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2240f1fca82eSMikolaj Golub sbuf_bcat(sb, &ps_strings, 
sizeof(ps_strings)); 2241f1fca82eSMikolaj Golub } 2242f1fca82eSMikolaj Golub *sizep = size; 2243f1fca82eSMikolaj Golub } 2244f1fca82eSMikolaj Golub 2245f1fca82eSMikolaj Golub static void 2246f1fca82eSMikolaj Golub __elfN(note_procstat_auxv)(void *arg, struct sbuf *sb, size_t *sizep) 2247f1fca82eSMikolaj Golub { 2248f1fca82eSMikolaj Golub struct proc *p; 2249f1fca82eSMikolaj Golub size_t size; 2250f1fca82eSMikolaj Golub int structsize; 2251f1fca82eSMikolaj Golub 2252f1fca82eSMikolaj Golub p = (struct proc *)arg; 2253f1fca82eSMikolaj Golub if (sb == NULL) { 2254f1fca82eSMikolaj Golub size = 0; 2255f1fca82eSMikolaj Golub sb = sbuf_new(NULL, NULL, 128, SBUF_FIXEDLEN); 2256f1fca82eSMikolaj Golub sbuf_set_drain(sb, sbuf_drain_count, &size); 2257f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2258f1fca82eSMikolaj Golub PHOLD(p); 2259f1fca82eSMikolaj Golub proc_getauxv(curthread, p, sb); 2260f1fca82eSMikolaj Golub PRELE(p); 2261f1fca82eSMikolaj Golub sbuf_finish(sb); 2262f1fca82eSMikolaj Golub sbuf_delete(sb); 2263f1fca82eSMikolaj Golub *sizep = size; 2264f1fca82eSMikolaj Golub } else { 2265f1fca82eSMikolaj Golub structsize = sizeof(Elf_Auxinfo); 2266f1fca82eSMikolaj Golub sbuf_bcat(sb, &structsize, sizeof(structsize)); 2267f1fca82eSMikolaj Golub PHOLD(p); 2268f1fca82eSMikolaj Golub proc_getauxv(curthread, p, sb); 2269f1fca82eSMikolaj Golub PRELE(p); 2270f1fca82eSMikolaj Golub } 2271f1fca82eSMikolaj Golub } 2272f1fca82eSMikolaj Golub 227332c01de2SDmitry Chagin static boolean_t 22741a9c7decSKonstantin Belousov __elfN(parse_notes)(struct image_params *imgp, Elf_Brandnote *checknote, 22751a9c7decSKonstantin Belousov int32_t *osrel, const Elf_Phdr *pnote) 227632c01de2SDmitry Chagin { 2277267c52fcSKonstantin Belousov const Elf_Note *note, *note0, *note_end; 227832c01de2SDmitry Chagin const char *note_name; 22796c775eb6SKonstantin Belousov char *buf; 22806c775eb6SKonstantin Belousov int i, error; 22816c775eb6SKonstantin Belousov boolean_t res; 
228232c01de2SDmitry Chagin 22836c775eb6SKonstantin Belousov /* We need some limit, might as well use PAGE_SIZE. */ 22846c775eb6SKonstantin Belousov if (pnote == NULL || pnote->p_filesz > PAGE_SIZE) 228532c01de2SDmitry Chagin return (FALSE); 22866c775eb6SKonstantin Belousov ASSERT_VOP_LOCKED(imgp->vp, "parse_notes"); 22876c775eb6SKonstantin Belousov if (pnote->p_offset > PAGE_SIZE || 22886c775eb6SKonstantin Belousov pnote->p_filesz > PAGE_SIZE - pnote->p_offset) { 22896c775eb6SKonstantin Belousov VOP_UNLOCK(imgp->vp, 0); 22906c775eb6SKonstantin Belousov buf = malloc(pnote->p_filesz, M_TEMP, M_WAITOK); 22916c775eb6SKonstantin Belousov vn_lock(imgp->vp, LK_EXCLUSIVE | LK_RETRY); 22926c775eb6SKonstantin Belousov error = vn_rdwr(UIO_READ, imgp->vp, buf, pnote->p_filesz, 22936c775eb6SKonstantin Belousov pnote->p_offset, UIO_SYSSPACE, IO_NODELOCKED, 22946c775eb6SKonstantin Belousov curthread->td_ucred, NOCRED, NULL, curthread); 22956c775eb6SKonstantin Belousov if (error != 0) { 22966c775eb6SKonstantin Belousov uprintf("i/o error PT_NOTE\n"); 22976c775eb6SKonstantin Belousov res = FALSE; 22986c775eb6SKonstantin Belousov goto ret; 22996c775eb6SKonstantin Belousov } 23006c775eb6SKonstantin Belousov note = note0 = (const Elf_Note *)buf; 23016c775eb6SKonstantin Belousov note_end = (const Elf_Note *)(buf + pnote->p_filesz); 23026c775eb6SKonstantin Belousov } else { 23036c775eb6SKonstantin Belousov note = note0 = (const Elf_Note *)(imgp->image_header + 23046c775eb6SKonstantin Belousov pnote->p_offset); 230532c01de2SDmitry Chagin note_end = (const Elf_Note *)(imgp->image_header + 230632c01de2SDmitry Chagin pnote->p_offset + pnote->p_filesz); 23076c775eb6SKonstantin Belousov buf = NULL; 23086c775eb6SKonstantin Belousov } 2309267c52fcSKonstantin Belousov for (i = 0; i < 100 && note >= note0 && note < note_end; i++) { 2310d1ae5c83SKonstantin Belousov if (!aligned(note, Elf32_Addr) || (const char *)note_end - 23116c775eb6SKonstantin Belousov (const char *)note < sizeof(Elf_Note)) { 
23126c775eb6SKonstantin Belousov res = FALSE; 23136c775eb6SKonstantin Belousov goto ret; 23146c775eb6SKonstantin Belousov } 231532c01de2SDmitry Chagin if (note->n_namesz != checknote->hdr.n_namesz || 231632c01de2SDmitry Chagin note->n_descsz != checknote->hdr.n_descsz || 231732c01de2SDmitry Chagin note->n_type != checknote->hdr.n_type) 231832c01de2SDmitry Chagin goto nextnote; 231932c01de2SDmitry Chagin note_name = (const char *)(note + 1); 2320d1ae5c83SKonstantin Belousov if (note_name + checknote->hdr.n_namesz >= 2321d1ae5c83SKonstantin Belousov (const char *)note_end || strncmp(checknote->vendor, 2322d1ae5c83SKonstantin Belousov note_name, checknote->hdr.n_namesz) != 0) 232332c01de2SDmitry Chagin goto nextnote; 232432c01de2SDmitry Chagin 232532c01de2SDmitry Chagin /* 232632c01de2SDmitry Chagin * Fetch the osreldate for binary 232732c01de2SDmitry Chagin * from the ELF OSABI-note if necessary. 232832c01de2SDmitry Chagin */ 232989ffc202SBjoern A. Zeeb if ((checknote->flags & BN_TRANSLATE_OSREL) != 0 && 23306c775eb6SKonstantin Belousov checknote->trans_osrel != NULL) { 23316c775eb6SKonstantin Belousov res = checknote->trans_osrel(note, osrel); 23326c775eb6SKonstantin Belousov goto ret; 23336c775eb6SKonstantin Belousov } 23346c775eb6SKonstantin Belousov res = TRUE; 23356c775eb6SKonstantin Belousov goto ret; 233632c01de2SDmitry Chagin nextnote: 233732c01de2SDmitry Chagin note = (const Elf_Note *)((const char *)(note + 1) + 23381b8388cdSMikolaj Golub roundup2(note->n_namesz, ELF_NOTE_ROUNDSIZE) + 23391b8388cdSMikolaj Golub roundup2(note->n_descsz, ELF_NOTE_ROUNDSIZE)); 234032c01de2SDmitry Chagin } 23416c775eb6SKonstantin Belousov res = FALSE; 23426c775eb6SKonstantin Belousov ret: 23436c775eb6SKonstantin Belousov free(buf, M_TEMP); 23446c775eb6SKonstantin Belousov return (res); 234532c01de2SDmitry Chagin } 234632c01de2SDmitry Chagin 234732c01de2SDmitry Chagin /* 23481a9c7decSKonstantin Belousov * Try to find the appropriate ABI-note section for checknote, 
23491a9c7decSKonstantin Belousov * fetch the osreldate for binary from the ELF OSABI-note. Only the 23501a9c7decSKonstantin Belousov * first page of the image is searched, the same as for headers. 23511a9c7decSKonstantin Belousov */ 23521a9c7decSKonstantin Belousov static boolean_t 23531a9c7decSKonstantin Belousov __elfN(check_note)(struct image_params *imgp, Elf_Brandnote *checknote, 23541a9c7decSKonstantin Belousov int32_t *osrel) 23551a9c7decSKonstantin Belousov { 23561a9c7decSKonstantin Belousov const Elf_Phdr *phdr; 23571a9c7decSKonstantin Belousov const Elf_Ehdr *hdr; 23581a9c7decSKonstantin Belousov int i; 23591a9c7decSKonstantin Belousov 23601a9c7decSKonstantin Belousov hdr = (const Elf_Ehdr *)imgp->image_header; 23611a9c7decSKonstantin Belousov phdr = (const Elf_Phdr *)(imgp->image_header + hdr->e_phoff); 23621a9c7decSKonstantin Belousov 23631a9c7decSKonstantin Belousov for (i = 0; i < hdr->e_phnum; i++) { 23641a9c7decSKonstantin Belousov if (phdr[i].p_type == PT_NOTE && 23651a9c7decSKonstantin Belousov __elfN(parse_notes)(imgp, checknote, osrel, &phdr[i])) 23661a9c7decSKonstantin Belousov return (TRUE); 23671a9c7decSKonstantin Belousov } 23681a9c7decSKonstantin Belousov return (FALSE); 23691a9c7decSKonstantin Belousov 23701a9c7decSKonstantin Belousov } 23711a9c7decSKonstantin Belousov 23721a9c7decSKonstantin Belousov /* 2373e1743d02SSøren Schmidt * Tell kern_execve.c about it, with a little help from the linker. 
2374e1743d02SSøren Schmidt */ 2375a360a43dSJake Burkholder static struct execsw __elfN(execsw) = { 2376a360a43dSJake Burkholder __CONCAT(exec_, __elfN(imgact)), 2377a360a43dSJake Burkholder __XSTRING(__CONCAT(ELF, __ELF_WORD_SIZE)) 2378a360a43dSJake Burkholder }; 2379a360a43dSJake Burkholder EXEC_SET(__CONCAT(elf, __ELF_WORD_SIZE), __elfN(execsw)); 2380e7228204SAlfred Perlstein 2381ed167eaaSKonstantin Belousov static vm_prot_t 2382ed167eaaSKonstantin Belousov __elfN(trans_prot)(Elf_Word flags) 2383ed167eaaSKonstantin Belousov { 2384ed167eaaSKonstantin Belousov vm_prot_t prot; 2385ed167eaaSKonstantin Belousov 2386ed167eaaSKonstantin Belousov prot = 0; 2387ed167eaaSKonstantin Belousov if (flags & PF_X) 2388ed167eaaSKonstantin Belousov prot |= VM_PROT_EXECUTE; 2389ed167eaaSKonstantin Belousov if (flags & PF_W) 2390ed167eaaSKonstantin Belousov prot |= VM_PROT_WRITE; 2391ed167eaaSKonstantin Belousov if (flags & PF_R) 2392ed167eaaSKonstantin Belousov prot |= VM_PROT_READ; 2393676eda08SMarcel Moolenaar #if __ELF_WORD_SIZE == 32 2394e7d939bdSMarcel Moolenaar #if defined(__amd64__) 2395126b36a2SKonstantin Belousov if (i386_read_exec && (flags & PF_R)) 2396676eda08SMarcel Moolenaar prot |= VM_PROT_EXECUTE; 2397676eda08SMarcel Moolenaar #endif 2398676eda08SMarcel Moolenaar #endif 2399ed167eaaSKonstantin Belousov return (prot); 2400ed167eaaSKonstantin Belousov } 2401ed167eaaSKonstantin Belousov 2402ed167eaaSKonstantin Belousov static Elf_Word 2403ed167eaaSKonstantin Belousov __elfN(untrans_prot)(vm_prot_t prot) 2404ed167eaaSKonstantin Belousov { 2405ed167eaaSKonstantin Belousov Elf_Word flags; 2406ed167eaaSKonstantin Belousov 2407ed167eaaSKonstantin Belousov flags = 0; 2408ed167eaaSKonstantin Belousov if (prot & VM_PROT_EXECUTE) 2409ed167eaaSKonstantin Belousov flags |= PF_X; 2410ed167eaaSKonstantin Belousov if (prot & VM_PROT_READ) 2411ed167eaaSKonstantin Belousov flags |= PF_R; 2412ed167eaaSKonstantin Belousov if (prot & VM_PROT_WRITE) 2413ed167eaaSKonstantin Belousov flags 
|= PF_W; 2414ed167eaaSKonstantin Belousov return (flags); 2415ed167eaaSKonstantin Belousov } 2416