126f9a767SRodney W. Grimes /* 226f9a767SRodney W. Grimes * Copyright (c) 1993, David Greenman 326f9a767SRodney W. Grimes * All rights reserved. 4df8bae1dSRodney W. Grimes * 5df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 6df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 7df8bae1dSRodney W. Grimes * are met: 8df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 9df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 10df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 12df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 13df8bae1dSRodney W. Grimes * 1426f9a767SRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 15df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 16df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 1726f9a767SRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 18df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 19df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 20df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 21df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 22df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 23df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 24df8bae1dSRodney W. Grimes * SUCH DAMAGE. 25df8bae1dSRodney W. Grimes */ 26df8bae1dSRodney W. Grimes 27677b542eSDavid E. O'Brien #include <sys/cdefs.h> 28677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 29677b542eSDavid E. O'Brien 301e9b3d91SPeter Wemm #include "opt_ktrace.h" 31339b79b9SRobert Watson #include "opt_mac.h" 321e9b3d91SPeter Wemm 33df8bae1dSRodney W. Grimes #include <sys/param.h> 3426f9a767SRodney W. Grimes #include <sys/systm.h> 3575b8b3b2SJohn Baldwin #include <sys/eventhandler.h> 36fb919e4dSMark Murray #include <sys/lock.h> 37fb919e4dSMark Murray #include <sys/mutex.h> 38d2d3e875SBruce Evans #include <sys/sysproto.h> 3926f9a767SRodney W. Grimes #include <sys/signalvar.h> 4026f9a767SRodney W. Grimes #include <sys/kernel.h> 41339b79b9SRobert Watson #include <sys/mac.h> 4226f9a767SRodney W. Grimes #include <sys/mount.h> 43797f2d22SPoul-Henning Kamp #include <sys/filedesc.h> 44079cc25bSDavid Greenman #include <sys/fcntl.h> 4526f9a767SRodney W. Grimes #include <sys/acct.h> 4626f9a767SRodney W. Grimes #include <sys/exec.h> 4726f9a767SRodney W. Grimes #include <sys/imgact.h> 48e1743d02SSøren Schmidt #include <sys/imgact_elf.h> 4926f9a767SRodney W. Grimes #include <sys/wait.h> 50333ea485SGuido van Rooij #include <sys/malloc.h> 51a794e791SBruce Evans #include <sys/proc.h> 522a024a2bSSean Eric Fagan #include <sys/pioctl.h> 53a794e791SBruce Evans #include <sys/namei.h> 5459c8bc40SAlan Cox #include <sys/sf_buf.h> 551e1e0b44SSøren Schmidt #include <sys/sysent.h> 56797f2d22SPoul-Henning Kamp #include <sys/shm.h> 5799ac3bc8SPeter Wemm #include <sys/sysctl.h> 58333ea485SGuido van Rooij #include <sys/user.h> 59a794e791SBruce Evans #include <sys/vnode.h> 60c781aea8SPeter Wemm #ifdef KTRACE 61c781aea8SPeter Wemm #include <sys/ktrace.h> 62c781aea8SPeter Wemm #endif 6326f9a767SRodney W. Grimes 6426f9a767SRodney W. Grimes #include <vm/vm.h> 65efeaf95aSDavid Greenman #include <vm/vm_param.h> 66efeaf95aSDavid Greenman #include <vm/pmap.h> 671616db3cSJohn Dyson #include <vm/vm_page.h> 68efeaf95aSDavid Greenman #include <vm/vm_map.h> 6926f9a767SRodney W. Grimes #include <vm/vm_kern.h> 70efeaf95aSDavid Greenman #include <vm/vm_extern.h> 711ebd0c59SDavid Greenman #include <vm/vm_object.h> 721616db3cSJohn Dyson #include <vm/vm_pager.h> 7326f9a767SRodney W. Grimes 7426f9a767SRodney W. Grimes #include <machine/reg.h> 7526f9a767SRodney W. Grimes 76b9df5231SPoul-Henning Kamp MALLOC_DEFINE(M_PARGS, "proc-args", "Process arguments"); 77b9df5231SPoul-Henning Kamp 7805ba50f5SJake Burkholder static int sysctl_kern_ps_strings(SYSCTL_HANDLER_ARGS); 7905ba50f5SJake Burkholder static int sysctl_kern_usrstack(SYSCTL_HANDLER_ARGS); 805dadd17bSJake Burkholder static int sysctl_kern_stackprot(SYSCTL_HANDLER_ARGS); 81450ffb44SRobert Watson static int kern_execve(struct thread *td, char *fname, char **argv, 82670cb89bSRobert Watson char **envv, struct mac *mac_p); 83906ac69dSDavid Xu static int do_execve(struct thread *td, char *fname, char **argv, 84906ac69dSDavid Xu char **envv, struct mac *mac_p); 8505ba50f5SJake Burkholder 869701cd40SJohn Baldwin /* XXX This should be vm_size_t. */ 8705ba50f5SJake Burkholder SYSCTL_PROC(_kern, KERN_PS_STRINGS, ps_strings, CTLTYPE_ULONG|CTLFLAG_RD, 8805ba50f5SJake Burkholder NULL, 0, sysctl_kern_ps_strings, "LU", ""); 89486bddb0SDoug Rabson 909701cd40SJohn Baldwin /* XXX This should be vm_size_t. */ 9105ba50f5SJake Burkholder SYSCTL_PROC(_kern, KERN_USRSTACK, usrstack, CTLTYPE_ULONG|CTLFLAG_RD, 9205ba50f5SJake Burkholder NULL, 0, sysctl_kern_usrstack, "LU", ""); 9399ac3bc8SPeter Wemm 945dadd17bSJake Burkholder SYSCTL_PROC(_kern, OID_AUTO, stackprot, CTLTYPE_INT|CTLFLAG_RD, 955dadd17bSJake Burkholder NULL, 0, sysctl_kern_stackprot, "I", ""); 965dadd17bSJake Burkholder 97b9df5231SPoul-Henning Kamp u_long ps_arg_cache_limit = PAGE_SIZE / 16; 98c3699b5fSPeter Wemm SYSCTL_ULONG(_kern, OID_AUTO, ps_arg_cache_limit, CTLFLAG_RW, 999701cd40SJohn Baldwin &ps_arg_cache_limit, 0, ""); 100b9df5231SPoul-Henning Kamp 10105ba50f5SJake Burkholder static int 10205ba50f5SJake Burkholder sysctl_kern_ps_strings(SYSCTL_HANDLER_ARGS) 10305ba50f5SJake Burkholder { 10405ba50f5SJake Burkholder struct proc *p; 105df7c361eSPeter Wemm int error; 10605ba50f5SJake Burkholder 10705ba50f5SJake Burkholder p = curproc; 108df7c361eSPeter Wemm #if defined(__amd64__) || defined(__ia64__) 109df7c361eSPeter Wemm if (req->oldlen == sizeof(unsigned int)) { 110df7c361eSPeter Wemm unsigned int val; 111df7c361eSPeter Wemm val = (unsigned int)p->p_sysent->sv_psstrings; 112df7c361eSPeter Wemm error = SYSCTL_OUT(req, &val, sizeof(val)); 113df7c361eSPeter Wemm } else 114df7c361eSPeter Wemm #endif 115df7c361eSPeter Wemm error = SYSCTL_OUT(req, &p->p_sysent->sv_psstrings, 116df7c361eSPeter Wemm sizeof(p->p_sysent->sv_psstrings)); 117df7c361eSPeter Wemm return error; 11805ba50f5SJake Burkholder } 11905ba50f5SJake Burkholder 12005ba50f5SJake Burkholder static int 12105ba50f5SJake Burkholder sysctl_kern_usrstack(SYSCTL_HANDLER_ARGS) 12205ba50f5SJake Burkholder { 12305ba50f5SJake Burkholder struct proc *p; 124df7c361eSPeter Wemm int error; 12505ba50f5SJake Burkholder 12605ba50f5SJake Burkholder p = curproc; 127df7c361eSPeter Wemm #if defined(__amd64__) || defined(__ia64__) 128df7c361eSPeter Wemm if (req->oldlen == sizeof(unsigned int)) { 129df7c361eSPeter Wemm unsigned int val; 130df7c361eSPeter Wemm val = (unsigned int)p->p_sysent->sv_usrstack; 131df7c361eSPeter Wemm error = SYSCTL_OUT(req, &val, sizeof(val)); 132df7c361eSPeter Wemm } else 133df7c361eSPeter Wemm #endif 134df7c361eSPeter Wemm error = SYSCTL_OUT(req, &p->p_sysent->sv_usrstack, 135df7c361eSPeter Wemm sizeof(p->p_sysent->sv_usrstack)); 136df7c361eSPeter Wemm return error; 13705ba50f5SJake Burkholder } 13805ba50f5SJake Burkholder 1395dadd17bSJake Burkholder static int 1405dadd17bSJake Burkholder sysctl_kern_stackprot(SYSCTL_HANDLER_ARGS) 1415dadd17bSJake Burkholder { 1425dadd17bSJake Burkholder struct proc *p; 1435dadd17bSJake Burkholder 1445dadd17bSJake Burkholder p = curproc; 1455dadd17bSJake Burkholder return (SYSCTL_OUT(req, &p->p_sysent->sv_stackprot, 1465dadd17bSJake Burkholder sizeof(p->p_sysent->sv_stackprot))); 1475dadd17bSJake Burkholder } 1485dadd17bSJake Burkholder 14999ac3bc8SPeter Wemm /* 150aa855a59SPeter Wemm * Each of the items is a pointer to a `const struct execsw', hence the 151aa855a59SPeter Wemm * double pointer here. 152df8bae1dSRodney W. Grimes */ 153aa855a59SPeter Wemm static const struct execsw **execsw; 15426f9a767SRodney W. Grimes 155ca46e90eSBruce Evans #ifndef _SYS_SYSPROTO_H_ 156ca46e90eSBruce Evans struct execve_args { 157ca46e90eSBruce Evans char *fname; 158ca46e90eSBruce Evans char **argv; 159ca46e90eSBruce Evans char **envv; 160ca46e90eSBruce Evans }; 161ca46e90eSBruce Evans #endif 162ca46e90eSBruce Evans 163ca46e90eSBruce Evans /* 164ca46e90eSBruce Evans * MPSAFE 165ca46e90eSBruce Evans */ 166ca46e90eSBruce Evans int 167ca46e90eSBruce Evans execve(td, uap) 168ca46e90eSBruce Evans struct thread *td; 169ca46e90eSBruce Evans struct execve_args /* { 170ca46e90eSBruce Evans char *fname; 171ca46e90eSBruce Evans char **argv; 172ca46e90eSBruce Evans char **envv; 173ca46e90eSBruce Evans } */ *uap; 174ca46e90eSBruce Evans { 175ca46e90eSBruce Evans 176ca46e90eSBruce Evans return (kern_execve(td, uap->fname, uap->argv, uap->envv, NULL)); 177ca46e90eSBruce Evans } 178ca46e90eSBruce Evans 179ca46e90eSBruce Evans #ifndef _SYS_SYSPROTO_H_ 180ca46e90eSBruce Evans struct __mac_execve_args { 181ca46e90eSBruce Evans char *fname; 182ca46e90eSBruce Evans char **argv; 183ca46e90eSBruce Evans char **envv; 184ca46e90eSBruce Evans struct mac *mac_p; 185ca46e90eSBruce Evans }; 186ca46e90eSBruce Evans #endif 187ca46e90eSBruce Evans 188ca46e90eSBruce Evans /* 189ca46e90eSBruce Evans * MPSAFE 190ca46e90eSBruce Evans */ 191ca46e90eSBruce Evans int 192ca46e90eSBruce Evans __mac_execve(td, uap) 193ca46e90eSBruce Evans struct thread *td; 194ca46e90eSBruce Evans struct __mac_execve_args /* { 195ca46e90eSBruce Evans char *fname; 196ca46e90eSBruce Evans char **argv; 197ca46e90eSBruce Evans char **envv; 198ca46e90eSBruce Evans struct mac *mac_p; 199ca46e90eSBruce Evans } */ *uap; 200ca46e90eSBruce Evans { 201ca46e90eSBruce Evans 202ca46e90eSBruce Evans #ifdef MAC 203ca46e90eSBruce Evans return (kern_execve(td, uap->fname, uap->argv, uap->envv, 204ca46e90eSBruce Evans uap->mac_p)); 205ca46e90eSBruce Evans #else 206ca46e90eSBruce Evans return (ENOSYS); 207ca46e90eSBruce Evans #endif 208ca46e90eSBruce Evans } 209ca46e90eSBruce Evans 210906ac69dSDavid Xu static int 211906ac69dSDavid Xu kern_execve(td, fname, argv, envv, mac_p) 212906ac69dSDavid Xu struct thread *td; 213906ac69dSDavid Xu char *fname; 214906ac69dSDavid Xu char **argv; 215906ac69dSDavid Xu char **envv; 216906ac69dSDavid Xu struct mac *mac_p; 217906ac69dSDavid Xu { 218906ac69dSDavid Xu struct proc *p = td->td_proc; 219906ac69dSDavid Xu int error; 220906ac69dSDavid Xu 221906ac69dSDavid Xu if (p->p_flag & P_HADTHREADS) { 222906ac69dSDavid Xu PROC_LOCK(p); 223906ac69dSDavid Xu if (thread_single(SINGLE_BOUNDARY)) { 224906ac69dSDavid Xu PROC_UNLOCK(p); 225906ac69dSDavid Xu return (ERESTART); /* Try again later. */ 226906ac69dSDavid Xu } 227906ac69dSDavid Xu PROC_UNLOCK(p); 228906ac69dSDavid Xu } 229906ac69dSDavid Xu 230906ac69dSDavid Xu error = do_execve(td, fname, argv, envv, mac_p); 231906ac69dSDavid Xu 232906ac69dSDavid Xu if (p->p_flag & P_HADTHREADS) { 233906ac69dSDavid Xu PROC_LOCK(p); 234906ac69dSDavid Xu /* 235906ac69dSDavid Xu * If success, we upgrade to SINGLE_EXIT state to 236906ac69dSDavid Xu * force other threads to suicide. 237906ac69dSDavid Xu */ 238906ac69dSDavid Xu if (error == 0) 239906ac69dSDavid Xu thread_single(SINGLE_EXIT); 240906ac69dSDavid Xu else 241906ac69dSDavid Xu thread_single_end(); 242906ac69dSDavid Xu PROC_UNLOCK(p); 243906ac69dSDavid Xu } 244906ac69dSDavid Xu 245906ac69dSDavid Xu return (error); 246906ac69dSDavid Xu } 247906ac69dSDavid Xu 24826f9a767SRodney W. Grimes /* 249450ffb44SRobert Watson * In-kernel implementation of execve(). All arguments are assumed to be 250450ffb44SRobert Watson * userspace pointers from the passed thread. 251116734c4SMatthew Dillon * 252116734c4SMatthew Dillon * MPSAFE 25326f9a767SRodney W. Grimes */ 254450ffb44SRobert Watson static int 255906ac69dSDavid Xu do_execve(td, fname, argv, envv, mac_p) 256b40ce416SJulian Elischer struct thread *td; 257450ffb44SRobert Watson char *fname; 258450ffb44SRobert Watson char **argv; 259450ffb44SRobert Watson char **envv; 260670cb89bSRobert Watson struct mac *mac_p; 261df8bae1dSRodney W. Grimes { 262b40ce416SJulian Elischer struct proc *p = td->td_proc; 26326f9a767SRodney W. Grimes struct nameidata nd, *ndp; 2649b3b1c5fSJohn Baldwin struct ucred *newcred = NULL, *oldcred; 2651419eacbSAlfred Perlstein struct uidinfo *euip; 266654f6be1SBruce Evans register_t *stack_base; 267bb56ec4aSPoul-Henning Kamp int error, len, i; 268c52007c2SDavid Greenman struct image_params image_params, *imgp; 26926f9a767SRodney W. Grimes struct vattr attr; 2704d77a549SAlfred Perlstein int (*img_first)(struct image_params *); 27169be5db9SAlfred Perlstein struct pargs *oldargs = NULL, *newargs = NULL; 27290af4afaSJohn Baldwin struct sigacts *oldsigacts, *newsigacts; 2736c84de02SJohn Baldwin #ifdef KTRACE 2746c84de02SJohn Baldwin struct vnode *tracevp = NULL; 275a5881ea5SJohn Baldwin struct ucred *tracecred = NULL; 2766c84de02SJohn Baldwin #endif 2776c84de02SJohn Baldwin struct vnode *textvp = NULL; 278d06c0d4dSRobert Watson int credential_changing; 279619eb6e5SJeff Roberson int textset; 280ccafe7ebSRobert Watson #ifdef MAC 281eca8a663SRobert Watson struct label *interplabel = NULL; 282eca8a663SRobert Watson int will_transition; 283ccafe7ebSRobert Watson #endif 28426f9a767SRodney W. Grimes 285c52007c2SDavid Greenman imgp = &image_params; 286df8bae1dSRodney W. Grimes 2879ca45e81SDag-Erling Smørgrav /* 2889ca45e81SDag-Erling Smørgrav * Lock the process and set the P_INEXEC flag to indicate that 2899ca45e81SDag-Erling Smørgrav * it should be left alone until we're done here. This is 2909ca45e81SDag-Erling Smørgrav * necessary to avoid race conditions - e.g. in ptrace() - 2919ca45e81SDag-Erling Smørgrav * that might allow a local user to illicitly obtain elevated 2929ca45e81SDag-Erling Smørgrav * privileges. 2939ca45e81SDag-Erling Smørgrav */ 2949ca45e81SDag-Erling Smørgrav PROC_LOCK(p); 2959ca45e81SDag-Erling Smørgrav KASSERT((p->p_flag & P_INEXEC) == 0, 29691f91617SDavid E. O'Brien ("%s(): process already has P_INEXEC flag", __func__)); 2979ca45e81SDag-Erling Smørgrav p->p_flag |= P_INEXEC; 2989ca45e81SDag-Erling Smørgrav PROC_UNLOCK(p); 2999ca45e81SDag-Erling Smørgrav 300df8bae1dSRodney W. Grimes /* 301c52007c2SDavid Greenman * Initialize part of the common data 302df8bae1dSRodney W. Grimes */ 303c52007c2SDavid Greenman imgp->proc = p; 304450ffb44SRobert Watson imgp->userspace_argv = argv; 305450ffb44SRobert Watson imgp->userspace_envv = envv; 306670cb89bSRobert Watson imgp->execlabel = NULL; 307c52007c2SDavid Greenman imgp->attr = &attr; 308c52007c2SDavid Greenman imgp->argc = imgp->envc = 0; 3095cf3d12cSAndrey A. Chernov imgp->argv0 = NULL; 310c52007c2SDavid Greenman imgp->entry_addr = 0; 311c52007c2SDavid Greenman imgp->vmspace_destroyed = 0; 312c52007c2SDavid Greenman imgp->interpreted = 0; 313c52007c2SDavid Greenman imgp->interpreter_name[0] = '\0'; 314e1743d02SSøren Schmidt imgp->auxargs = NULL; 3151616db3cSJohn Dyson imgp->vp = NULL; 3160b2ed1aeSJeff Roberson imgp->object = NULL; 3171616db3cSJohn Dyson imgp->firstpage = NULL; 3184fe88fe6SJohn Polstra imgp->ps_strings = 0; 319b9a22da4STakanori Watanabe imgp->auxarg_size = 0; 32026f9a767SRodney W. Grimes 321670cb89bSRobert Watson #ifdef MAC 322eca8a663SRobert Watson error = mac_execve_enter(imgp, mac_p); 323670cb89bSRobert Watson if (error) { 324670cb89bSRobert Watson mtx_lock(&Giant); 325670cb89bSRobert Watson goto exec_fail; 326670cb89bSRobert Watson } 327670cb89bSRobert Watson #endif 328670cb89bSRobert Watson 32926f9a767SRodney W. Grimes /* 33026f9a767SRodney W. Grimes * Allocate temporary demand zeroed space for argument and 33126f9a767SRodney W. Grimes * environment strings 33226f9a767SRodney W. Grimes */ 33359c8bc40SAlan Cox imgp->stringbase = (char *)kmem_alloc_wait(exec_map, ARG_MAX); 334c2f9f36bSDavid Greenman if (imgp->stringbase == NULL) { 33526f9a767SRodney W. Grimes error = ENOMEM; 336b3afd20dSAlan Cox mtx_lock(&Giant); 33726f9a767SRodney W. Grimes goto exec_fail; 33826f9a767SRodney W. Grimes } 339c52007c2SDavid Greenman imgp->stringp = imgp->stringbase; 340c52007c2SDavid Greenman imgp->stringspace = ARG_MAX; 34159c8bc40SAlan Cox imgp->image_header = NULL; 34226f9a767SRodney W. Grimes 34326f9a767SRodney W. Grimes /* 34426f9a767SRodney W. Grimes * Translate the file name. namei() returns a vnode pointer 34526f9a767SRodney W. Grimes * in ni_vp amoung other things. 34626f9a767SRodney W. Grimes */ 34726f9a767SRodney W. Grimes ndp = &nd; 348b35ba931SDavid Greenman NDINIT(ndp, LOOKUP, LOCKLEAF | FOLLOW | SAVENAME, 349450ffb44SRobert Watson UIO_USERSPACE, fname, td); 35026f9a767SRodney W. Grimes 351b3afd20dSAlan Cox mtx_lock(&Giant); 35226f9a767SRodney W. Grimes interpret: 35326f9a767SRodney W. Grimes 35426f9a767SRodney W. Grimes error = namei(ndp); 35526f9a767SRodney W. Grimes if (error) { 3561616db3cSJohn Dyson kmem_free_wakeup(exec_map, (vm_offset_t)imgp->stringbase, 35759c8bc40SAlan Cox ARG_MAX); 35826f9a767SRodney W. Grimes goto exec_fail; 35926f9a767SRodney W. Grimes } 36026f9a767SRodney W. Grimes 361c52007c2SDavid Greenman imgp->vp = ndp->ni_vp; 362450ffb44SRobert Watson imgp->fname = fname; 36326f9a767SRodney W. Grimes 36426f9a767SRodney W. Grimes /* 3659022e4adSDavid Greenman * Check file permissions (also 'opens' file) 3669022e4adSDavid Greenman */ 367c52007c2SDavid Greenman error = exec_check_permissions(imgp); 368619eb6e5SJeff Roberson if (error) 36926f9a767SRodney W. Grimes goto exec_fail_dealloc; 370619eb6e5SJeff Roberson 371619eb6e5SJeff Roberson if (VOP_GETVOBJECT(imgp->vp, &imgp->object) == 0) 3720b2ed1aeSJeff Roberson vm_object_reference(imgp->object); 37326f9a767SRodney W. Grimes 374619eb6e5SJeff Roberson /* 375619eb6e5SJeff Roberson * Set VV_TEXT now so no one can write to the executable while we're 376619eb6e5SJeff Roberson * activating it. 377619eb6e5SJeff Roberson * 378619eb6e5SJeff Roberson * Remember if this was set before and unset it in case this is not 379619eb6e5SJeff Roberson * actually an executable image. 380619eb6e5SJeff Roberson */ 381619eb6e5SJeff Roberson textset = imgp->vp->v_vflag & VV_TEXT; 382619eb6e5SJeff Roberson imgp->vp->v_vflag |= VV_TEXT; 383619eb6e5SJeff Roberson 3841616db3cSJohn Dyson error = exec_map_first_page(imgp); 3856d5a0a8cSDavid Greenman if (error) 38626f9a767SRodney W. Grimes goto exec_fail_dealloc; 38726f9a767SRodney W. Grimes 38826f9a767SRodney W. Grimes /* 389d323ddf3SMatthew Dillon * If the current process has a special image activator it 390d323ddf3SMatthew Dillon * wants to try first, call it. For example, emulating shell 391d323ddf3SMatthew Dillon * scripts differently. 39226f9a767SRodney W. Grimes */ 393d323ddf3SMatthew Dillon error = -1; 394d323ddf3SMatthew Dillon if ((img_first = imgp->proc->p_sysent->sv_imgact_try) != NULL) 395d323ddf3SMatthew Dillon error = img_first(imgp); 396d323ddf3SMatthew Dillon 397d323ddf3SMatthew Dillon /* 398d323ddf3SMatthew Dillon * Loop through the list of image activators, calling each one. 399d323ddf3SMatthew Dillon * An activator returns -1 if there is no match, 0 on success, 400d323ddf3SMatthew Dillon * and an error otherwise. 401d323ddf3SMatthew Dillon */ 402d323ddf3SMatthew Dillon for (i = 0; error == -1 && execsw[i]; ++i) { 403d323ddf3SMatthew Dillon if (execsw[i]->ex_imgact == NULL || 404d323ddf3SMatthew Dillon execsw[i]->ex_imgact == img_first) { 405d323ddf3SMatthew Dillon continue; 406d323ddf3SMatthew Dillon } 407c52007c2SDavid Greenman error = (*execsw[i]->ex_imgact)(imgp); 408d323ddf3SMatthew Dillon } 409d323ddf3SMatthew Dillon 410d323ddf3SMatthew Dillon if (error) { 411619eb6e5SJeff Roberson if (error == -1) { 412619eb6e5SJeff Roberson if (textset == 0) 413619eb6e5SJeff Roberson imgp->vp->v_vflag &= ~VV_TEXT; 414d323ddf3SMatthew Dillon error = ENOEXEC; 415619eb6e5SJeff Roberson } 41626f9a767SRodney W. Grimes goto exec_fail_dealloc; 417d323ddf3SMatthew Dillon } 418d323ddf3SMatthew Dillon 419d323ddf3SMatthew Dillon /* 420d323ddf3SMatthew Dillon * Special interpreter operation, cleanup and loop up to try to 421d323ddf3SMatthew Dillon * activate the interpreter. 422d323ddf3SMatthew Dillon */ 423c52007c2SDavid Greenman if (imgp->interpreted) { 4241616db3cSJohn Dyson exec_unmap_first_page(imgp); 425619eb6e5SJeff Roberson /* 426619eb6e5SJeff Roberson * VV_TEXT needs to be unset for scripts. There is a short 427619eb6e5SJeff Roberson * period before we determine that something is a script where 428619eb6e5SJeff Roberson * VV_TEXT will be set. The vnode lock is held over this 429619eb6e5SJeff Roberson * entire period so nothing should illegitimately be blocked. 430619eb6e5SJeff Roberson */ 431619eb6e5SJeff Roberson imgp->vp->v_vflag &= ~VV_TEXT; 432762e6b85SEivind Eklund /* free name buffer and old vnode */ 433762e6b85SEivind Eklund NDFREE(ndp, NDF_ONLY_PNBUF); 434670cb89bSRobert Watson #ifdef MAC 435eca8a663SRobert Watson interplabel = mac_vnode_label_alloc(); 436eca8a663SRobert Watson mac_copy_vnode_label(ndp->ni_vp->v_label, interplabel); 437670cb89bSRobert Watson #endif 438619eb6e5SJeff Roberson vput(ndp->ni_vp); 4390b2ed1aeSJeff Roberson vm_object_deallocate(imgp->object); 4400b2ed1aeSJeff Roberson imgp->object = NULL; 44126f9a767SRodney W. Grimes /* set new name to that of the interpreter */ 442b35ba931SDavid Greenman NDINIT(ndp, LOOKUP, LOCKLEAF | FOLLOW | SAVENAME, 443b40ce416SJulian Elischer UIO_SYSSPACE, imgp->interpreter_name, td); 44426f9a767SRodney W. Grimes goto interpret; 44526f9a767SRodney W. Grimes } 44626f9a767SRodney W. Grimes 44726f9a767SRodney W. Grimes /* 44826f9a767SRodney W. Grimes * Copy out strings (args and env) and initialize stack base 44926f9a767SRodney W. Grimes */ 4503ebc1248SPeter Wemm if (p->p_sysent->sv_copyout_strings) 4513ebc1248SPeter Wemm stack_base = (*p->p_sysent->sv_copyout_strings)(imgp); 4523ebc1248SPeter Wemm else 453c52007c2SDavid Greenman stack_base = exec_copyout_strings(imgp); 45426f9a767SRodney W. Grimes 45526f9a767SRodney W. Grimes /* 4561e1e0b44SSøren Schmidt * If custom stack fixup routine present for this process 4571e1e0b44SSøren Schmidt * let it do the stack setup. 4581e1e0b44SSøren Schmidt * Else stuff argument count as first item on stack 45926f9a767SRodney W. Grimes */ 460d6c847f3SBruce Evans if (p->p_sysent->sv_fixup != NULL) 461c52007c2SDavid Greenman (*p->p_sysent->sv_fixup)(&stack_base, imgp); 4621e1e0b44SSøren Schmidt else 463c52007c2SDavid Greenman suword(--stack_base, imgp->argc); 46426f9a767SRodney W. Grimes 465a78e8d2aSDavid Greenman /* 466a78e8d2aSDavid Greenman * For security and other reasons, the file descriptor table cannot 467a78e8d2aSDavid Greenman * be shared after an exec. 468a78e8d2aSDavid Greenman */ 469426da3bcSAlfred Perlstein FILEDESC_LOCK(p->p_fd); 470a78e8d2aSDavid Greenman if (p->p_fd->fd_refcnt > 1) { 471a78e8d2aSDavid Greenman struct filedesc *tmp; 472a78e8d2aSDavid Greenman 473c522c1bfSAlfred Perlstein tmp = fdcopy(td->td_proc->p_fd); 474426da3bcSAlfred Perlstein FILEDESC_UNLOCK(p->p_fd); 475b40ce416SJulian Elischer fdfree(td); 476a78e8d2aSDavid Greenman p->p_fd = tmp; 477426da3bcSAlfred Perlstein } else 478426da3bcSAlfred Perlstein FILEDESC_UNLOCK(p->p_fd); 479a78e8d2aSDavid Greenman 480333ea485SGuido van Rooij /* 4819b3b1c5fSJohn Baldwin * Malloc things before we need locks. 4829b3b1c5fSJohn Baldwin */ 4839b3b1c5fSJohn Baldwin newcred = crget(); 4841419eacbSAlfred Perlstein euip = uifind(attr.va_uid); 4859b3b1c5fSJohn Baldwin i = imgp->endargs - imgp->stringbase; 4869b3b1c5fSJohn Baldwin if (ps_arg_cache_limit >= i + sizeof(struct pargs)) 4879b3b1c5fSJohn Baldwin newargs = pargs_alloc(i); 4889b3b1c5fSJohn Baldwin 4899b3b1c5fSJohn Baldwin /* close files on exec */ 4909b3b1c5fSJohn Baldwin fdcloseexec(td); 4919b3b1c5fSJohn Baldwin 492619eb6e5SJeff Roberson /* Get a reference to the vnode prior to locking the proc */ 493619eb6e5SJeff Roberson VREF(ndp->ni_vp); 494619eb6e5SJeff Roberson 4959b3b1c5fSJohn Baldwin /* 496333ea485SGuido van Rooij * For security and other reasons, signal handlers cannot 4978688bb93SJohn Baldwin * be shared after an exec. The new process gets a copy of the old 498b2c3fa70SDima Dorfman * handlers. In execsigs(), the new process will have its signals 499333ea485SGuido van Rooij * reset. 500333ea485SGuido van Rooij */ 5019b3b1c5fSJohn Baldwin PROC_LOCK(p); 50290af4afaSJohn Baldwin if (sigacts_shared(p->p_sigacts)) { 50390af4afaSJohn Baldwin oldsigacts = p->p_sigacts; 5049b3b1c5fSJohn Baldwin PROC_UNLOCK(p); 50590af4afaSJohn Baldwin newsigacts = sigacts_alloc(); 50690af4afaSJohn Baldwin sigacts_copy(newsigacts, oldsigacts); 5079b3b1c5fSJohn Baldwin PROC_LOCK(p); 50890af4afaSJohn Baldwin p->p_sigacts = newsigacts; 50990af4afaSJohn Baldwin } else 51090af4afaSJohn Baldwin oldsigacts = NULL; 511333ea485SGuido van Rooij 512fdf4e8b3SWarner Losh /* Stop profiling */ 513fdf4e8b3SWarner Losh stopprofclock(p); 514fdf4e8b3SWarner Losh 51526f9a767SRodney W. Grimes /* reset caught signals */ 51626f9a767SRodney W. Grimes execsigs(p); 51726f9a767SRodney W. Grimes 51826f9a767SRodney W. Grimes /* name this process - nameiexec(p, ndp) */ 51926f9a767SRodney W. Grimes len = min(ndp->ni_cnd.cn_namelen,MAXCOMLEN); 52026f9a767SRodney W. Grimes bcopy(ndp->ni_cnd.cn_nameptr, p->p_comm, len); 52126f9a767SRodney W. Grimes p->p_comm[len] = 0; 52226f9a767SRodney W. Grimes 52326f9a767SRodney W. Grimes /* 52424b34f09SSujal Patel * mark as execed, wakeup the process that vforked (if any) and tell 525dc733423SDag-Erling Smørgrav * it that it now has its own resources back 52626f9a767SRodney W. Grimes */ 52726f9a767SRodney W. Grimes p->p_flag |= P_EXEC; 52826f9a767SRodney W. Grimes if (p->p_pptr && (p->p_flag & P_PPWAIT)) { 52926f9a767SRodney W. Grimes p->p_flag &= ~P_PPWAIT; 5307f05b035SAlfred Perlstein wakeup(p->p_pptr); 53126f9a767SRodney W. Grimes } 53226f9a767SRodney W. Grimes 53326f9a767SRodney W. Grimes /* 534a78e8d2aSDavid Greenman * Implement image setuid/setgid. 535a78e8d2aSDavid Greenman * 536a78e8d2aSDavid Greenman * Don't honor setuid/setgid if the filesystem prohibits it or if 537a78e8d2aSDavid Greenman * the process is being traced. 538670cb89bSRobert Watson * 539670cb89bSRobert Watson * XXXMAC: For the time being, use NOSUID to also prohibit 540670cb89bSRobert Watson * transitions on the file system. 541c52007c2SDavid Greenman */ 542b1fc0ec1SRobert Watson oldcred = p->p_ucred; 543d06c0d4dSRobert Watson credential_changing = 0; 544d06c0d4dSRobert Watson credential_changing |= (attr.va_mode & VSUID) && oldcred->cr_uid != 545d06c0d4dSRobert Watson attr.va_uid; 546d06c0d4dSRobert Watson credential_changing |= (attr.va_mode & VSGID) && oldcred->cr_gid != 547d06c0d4dSRobert Watson attr.va_gid; 548ccafe7ebSRobert Watson #ifdef MAC 549670cb89bSRobert Watson will_transition = mac_execve_will_transition(oldcred, imgp->vp, 550eca8a663SRobert Watson interplabel, imgp); 551ccafe7ebSRobert Watson credential_changing |= will_transition; 552ccafe7ebSRobert Watson #endif 553d06c0d4dSRobert Watson 554d06c0d4dSRobert Watson if (credential_changing && 555a78e8d2aSDavid Greenman (imgp->vp->v_mount->mnt_flag & MNT_NOSUID) == 0 && 556c52007c2SDavid Greenman (p->p_flag & P_TRACED) == 0) { 557c52007c2SDavid Greenman /* 558c52007c2SDavid Greenman * Turn off syscall tracing for set-id programs, except for 559b85db196SPeter Wemm * root. Record any set-id flags first to make sure that 560b85db196SPeter Wemm * we do not regain any tracing during a possible block. 56126f9a767SRodney W. Grimes */ 562b85db196SPeter Wemm setsugid(p); 5636c84de02SJohn Baldwin #ifdef KTRACE 56456f21b9dSColin Percival if (p->p_tracevp != NULL && suser_cred(oldcred, SUSER_ALLOWJAIL)) { 5656c84de02SJohn Baldwin mtx_lock(&ktrace_mtx); 56679deba82SMatthew Dillon p->p_traceflag = 0; 567a5881ea5SJohn Baldwin tracevp = p->p_tracevp; 568a5881ea5SJohn Baldwin p->p_tracevp = NULL; 569a5881ea5SJohn Baldwin tracecred = p->p_tracecred; 570a5881ea5SJohn Baldwin p->p_tracecred = NULL; 5716c84de02SJohn Baldwin mtx_unlock(&ktrace_mtx); 57226f9a767SRodney W. Grimes } 5736c84de02SJohn Baldwin #endif 57428b325aaSDon Lewis /* 575c1e2d386SNate Lawson * Close any file descriptors 0..2 that reference procfs, 576c1e2d386SNate Lawson * then make sure file descriptors 0..2 are in use. 57728b325aaSDon Lewis * 578c1e2d386SNate Lawson * setugidsafety() may call closef() and then pfind() 579c1e2d386SNate Lawson * which may grab the process lock. 58028b325aaSDon Lewis * fdcheckstd() may call falloc() which may block to 58128b325aaSDon Lewis * allocate memory, so temporarily drop the process lock. 58228b325aaSDon Lewis */ 58328b325aaSDon Lewis PROC_UNLOCK(p); 584c1e2d386SNate Lawson setugidsafety(td); 585e983a376SJacques Vidrine error = fdcheckstd(td); 58663c9e754SJohn Baldwin if (error != 0) 58769be5db9SAlfred Perlstein goto done1; 588e1b1aa3bSJohn Baldwin PROC_LOCK(p); 589c52007c2SDavid Greenman /* 590c52007c2SDavid Greenman * Set the new credentials. 591c52007c2SDavid Greenman */ 5929b3b1c5fSJohn Baldwin crcopy(newcred, oldcred); 593c52007c2SDavid Greenman if (attr.va_mode & VSUID) 5941419eacbSAlfred Perlstein change_euid(newcred, euip); 595c52007c2SDavid Greenman if (attr.va_mode & VSGID) 596b1fc0ec1SRobert Watson change_egid(newcred, attr.va_gid); 597ccafe7ebSRobert Watson #ifdef MAC 598670cb89bSRobert Watson if (will_transition) { 599670cb89bSRobert Watson mac_execve_transition(oldcred, newcred, imgp->vp, 600eca8a663SRobert Watson interplabel, imgp); 601670cb89bSRobert Watson } 602ccafe7ebSRobert Watson #endif 6039b3b1c5fSJohn Baldwin /* 6049b3b1c5fSJohn Baldwin * Implement correct POSIX saved-id behavior. 605ccafe7ebSRobert Watson * 606ccafe7ebSRobert Watson * XXXMAC: Note that the current logic will save the 607ccafe7ebSRobert Watson * uid and gid if a MAC domain transition occurs, even 608ccafe7ebSRobert Watson * though maybe it shouldn't. 6099b3b1c5fSJohn Baldwin */ 6109b3b1c5fSJohn Baldwin change_svuid(newcred, newcred->cr_uid); 6119b3b1c5fSJohn Baldwin change_svgid(newcred, newcred->cr_gid); 6129b3b1c5fSJohn Baldwin p->p_ucred = newcred; 6139b3b1c5fSJohn Baldwin newcred = NULL; 614c52007c2SDavid Greenman } else { 615b1fc0ec1SRobert Watson if (oldcred->cr_uid == oldcred->cr_ruid && 616b1fc0ec1SRobert Watson oldcred->cr_gid == oldcred->cr_rgid) 617c52007c2SDavid Greenman p->p_flag &= ~P_SUGID; 61826f9a767SRodney W. Grimes /* 619c52007c2SDavid Greenman * Implement correct POSIX saved-id behavior. 620b1fc0ec1SRobert Watson * 621b1fc0ec1SRobert Watson * XXX: It's not clear that the existing behavior is 6229b3b1c5fSJohn Baldwin * POSIX-compliant. A number of sources indicate that the 6239b3b1c5fSJohn Baldwin * saved uid/gid should only be updated if the new ruid is 6249b3b1c5fSJohn Baldwin * not equal to the old ruid, or the new euid is not equal 6259b3b1c5fSJohn Baldwin * to the old euid and the new euid is not equal to the old 6269b3b1c5fSJohn Baldwin * ruid. The FreeBSD code always updates the saved uid/gid. 6279b3b1c5fSJohn Baldwin * Also, this code uses the new (replaced) euid and egid as 6289b3b1c5fSJohn Baldwin * the source, which may or may not be the right ones to use. 62926f9a767SRodney W. Grimes */ 630b1fc0ec1SRobert Watson if (oldcred->cr_svuid != oldcred->cr_uid || 631b1fc0ec1SRobert Watson oldcred->cr_svgid != oldcred->cr_gid) { 6329b3b1c5fSJohn Baldwin crcopy(newcred, oldcred); 633b1fc0ec1SRobert Watson change_svuid(newcred, newcred->cr_uid); 634b1fc0ec1SRobert Watson change_svgid(newcred, newcred->cr_gid); 635b1fc0ec1SRobert Watson p->p_ucred = newcred; 6369b3b1c5fSJohn Baldwin newcred = NULL; 6379b3b1c5fSJohn Baldwin } 638b1fc0ec1SRobert Watson } 63926f9a767SRodney W. Grimes 64026f9a767SRodney W. Grimes /* 641619eb6e5SJeff Roberson * Store the vp for use in procfs. This vnode was referenced prior 642619eb6e5SJeff Roberson * to locking the proc lock. 6432a531c80SDavid Greenman */ 6449b3b1c5fSJohn Baldwin textvp = p->p_textvp; 6452a531c80SDavid Greenman p->p_textvp = ndp->ni_vp; 6462a531c80SDavid Greenman 6472a531c80SDavid Greenman /* 6489ca45e81SDag-Erling Smørgrav * Notify others that we exec'd, and clear the P_INEXEC flag 6499ca45e81SDag-Erling Smørgrav * as we're now a bona fide freshly-execed process. 650cb679c38SJonathan Lemon */ 651ad3b9257SJohn-Mark Gurney KNOTE_LOCKED(&p->p_klist, NOTE_EXEC); 6529ca45e81SDag-Erling Smørgrav p->p_flag &= ~P_INEXEC; 653cb679c38SJonathan Lemon 654cb679c38SJonathan Lemon /* 65526f9a767SRodney W. Grimes * If tracing the process, trap to debugger so breakpoints 65626f9a767SRodney W. Grimes * can be set before the program executes. 657906ac69dSDavid Xu * Use tdsignal to deliver signal to current thread, use 658906ac69dSDavid Xu * psignal may cause the signal to be delivered to wrong thread 659906ac69dSDavid Xu * because that thread will exit, remember we are going to enter 660906ac69dSDavid Xu * single thread mode. 66126f9a767SRodney W. Grimes */ 66226f9a767SRodney W. Grimes if (p->p_flag & P_TRACED) 663906ac69dSDavid Xu tdsignal(td, SIGTRAP, SIGTARGET_TD); 66426f9a767SRodney W. Grimes 66526f9a767SRodney W. Grimes /* clear "fork but no exec" flag, as we _are_ execing */ 66626f9a767SRodney W. Grimes p->p_acflag &= ~AFORK; 66726f9a767SRodney W. Grimes 668b9df5231SPoul-Henning Kamp /* Free any previous argument cache */ 6699b3b1c5fSJohn Baldwin oldargs = p->p_args; 670b9df5231SPoul-Henning Kamp p->p_args = NULL; 671b9df5231SPoul-Henning Kamp 672e1b1aa3bSJohn Baldwin /* Cache arguments if they fit inside our allowance */ 673e1b1aa3bSJohn Baldwin if (ps_arg_cache_limit >= i + sizeof(struct pargs)) { 674e1b1aa3bSJohn Baldwin bcopy(imgp->stringbase, newargs->ar_args, i); 675e1b1aa3bSJohn Baldwin p->p_args = newargs; 676e1b1aa3bSJohn Baldwin newargs = NULL; 677e1b1aa3bSJohn Baldwin } 678e1b1aa3bSJohn Baldwin PROC_UNLOCK(p); 679e1b1aa3bSJohn Baldwin 680e913ca22SDoug Rabson /* Set values passed into the program in registers. */ 6813ebc1248SPeter Wemm if (p->p_sysent->sv_setregs) 6823ebc1248SPeter Wemm (*p->p_sysent->sv_setregs)(td, imgp->entry_addr, 6833ebc1248SPeter Wemm (u_long)(uintptr_t)stack_base, imgp->ps_strings); 6843ebc1248SPeter Wemm else 685bafbd492SJake Burkholder exec_setregs(td, imgp->entry_addr, 686bafbd492SJake Burkholder (u_long)(uintptr_t)stack_base, imgp->ps_strings); 687e913ca22SDoug Rabson 68869be5db9SAlfred Perlstein done1: 6899b3b1c5fSJohn Baldwin /* 6909b3b1c5fSJohn Baldwin * Free any resources malloc'd earlier that we didn't use. 6919b3b1c5fSJohn Baldwin */ 6921419eacbSAlfred Perlstein uifree(euip); 6939b3b1c5fSJohn Baldwin if (newcred == NULL) 6949b3b1c5fSJohn Baldwin crfree(oldcred); 6959b3b1c5fSJohn Baldwin else 6969b3b1c5fSJohn Baldwin crfree(newcred); 6979b3b1c5fSJohn Baldwin /* 6989b3b1c5fSJohn Baldwin * Handle deferred decrement of ref counts. 6999b3b1c5fSJohn Baldwin */ 7009b3b1c5fSJohn Baldwin if (textvp != NULL) 7019b3b1c5fSJohn Baldwin vrele(textvp); 702619eb6e5SJeff Roberson if (ndp->ni_vp && error != 0) 703619eb6e5SJeff Roberson vrele(ndp->ni_vp); 7046c84de02SJohn Baldwin #ifdef KTRACE 7059b3b1c5fSJohn Baldwin if (tracevp != NULL) 7069b3b1c5fSJohn Baldwin vrele(tracevp); 707a5881ea5SJohn Baldwin if (tracecred != NULL) 708a5881ea5SJohn Baldwin crfree(tracecred); 7096c84de02SJohn Baldwin #endif 71069be5db9SAlfred Perlstein if (oldargs != NULL) 7119b3b1c5fSJohn Baldwin pargs_drop(oldargs); 71269be5db9SAlfred Perlstein if (newargs != NULL) 71369be5db9SAlfred Perlstein pargs_drop(newargs); 71490af4afaSJohn Baldwin if (oldsigacts != NULL) 71590af4afaSJohn Baldwin sigacts_free(oldsigacts); 716b9df5231SPoul-Henning Kamp 7171616db3cSJohn Dyson exec_fail_dealloc: 7181616db3cSJohn Dyson 71926f9a767SRodney W. Grimes /* 72026f9a767SRodney W. Grimes * free various allocated resources 72126f9a767SRodney W. Grimes */ 722d6c847f3SBruce Evans if (imgp->firstpage != NULL) 7231616db3cSJohn Dyson exec_unmap_first_page(imgp); 72426f9a767SRodney W. Grimes 725d6c847f3SBruce Evans if (imgp->vp != NULL) { 726762e6b85SEivind Eklund NDFREE(ndp, NDF_ONLY_PNBUF); 727619eb6e5SJeff Roberson vput(imgp->vp); 728a3cf6ebaSDavid Greenman } 72926f9a767SRodney W. Grimes 730a9a08882SJeff Roberson if (imgp->stringbase != NULL) 731a9a08882SJeff Roberson kmem_free_wakeup(exec_map, (vm_offset_t)imgp->stringbase, 73259c8bc40SAlan Cox ARG_MAX); 733a9a08882SJeff Roberson 734d6c847f3SBruce Evans if (imgp->object != NULL) 7350b2ed1aeSJeff Roberson vm_object_deallocate(imgp->object); 7360b2ed1aeSJeff Roberson 737d1989db5SRobert Drehmel if (error == 0) { 738d1989db5SRobert Drehmel /* 739d1989db5SRobert Drehmel * Stop the process here if its stop event mask has 740d1989db5SRobert Drehmel * the S_EXEC bit set. 741d1989db5SRobert Drehmel */ 742d1989db5SRobert Drehmel STOPEVENT(p, S_EXEC, 0); 743116734c4SMatthew Dillon goto done2; 744d1989db5SRobert Drehmel } 7451616db3cSJohn Dyson 74626f9a767SRodney W. Grimes exec_fail: 7479ca45e81SDag-Erling Smørgrav /* we're done here, clear P_INEXEC */ 7489ca45e81SDag-Erling Smørgrav PROC_LOCK(p); 7499ca45e81SDag-Erling Smørgrav p->p_flag &= ~P_INEXEC; 7509ca45e81SDag-Erling Smørgrav PROC_UNLOCK(p); 7519ca45e81SDag-Erling Smørgrav 752c52007c2SDavid Greenman if (imgp->vmspace_destroyed) { 75326f9a767SRodney W. Grimes /* sorry, no more process anymore. exit gracefully */ 754670cb89bSRobert Watson #ifdef MAC 755670cb89bSRobert Watson mac_execve_exit(imgp); 756eca8a663SRobert Watson if (interplabel != NULL) 757eca8a663SRobert Watson mac_vnode_label_free(interplabel); 758670cb89bSRobert Watson #endif 75963993cf0SJohn Baldwin mtx_unlock(&Giant); 760b40ce416SJulian Elischer exit1(td, W_EXITCODE(0, SIGABRT)); 76126f9a767SRodney W. Grimes /* NOT REACHED */ 762116734c4SMatthew Dillon error = 0; 76326f9a767SRodney W. Grimes } 764116734c4SMatthew Dillon done2: 765670cb89bSRobert Watson #ifdef MAC 766670cb89bSRobert Watson mac_execve_exit(imgp); 767eca8a663SRobert Watson if (interplabel != NULL) 768eca8a663SRobert Watson mac_vnode_label_free(interplabel); 769670cb89bSRobert Watson #endif 770116734c4SMatthew Dillon mtx_unlock(&Giant); 771116734c4SMatthew Dillon return (error); 77226f9a767SRodney W. Grimes } 77326f9a767SRodney W. Grimes 7741616db3cSJohn Dyson int 7751616db3cSJohn Dyson exec_map_first_page(imgp) 7761616db3cSJohn Dyson struct image_params *imgp; 7771616db3cSJohn Dyson { 778d8aad40cSJohn Baldwin int rv, i; 77995461b45SJohn Dyson int initial_pagein; 78095461b45SJohn Dyson vm_page_t ma[VM_INITIAL_PAGEIN]; 7811616db3cSJohn Dyson vm_object_t object; 7821616db3cSJohn Dyson 7830cddd8f0SMatthew Dillon GIANT_REQUIRED; 7841616db3cSJohn Dyson 785d6c847f3SBruce Evans if (imgp->firstpage != NULL) 7861616db3cSJohn Dyson exec_unmap_first_page(imgp); 7871616db3cSJohn Dyson 7889ff5ce6bSBoris Popov VOP_GETVOBJECT(imgp->vp, &object); 789fd0cc9a8SAlan Cox VM_OBJECT_LOCK(object); 79095461b45SJohn Dyson ma[0] = vm_page_grab(object, 0, VM_ALLOC_NORMAL | VM_ALLOC_RETRY); 79195461b45SJohn Dyson if ((ma[0]->valid & VM_PAGE_BITS_ALL) != VM_PAGE_BITS_ALL) { 79295461b45SJohn Dyson initial_pagein = VM_INITIAL_PAGEIN; 79395461b45SJohn Dyson if (initial_pagein > object->size) 79495461b45SJohn Dyson initial_pagein = object->size; 79595461b45SJohn Dyson for (i = 1; i < initial_pagein; i++) { 796d254af07SMatthew Dillon if ((ma[i] = vm_page_lookup(object, i)) != NULL) { 7976ec2fca5SAlan Cox if (ma[i]->valid) 7986ec2fca5SAlan Cox break; 799ee113343SAlan Cox vm_page_lock_queues(); 80006fa71cdSAlan Cox if ((ma[i]->flags & PG_BUSY) || ma[i]->busy) { 80106fa71cdSAlan Cox vm_page_unlock_queues(); 80206fa71cdSAlan Cox break; 80306fa71cdSAlan Cox } 804e69763a3SDoug Rabson vm_page_busy(ma[i]); 805ee113343SAlan Cox vm_page_unlock_queues(); 80695461b45SJohn Dyson } else { 807ca0387efSJake Burkholder ma[i] = vm_page_alloc(object, i, 808ca0387efSJake Burkholder VM_ALLOC_NORMAL); 80995461b45SJohn Dyson if (ma[i] == NULL) 81095461b45SJohn Dyson break; 81195461b45SJohn Dyson } 81295461b45SJohn Dyson } 81395461b45SJohn Dyson initial_pagein = i; 81495461b45SJohn Dyson rv = vm_pager_get_pages(object, ma, initial_pagein, 0); 81595461b45SJohn Dyson ma[0] = vm_page_lookup(object, 0); 816ca0387efSJake Burkholder if ((rv != VM_PAGER_OK) || (ma[0] == NULL) || 817ca0387efSJake Burkholder (ma[0]->valid == 0)) { 818ecbb00a2SDoug Rabson if (ma[0]) { 8196ec2fca5SAlan Cox vm_page_lock_queues(); 8204fec79beSAlan Cox pmap_remove_all(ma[0]); 8218f9110f6SJohn Dyson vm_page_free(ma[0]); 82206fa71cdSAlan Cox vm_page_unlock_queues(); 8236ec2fca5SAlan Cox } 82406fa71cdSAlan Cox VM_OBJECT_UNLOCK(object); 825a7cddfedSJake Burkholder return (EIO); 8261616db3cSJohn Dyson } 8271616db3cSJohn Dyson } 8286ec2fca5SAlan Cox vm_page_lock_queues(); 829148b3f62SAlan Cox vm_page_hold(ma[0]); 830e69763a3SDoug Rabson vm_page_wakeup(ma[0]); 83197646f56SAlan Cox vm_page_unlock_queues(); 8326ec2fca5SAlan Cox VM_OBJECT_UNLOCK(object); 8331616db3cSJohn Dyson 83459c8bc40SAlan Cox imgp->firstpage = sf_buf_alloc(ma[0], 0); 83559c8bc40SAlan Cox imgp->image_header = (char *)sf_buf_kva(imgp->firstpage); 8361616db3cSJohn Dyson 837a7cddfedSJake Burkholder return (0); 8381616db3cSJohn Dyson } 8391616db3cSJohn Dyson 8401616db3cSJohn Dyson void 8411616db3cSJohn Dyson exec_unmap_first_page(imgp) 8421616db3cSJohn Dyson struct image_params *imgp; 8431616db3cSJohn Dyson { 84459c8bc40SAlan Cox vm_page_t m; 84523955314SAlfred Perlstein 846d6c847f3SBruce Evans if (imgp->firstpage != NULL) { 84759c8bc40SAlan Cox m = sf_buf_page(imgp->firstpage); 84859c8bc40SAlan Cox sf_buf_free(imgp->firstpage); 8491616db3cSJohn Dyson imgp->firstpage = NULL; 85059c8bc40SAlan Cox vm_page_lock_queues(); 85159c8bc40SAlan Cox vm_page_unhold(m); 85259c8bc40SAlan Cox vm_page_unlock_queues(); 8531616db3cSJohn Dyson } 8541616db3cSJohn Dyson } 8551616db3cSJohn Dyson 85626f9a767SRodney W. Grimes /* 85726f9a767SRodney W. Grimes * Destroy old address space, and allocate a new stack 85826f9a767SRodney W. Grimes * The new stack is only SGROWSIZ large because it is grown 85926f9a767SRodney W. Grimes * automatically in trap.c. 86026f9a767SRodney W. Grimes */ 86126f9a767SRodney W. Grimes int 86205ba50f5SJake Burkholder exec_new_vmspace(imgp, sv) 863c52007c2SDavid Greenman struct image_params *imgp; 86405ba50f5SJake Burkholder struct sysentvec *sv; 86526f9a767SRodney W. Grimes { 86626f9a767SRodney W. Grimes int error; 8675e20c11fSAlan Cox struct proc *p = imgp->proc; 8685e20c11fSAlan Cox struct vmspace *vmspace = p->p_vmspace; 86905ba50f5SJake Burkholder vm_offset_t stack_addr; 87005ba50f5SJake Burkholder vm_map_t map; 87126f9a767SRodney W. Grimes 8720cddd8f0SMatthew Dillon GIANT_REQUIRED; 8730cddd8f0SMatthew Dillon 874c52007c2SDavid Greenman imgp->vmspace_destroyed = 1; 87526f9a767SRodney W. Grimes 876a5bdcb2aSPeter Wemm /* Called with Giant held, do not depend on it! */ 87775b8b3b2SJohn Baldwin EVENTHANDLER_INVOKE(process_exec, p); 8786f5dafeaSAlan Cox 8796f5dafeaSAlan Cox /* 880c460ac3aSPeter Wemm * Here is as good a place as any to do any resource limit cleanups. 881c460ac3aSPeter Wemm * This is needed if a 64 bit binary exec's a 32 bit binary - the 882c460ac3aSPeter Wemm * data size limit may need to be changed to a value that makes 883c460ac3aSPeter Wemm * sense for the 32 bit binary. 884c460ac3aSPeter Wemm */ 885d6c847f3SBruce Evans if (sv->sv_fixlimits != NULL) 886c460ac3aSPeter Wemm sv->sv_fixlimits(imgp); 887c460ac3aSPeter Wemm 888c460ac3aSPeter Wemm /* 889af9ec885SJohn Dyson * Blow away entire process VM, if address space not shared, 890af9ec885SJohn Dyson * otherwise, create a new VM space so that other threads are 891af9ec885SJohn Dyson * not disrupted 892af9ec885SJohn Dyson */ 89305ba50f5SJake Burkholder map = &vmspace->vm_map; 89405ba50f5SJake Burkholder if (vmspace->vm_refcnt == 1 && vm_map_min(map) == sv->sv_minuser && 89505ba50f5SJake Burkholder vm_map_max(map) == sv->sv_maxuser) { 8963db161e0SMatthew Dillon shmexit(vmspace); 89705ba50f5SJake Burkholder pmap_remove_pages(vmspace_pmap(vmspace), vm_map_min(map), 89805ba50f5SJake Burkholder vm_map_max(map)); 89905ba50f5SJake Burkholder vm_map_remove(map, vm_map_min(map), vm_map_max(map)); 900af9ec885SJohn Dyson } else { 90105ba50f5SJake Burkholder vmspace_exec(p, sv->sv_minuser, sv->sv_maxuser); 9025e20c11fSAlan Cox vmspace = p->p_vmspace; 90305ba50f5SJake Burkholder map = &vmspace->vm_map; 904af9ec885SJohn Dyson } 90526f9a767SRodney W. Grimes 90626f9a767SRodney W. Grimes /* Allocate a new stack */ 907fd75d710SMarcel Moolenaar stack_addr = sv->sv_usrstack - maxssiz; 90805ba50f5SJake Burkholder error = vm_map_stack(map, stack_addr, (vm_size_t)maxssiz, 909fd75d710SMarcel Moolenaar sv->sv_stackprot, VM_PROT_ALL, MAP_STACK_GROWS_DOWN); 9102267af78SJulian Elischer if (error) 9112267af78SJulian Elischer return (error); 9122267af78SJulian Elischer 91363c47a5cSDoug Rabson #ifdef __ia64__ 914fd75d710SMarcel Moolenaar /* Allocate a new register stack */ 915bab1f052SMarcel Moolenaar stack_addr = IA64_BACKINGSTORE; 916fd75d710SMarcel Moolenaar error = vm_map_stack(map, stack_addr, (vm_size_t)maxssiz, 917fd75d710SMarcel Moolenaar sv->sv_stackprot, VM_PROT_ALL, MAP_STACK_GROWS_UP); 918fd75d710SMarcel Moolenaar if (error) 919fd75d710SMarcel Moolenaar return (error); 92063c47a5cSDoug Rabson #endif 92163c47a5cSDoug Rabson 9222267af78SJulian Elischer /* vm_ssize and vm_maxsaddr are somewhat antiquated concepts in the 9232267af78SJulian Elischer * VM_STACK case, but they are still used to monitor the size of the 9242267af78SJulian Elischer * process stack so we can check the stack rlimit. 9252267af78SJulian Elischer */ 926cbc89bfbSPaul Saab vmspace->vm_ssize = sgrowsiz >> PAGE_SHIFT; 92705ba50f5SJake Burkholder vmspace->vm_maxsaddr = (char *)sv->sv_usrstack - maxssiz; 92826f9a767SRodney W. Grimes 92926f9a767SRodney W. Grimes return (0); 93026f9a767SRodney W. Grimes } 93126f9a767SRodney W. Grimes 93226f9a767SRodney W. Grimes /* 93326f9a767SRodney W. Grimes * Copy out argument and environment strings from the old process 93426f9a767SRodney W. Grimes * address space into the temporary string buffer. 93526f9a767SRodney W. Grimes */ 93626f9a767SRodney W. Grimes int 937c52007c2SDavid Greenman exec_extract_strings(imgp) 938c52007c2SDavid Greenman struct image_params *imgp; 93926f9a767SRodney W. Grimes { 94026f9a767SRodney W. Grimes char **argv, **envv; 94126f9a767SRodney W. Grimes char *argp, *envp; 942ecbb00a2SDoug Rabson int error; 943ecbb00a2SDoug Rabson size_t length; 94426f9a767SRodney W. Grimes 94526f9a767SRodney W. Grimes /* 94626f9a767SRodney W. Grimes * extract arguments first 94726f9a767SRodney W. Grimes */ 94826f9a767SRodney W. Grimes 949450ffb44SRobert Watson argv = imgp->userspace_argv; 95026f9a767SRodney W. Grimes 9510fd1a014SDavid Greenman if (argv) { 952aae0aa45SBruce Evans argp = (caddr_t)(intptr_t)fuword(argv); 9535cf3d12cSAndrey A. Chernov if (argp == (caddr_t)-1) 9545cf3d12cSAndrey A. Chernov return (EFAULT); 9555cf3d12cSAndrey A. Chernov if (argp) 9565cf3d12cSAndrey A. Chernov argv++; 9575cf3d12cSAndrey A. Chernov if (imgp->argv0) 9585cf3d12cSAndrey A. Chernov argp = imgp->argv0; 9595cf3d12cSAndrey A. Chernov if (argp) { 9605cf3d12cSAndrey A. Chernov do { 96126f9a767SRodney W. Grimes if (argp == (caddr_t)-1) 96226f9a767SRodney W. Grimes return (EFAULT); 963c52007c2SDavid Greenman if ((error = copyinstr(argp, imgp->stringp, 964c52007c2SDavid Greenman imgp->stringspace, &length))) { 9650fd1a014SDavid Greenman if (error == ENAMETOOLONG) 96626f9a767SRodney W. Grimes return (E2BIG); 9670fd1a014SDavid Greenman return (error); 9680fd1a014SDavid Greenman } 969c52007c2SDavid Greenman imgp->stringspace -= length; 970c52007c2SDavid Greenman imgp->stringp += length; 971c52007c2SDavid Greenman imgp->argc++; 972aae0aa45SBruce Evans } while ((argp = (caddr_t)(intptr_t)fuword(argv++))); 97326f9a767SRodney W. Grimes } 9747700eb86SRuslan Ermilov } else 9757700eb86SRuslan Ermilov return (EFAULT); 97626f9a767SRodney W. Grimes 977b9df5231SPoul-Henning Kamp imgp->endargs = imgp->stringp; 978b9df5231SPoul-Henning Kamp 97926f9a767SRodney W. Grimes /* 98026f9a767SRodney W. Grimes * extract environment strings 98126f9a767SRodney W. Grimes */ 98226f9a767SRodney W. Grimes 983450ffb44SRobert Watson envv = imgp->userspace_envv; 98426f9a767SRodney W. Grimes 9850fd1a014SDavid Greenman if (envv) { 986aae0aa45SBruce Evans while ((envp = (caddr_t)(intptr_t)fuword(envv++))) { 98726f9a767SRodney W. Grimes if (envp == (caddr_t)-1) 98826f9a767SRodney W. Grimes return (EFAULT); 989c52007c2SDavid Greenman if ((error = copyinstr(envp, imgp->stringp, 990c52007c2SDavid Greenman imgp->stringspace, &length))) { 9910fd1a014SDavid Greenman if (error == ENAMETOOLONG) 99226f9a767SRodney W. Grimes return (E2BIG); 9930fd1a014SDavid Greenman return (error); 9940fd1a014SDavid Greenman } 995c52007c2SDavid Greenman imgp->stringspace -= length; 996c52007c2SDavid Greenman imgp->stringp += length; 997c52007c2SDavid Greenman imgp->envc++; 99826f9a767SRodney W. Grimes } 9990fd1a014SDavid Greenman } 100026f9a767SRodney W. Grimes 100126f9a767SRodney W. Grimes return (0); 100226f9a767SRodney W. Grimes } 100326f9a767SRodney W. Grimes 100426f9a767SRodney W. Grimes /* 100526f9a767SRodney W. Grimes * Copy strings out to the new process address space, constructing 100626f9a767SRodney W. Grimes * new arg and env vector tables. Return a pointer to the base 100726f9a767SRodney W. Grimes * so that it can be used as the initial stack pointer. 100826f9a767SRodney W. Grimes */ 1009654f6be1SBruce Evans register_t * 1010c52007c2SDavid Greenman exec_copyout_strings(imgp) 1011c52007c2SDavid Greenman struct image_params *imgp; 101226f9a767SRodney W. Grimes { 101326f9a767SRodney W. Grimes int argc, envc; 101426f9a767SRodney W. Grimes char **vectp; 101526f9a767SRodney W. Grimes char *stringp, *destp; 1016654f6be1SBruce Evans register_t *stack_base; 101793f6448cSDavid Greenman struct ps_strings *arginfo; 1018f3bec5d7SJake Burkholder struct proc *p; 1019d66a5066SPeter Wemm int szsigcode; 102026f9a767SRodney W. Grimes 102126f9a767SRodney W. Grimes /* 102226f9a767SRodney W. Grimes * Calculate string base and vector table pointers. 1023d66a5066SPeter Wemm * Also deal with signal trampoline code for this exec type. 102426f9a767SRodney W. Grimes */ 1025f3bec5d7SJake Burkholder p = imgp->proc; 1026f3bec5d7SJake Burkholder szsigcode = 0; 102705ba50f5SJake Burkholder arginfo = (struct ps_strings *)p->p_sysent->sv_psstrings; 1028f3bec5d7SJake Burkholder if (p->p_sysent->sv_szsigcode != NULL) 1029f3bec5d7SJake Burkholder szsigcode = *(p->p_sysent->sv_szsigcode); 1030d66a5066SPeter Wemm destp = (caddr_t)arginfo - szsigcode - SPARE_USRSPACE - 10311ed012f9SPeter Wemm roundup((ARG_MAX - imgp->stringspace), sizeof(char *)); 10321ed012f9SPeter Wemm 103326f9a767SRodney W. Grimes /* 1034d66a5066SPeter Wemm * install sigcode 1035d66a5066SPeter Wemm */ 1036d66a5066SPeter Wemm if (szsigcode) 1037f3bec5d7SJake Burkholder copyout(p->p_sysent->sv_sigcode, ((caddr_t)arginfo - 1038f3bec5d7SJake Burkholder szsigcode), szsigcode); 1039d66a5066SPeter Wemm 1040d66a5066SPeter Wemm /* 1041e1743d02SSøren Schmidt * If we have a valid auxargs ptr, prepare some room 1042e1743d02SSøren Schmidt * on the stack. 1043e1743d02SSøren Schmidt */ 1044b9a22da4STakanori Watanabe if (imgp->auxargs) { 1045e1743d02SSøren Schmidt /* 1046b9a22da4STakanori Watanabe * 'AT_COUNT*2' is size for the ELF Auxargs data. This is for 1047b9a22da4STakanori Watanabe * lower compatibility. 1048b9a22da4STakanori Watanabe */ 1049ca0387efSJake Burkholder imgp->auxarg_size = (imgp->auxarg_size) ? imgp->auxarg_size : 1050ca0387efSJake Burkholder (AT_COUNT * 2); 1051b9a22da4STakanori Watanabe /* 1052b9a22da4STakanori Watanabe * The '+ 2' is for the null pointers at the end of each of 1053b9a22da4STakanori Watanabe * the arg and env vector sets,and imgp->auxarg_size is room 1054b9a22da4STakanori Watanabe * for argument of Runtime loader. 1055e1743d02SSøren Schmidt */ 1056e1743d02SSøren Schmidt vectp = (char **)(destp - (imgp->argc + imgp->envc + 2 + 1057b9a22da4STakanori Watanabe imgp->auxarg_size) * sizeof(char *)); 1058b9a22da4STakanori Watanabe 1059b9a22da4STakanori Watanabe } else 1060e1743d02SSøren Schmidt /* 1061b9a22da4STakanori Watanabe * The '+ 2' is for the null pointers at the end of each of 1062b9a22da4STakanori Watanabe * the arg and env vector sets 106326f9a767SRodney W. Grimes */ 1064ca0387efSJake Burkholder vectp = (char **)(destp - (imgp->argc + imgp->envc + 2) * 1065ca0387efSJake Burkholder sizeof(char *)); 106626f9a767SRodney W. Grimes 106726f9a767SRodney W. Grimes /* 106826f9a767SRodney W. Grimes * vectp also becomes our initial stack base 106926f9a767SRodney W. Grimes */ 1070654f6be1SBruce Evans stack_base = (register_t *)vectp; 107126f9a767SRodney W. Grimes 1072c52007c2SDavid Greenman stringp = imgp->stringbase; 1073c52007c2SDavid Greenman argc = imgp->argc; 1074c52007c2SDavid Greenman envc = imgp->envc; 107526f9a767SRodney W. Grimes 107693f6448cSDavid Greenman /* 10773aed948bSDavid Greenman * Copy out strings - arguments and environment. 107893f6448cSDavid Greenman */ 1079c52007c2SDavid Greenman copyout(stringp, destp, ARG_MAX - imgp->stringspace); 108093f6448cSDavid Greenman 108193f6448cSDavid Greenman /* 10823aed948bSDavid Greenman * Fill in "ps_strings" struct for ps, w, etc. 10833aed948bSDavid Greenman */ 1084aae0aa45SBruce Evans suword(&arginfo->ps_argvstr, (long)(intptr_t)vectp); 10853aed948bSDavid Greenman suword(&arginfo->ps_nargvstr, argc); 10863aed948bSDavid Greenman 10873aed948bSDavid Greenman /* 10883aed948bSDavid Greenman * Fill in argument portion of vector table. 108993f6448cSDavid Greenman */ 109026f9a767SRodney W. Grimes for (; argc > 0; --argc) { 1091aae0aa45SBruce Evans suword(vectp++, (long)(intptr_t)destp); 10923aed948bSDavid Greenman while (*stringp++ != 0) 10933aed948bSDavid Greenman destp++; 10943aed948bSDavid Greenman destp++; 109526f9a767SRodney W. Grimes } 109626f9a767SRodney W. Grimes 10971a6e52d0SJeroen Ruigrok van der Werven /* a null vector table pointer separates the argp's from the envp's */ 10986ab46d52SBruce Evans suword(vectp++, 0); 109926f9a767SRodney W. Grimes 1100aae0aa45SBruce Evans suword(&arginfo->ps_envstr, (long)(intptr_t)vectp); 11013aed948bSDavid Greenman suword(&arginfo->ps_nenvstr, envc); 110293f6448cSDavid Greenman 110393f6448cSDavid Greenman /* 11043aed948bSDavid Greenman * Fill in environment portion of vector table. 110593f6448cSDavid Greenman */ 110626f9a767SRodney W. Grimes for (; envc > 0; --envc) { 1107aae0aa45SBruce Evans suword(vectp++, (long)(intptr_t)destp); 11083aed948bSDavid Greenman while (*stringp++ != 0) 11093aed948bSDavid Greenman destp++; 11103aed948bSDavid Greenman destp++; 111126f9a767SRodney W. Grimes } 111226f9a767SRodney W. Grimes 111326f9a767SRodney W. Grimes /* end of vector table is a null pointer */ 11146ab46d52SBruce Evans suword(vectp, 0); 111526f9a767SRodney W. Grimes 111626f9a767SRodney W. Grimes return (stack_base); 111726f9a767SRodney W. Grimes } 111826f9a767SRodney W. Grimes 111926f9a767SRodney W. Grimes /* 112026f9a767SRodney W. Grimes * Check permissions of file to execute. 1121cf64863aSRobert Watson * Called with imgp->vp locked. 112226f9a767SRodney W. Grimes * Return 0 for success or error code on failure. 112326f9a767SRodney W. Grimes */ 1124c8a79999SPeter Wemm int 1125c52007c2SDavid Greenman exec_check_permissions(imgp) 1126c52007c2SDavid Greenman struct image_params *imgp; 112726f9a767SRodney W. Grimes { 1128c52007c2SDavid Greenman struct vnode *vp = imgp->vp; 1129c52007c2SDavid Greenman struct vattr *attr = imgp->attr; 1130a854ed98SJohn Baldwin struct thread *td; 113126f9a767SRodney W. Grimes int error; 113226f9a767SRodney W. Grimes 1133a854ed98SJohn Baldwin td = curthread; /* XXXKSE */ 1134339b79b9SRobert Watson 1135ec35c2afSRobert Watson /* Get file attributes */ 1136ec35c2afSRobert Watson error = VOP_GETATTR(vp, attr, td->td_ucred, td); 1137ec35c2afSRobert Watson if (error) 1138ec35c2afSRobert Watson return (error); 1139ec35c2afSRobert Watson 1140339b79b9SRobert Watson #ifdef MAC 1141670cb89bSRobert Watson error = mac_check_vnode_exec(td->td_ucred, imgp->vp, imgp); 1142339b79b9SRobert Watson if (error) 1143339b79b9SRobert Watson return (error); 1144339b79b9SRobert Watson #endif 1145339b79b9SRobert Watson 114626f9a767SRodney W. Grimes /* 114726f9a767SRodney W. Grimes * 1) Check if file execution is disabled for the filesystem that this 114826f9a767SRodney W. Grimes * file resides on. 114926f9a767SRodney W. Grimes * 2) Insure that at least one execute bit is on - otherwise root 115026f9a767SRodney W. Grimes * will always succeed, and we don't want to happen unless the 115126f9a767SRodney W. Grimes * file really is executable. 115226f9a767SRodney W. Grimes * 3) Insure that the file is a regular file. 115326f9a767SRodney W. Grimes */ 1154c52007c2SDavid Greenman if ((vp->v_mount->mnt_flag & MNT_NOEXEC) || 115526f9a767SRodney W. Grimes ((attr->va_mode & 0111) == 0) || 1156a854ed98SJohn Baldwin (attr->va_type != VREG)) 115726f9a767SRodney W. Grimes return (EACCES); 115826f9a767SRodney W. Grimes 115926f9a767SRodney W. Grimes /* 116026f9a767SRodney W. Grimes * Zero length files can't be exec'd 116126f9a767SRodney W. Grimes */ 116226f9a767SRodney W. Grimes if (attr->va_size == 0) 116326f9a767SRodney W. Grimes return (ENOEXEC); 116426f9a767SRodney W. Grimes 116526f9a767SRodney W. Grimes /* 116626f9a767SRodney W. Grimes * Check for execute permission to file based on current credentials. 116726f9a767SRodney W. Grimes */ 1168a854ed98SJohn Baldwin error = VOP_ACCESS(vp, VEXEC, td->td_ucred, td); 116926f9a767SRodney W. Grimes if (error) 117026f9a767SRodney W. Grimes return (error); 117126f9a767SRodney W. Grimes 11726d5a0a8cSDavid Greenman /* 11736d5a0a8cSDavid Greenman * Check number of open-for-writes on the file and deny execution 11746d5a0a8cSDavid Greenman * if there are any. 11756d5a0a8cSDavid Greenman */ 11766d5a0a8cSDavid Greenman if (vp->v_writecount) 11776d5a0a8cSDavid Greenman return (ETXTBSY); 11786d5a0a8cSDavid Greenman 11796d5a0a8cSDavid Greenman /* 11806d5a0a8cSDavid Greenman * Call filesystem specific open routine (which does nothing in the 11816d5a0a8cSDavid Greenman * general case). 11826d5a0a8cSDavid Greenman */ 1183a8d43c90SPoul-Henning Kamp error = VOP_OPEN(vp, FREAD, td->td_ucred, td, -1); 118426f9a767SRodney W. Grimes return (error); 1185df8bae1dSRodney W. Grimes } 1186aa855a59SPeter Wemm 1187aa855a59SPeter Wemm /* 1188aa855a59SPeter Wemm * Exec handler registration 1189aa855a59SPeter Wemm */ 1190aa855a59SPeter Wemm int 1191aa855a59SPeter Wemm exec_register(execsw_arg) 1192aa855a59SPeter Wemm const struct execsw *execsw_arg; 1193aa855a59SPeter Wemm { 1194aa855a59SPeter Wemm const struct execsw **es, **xs, **newexecsw; 1195aa855a59SPeter Wemm int count = 2; /* New slot and trailing NULL */ 1196aa855a59SPeter Wemm 1197aa855a59SPeter Wemm if (execsw) 1198aa855a59SPeter Wemm for (es = execsw; *es; es++) 1199aa855a59SPeter Wemm count++; 1200a163d034SWarner Losh newexecsw = malloc(count * sizeof(*es), M_TEMP, M_WAITOK); 1201aa855a59SPeter Wemm if (newexecsw == NULL) 1202a7cddfedSJake Burkholder return (ENOMEM); 1203aa855a59SPeter Wemm xs = newexecsw; 1204aa855a59SPeter Wemm if (execsw) 1205aa855a59SPeter Wemm for (es = execsw; *es; es++) 1206aa855a59SPeter Wemm *xs++ = *es; 1207aa855a59SPeter Wemm *xs++ = execsw_arg; 1208aa855a59SPeter Wemm *xs = NULL; 1209aa855a59SPeter Wemm if (execsw) 1210aa855a59SPeter Wemm free(execsw, M_TEMP); 1211aa855a59SPeter Wemm execsw = newexecsw; 1212a7cddfedSJake Burkholder return (0); 1213aa855a59SPeter Wemm } 1214aa855a59SPeter Wemm 1215aa855a59SPeter Wemm int 1216aa855a59SPeter Wemm exec_unregister(execsw_arg) 1217aa855a59SPeter Wemm const struct execsw *execsw_arg; 1218aa855a59SPeter Wemm { 1219aa855a59SPeter Wemm const struct execsw **es, **xs, **newexecsw; 1220aa855a59SPeter Wemm int count = 1; 1221aa855a59SPeter Wemm 1222aa855a59SPeter Wemm if (execsw == NULL) 1223aa855a59SPeter Wemm panic("unregister with no handlers left?\n"); 1224aa855a59SPeter Wemm 1225aa855a59SPeter Wemm for (es = execsw; *es; es++) { 1226aa855a59SPeter Wemm if (*es == execsw_arg) 1227aa855a59SPeter Wemm break; 1228aa855a59SPeter Wemm } 1229aa855a59SPeter Wemm if (*es == NULL) 1230a7cddfedSJake Burkholder return (ENOENT); 1231aa855a59SPeter Wemm for (es = execsw; *es; es++) 1232aa855a59SPeter Wemm if (*es != execsw_arg) 1233aa855a59SPeter Wemm count++; 1234a163d034SWarner Losh newexecsw = malloc(count * sizeof(*es), M_TEMP, M_WAITOK); 1235aa855a59SPeter Wemm if (newexecsw == NULL) 1236a7cddfedSJake Burkholder return (ENOMEM); 1237aa855a59SPeter Wemm xs = newexecsw; 1238aa855a59SPeter Wemm for (es = execsw; *es; es++) 1239aa855a59SPeter Wemm if (*es != execsw_arg) 1240aa855a59SPeter Wemm *xs++ = *es; 1241aa855a59SPeter Wemm *xs = NULL; 1242aa855a59SPeter Wemm if (execsw) 1243aa855a59SPeter Wemm free(execsw, M_TEMP); 1244aa855a59SPeter Wemm execsw = newexecsw; 1245a7cddfedSJake Burkholder return (0); 1246aa855a59SPeter Wemm } 1247