Home | History | Annotate | Line # | Download | only in kern
kern_exec.c revision 1.162
      1  1.162      manu /*	$NetBSD: kern_exec.c,v 1.162 2002/11/07 00:22:30 manu Exp $	*/
      2   1.55       cgd 
      3   1.55       cgd /*-
      4   1.77       cgd  * Copyright (C) 1993, 1994, 1996 Christopher G. Demetriou
      5   1.55       cgd  * Copyright (C) 1992 Wolfgang Solfrank.
      6   1.55       cgd  * Copyright (C) 1992 TooLs GmbH.
      7   1.55       cgd  * All rights reserved.
      8   1.55       cgd  *
      9   1.55       cgd  * Redistribution and use in source and binary forms, with or without
     10   1.55       cgd  * modification, are permitted provided that the following conditions
     11   1.55       cgd  * are met:
     12   1.55       cgd  * 1. Redistributions of source code must retain the above copyright
     13   1.55       cgd  *    notice, this list of conditions and the following disclaimer.
     14   1.55       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     15   1.55       cgd  *    notice, this list of conditions and the following disclaimer in the
     16   1.55       cgd  *    documentation and/or other materials provided with the distribution.
     17   1.55       cgd  * 3. All advertising materials mentioning features or use of this software
     18   1.55       cgd  *    must display the following acknowledgement:
     19   1.55       cgd  *	This product includes software developed by TooLs GmbH.
     20   1.55       cgd  * 4. The name of TooLs GmbH may not be used to endorse or promote products
     21   1.55       cgd  *    derived from this software without specific prior written permission.
     22   1.55       cgd  *
     23   1.55       cgd  * THIS SOFTWARE IS PROVIDED BY TOOLS GMBH ``AS IS'' AND ANY EXPRESS OR
     24   1.55       cgd  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     25   1.55       cgd  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     26   1.55       cgd  * IN NO EVENT SHALL TOOLS GMBH BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
     27   1.55       cgd  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
     28   1.55       cgd  * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
     29   1.55       cgd  * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
     30   1.55       cgd  * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
     31   1.55       cgd  * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
     32   1.55       cgd  * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     33   1.55       cgd  */
     34  1.146     lukem 
     35  1.146     lukem #include <sys/cdefs.h>
     36  1.162      manu __KERNEL_RCSID(0, "$NetBSD: kern_exec.c,v 1.162 2002/11/07 00:22:30 manu Exp $");
     37   1.89       mrg 
     38   1.92   thorpej #include "opt_ktrace.h"
     39  1.124  jdolecek #include "opt_syscall_debug.h"
     40   1.55       cgd 
     41   1.55       cgd #include <sys/param.h>
     42   1.55       cgd #include <sys/systm.h>
     43   1.55       cgd #include <sys/filedesc.h>
     44   1.55       cgd #include <sys/kernel.h>
     45   1.55       cgd #include <sys/proc.h>
     46   1.55       cgd #include <sys/mount.h>
     47   1.55       cgd #include <sys/malloc.h>
     48   1.55       cgd #include <sys/namei.h>
     49   1.55       cgd #include <sys/vnode.h>
     50   1.55       cgd #include <sys/file.h>
     51   1.55       cgd #include <sys/acct.h>
     52   1.55       cgd #include <sys/exec.h>
     53   1.55       cgd #include <sys/ktrace.h>
     54   1.55       cgd #include <sys/resourcevar.h>
     55   1.55       cgd #include <sys/wait.h>
     56   1.55       cgd #include <sys/mman.h>
     57  1.155  gmcgarry #include <sys/ras.h>
     58   1.55       cgd #include <sys/signalvar.h>
     59   1.55       cgd #include <sys/stat.h>
     60  1.124  jdolecek #include <sys/syscall.h>
     61   1.55       cgd 
     62   1.56       cgd #include <sys/syscallargs.h>
     63   1.55       cgd 
     64   1.88       mrg #include <uvm/uvm_extern.h>
     65   1.88       mrg 
     66   1.55       cgd #include <machine/cpu.h>
     67   1.55       cgd #include <machine/reg.h>
     68   1.55       cgd 
     69  1.143  christos #ifdef DEBUG_EXEC
     70  1.143  christos #define DPRINTF(a) uprintf a
     71  1.143  christos #else
     72  1.143  christos #define DPRINTF(a)
     73  1.143  christos #endif /* DEBUG_EXEC */
     74  1.143  christos 
     75  1.130  jdolecek /*
     76  1.130  jdolecek  * Exec function switch:
     77  1.130  jdolecek  *
     78  1.130  jdolecek  * Note that each makecmds function is responsible for loading the
     79  1.130  jdolecek  * exec package with the necessary functions for any exec-type-specific
     80  1.130  jdolecek  * handling.
     81  1.130  jdolecek  *
     82  1.130  jdolecek  * Functions for specific exec types should be defined in their own
     83  1.130  jdolecek  * header file.
     84  1.130  jdolecek  */
     85  1.138     lukem extern const struct execsw	execsw_builtin[];	/* NOTE(review): presumably the exec formats compiled into the kernel; defined outside this file - confirm */
     86  1.138     lukem extern int			nexecs_builtin;	/* NOTE(review): presumably the number of entries in execsw_builtin[] - confirm */
     87  1.138     lukem static const struct execsw	**execsw = NULL;	/* exec switch table; check_exec() calls each entry's es_check in index order */
     88  1.138     lukem static int			nexecs;	/* number of entries in execsw[], used as the loop bound in check_exec() */
     89  1.138     lukem 
     90  1.153   thorpej u_int	exec_maxhdrsz;		/* size of the exec header buffer sys_execve() allocates; must not be static - netbsd32 needs it */
     91  1.130  jdolecek 
     92  1.130  jdolecek #ifdef LKM
     93  1.130  jdolecek /* list of supported emulations; el_head is the head of a list of struct emul_entry */
     94  1.130  jdolecek static
     95  1.130  jdolecek LIST_HEAD(emlist_head, emul_entry) el_head = LIST_HEAD_INITIALIZER(el_head);
     96  1.130  jdolecek struct emul_entry {
     97  1.138     lukem 	LIST_ENTRY(emul_entry)	el_list;	/* linkage on el_head */
     98  1.138     lukem 	const struct emul	*el_emul;	/* the emulation this entry describes */
     99  1.138     lukem 	int			ro_entry;	/* NOTE(review): presumably marks an entry that must not be removed - confirm against its users */
    100  1.130  jdolecek };
    101  1.130  jdolecek 
    102  1.130  jdolecek /* list of dynamically loaded execsw entries; ex_head is the head of a list of struct exec_entry */
    103  1.130  jdolecek static
    104  1.130  jdolecek LIST_HEAD(execlist_head, exec_entry) ex_head = LIST_HEAD_INITIALIZER(ex_head);
    105  1.130  jdolecek struct exec_entry {
    106  1.138     lukem 	LIST_ENTRY(exec_entry)	ex_list;	/* linkage on ex_head */
    107  1.138     lukem 	const struct execsw	*es;	/* the exec switch entry held by this node */
    108  1.130  jdolecek };
    109  1.130  jdolecek 
    110  1.130  jdolecek /* structure used for building execsw[]: a singly linked chain of exec switch entries */
    111  1.130  jdolecek struct execsw_entry {
    112  1.138     lukem 	struct execsw_entry	*next;	/* next node in the chain */
    113  1.138     lukem 	const struct execsw	*es;	/* exec switch entry carried by this node */
    114  1.130  jdolecek };
    115  1.130  jdolecek #endif /* LKM */
    116  1.130  jdolecek 
    117  1.130  jdolecek /* NetBSD emul struct: the emulation descriptor for native binaries, plus the externs its initializer refers to */
    118  1.138     lukem extern char	sigcode[], esigcode[];	/* signal trampoline bounds; sys_execve() copies this range onto the new stack */
    119  1.124  jdolecek #ifdef SYSCALL_DEBUG
    120  1.124  jdolecek extern const char * const syscallnames[];
    121  1.124  jdolecek #endif
    122  1.133   mycroft #ifdef __HAVE_SYSCALL_INTERN
    123  1.138     lukem void syscall_intern(struct proc *);
    124  1.133   mycroft #else
    125  1.138     lukem void syscall(void);
    126  1.133   mycroft #endif
    127  1.124  jdolecek 
    128  1.124  jdolecek const struct emul emul_netbsd = {	/* positional initializer: member order must match struct emul, which is declared outside this file */
    129  1.124  jdolecek 	"netbsd",	/* NOTE(review): presumably the emulation's name - confirm against struct emul */
    130  1.127  jdolecek 	NULL,		/* emulation path */
    131  1.133   mycroft #ifndef __HAVE_MINIMAL_EMUL
    132  1.140      manu 	EMUL_HAS_SYS___syscall,	/* this and the next three members exist only without __HAVE_MINIMAL_EMUL */
    133  1.124  jdolecek 	NULL,	/* NOTE(review): meaning of this slot is not visible here - confirm against struct emul */
    134  1.124  jdolecek 	SYS_syscall,	/* NOTE(review): presumably the number of the indirect syscall - confirm */
    135  1.161  jdolecek 	SYS_NSYSENT,	/* NOTE(review): presumably the number of entries in sysent - confirm */
    136  1.133   mycroft #endif
    137  1.124  jdolecek 	sysent,	/* NOTE(review): presumably the native system call table - confirm */
    138  1.124  jdolecek #ifdef SYSCALL_DEBUG
    139  1.124  jdolecek 	syscallnames,	/* name table supplied only when SYSCALL_DEBUG is defined */
    140  1.124  jdolecek #else
    141  1.124  jdolecek 	NULL,
    142  1.124  jdolecek #endif
    143  1.133   mycroft 	sendsig,
    144  1.142  christos 	trapsignal,
    145  1.124  jdolecek 	sigcode,	/* e_sigcode: start of the trampoline that sys_execve() copies out */
    146  1.124  jdolecek 	esigcode,	/* e_esigcode: end of the trampoline; sys_execve() sizes it as e_esigcode - e_sigcode */
    147  1.145  jdolecek 	setregs,
    148  1.128  jdolecek 	NULL,	/* NOTE(review): this and the next two slots are left empty; which hooks they are is not visible here */
    149  1.128  jdolecek 	NULL,
    150  1.128  jdolecek 	NULL,
    151  1.133   mycroft #ifdef __HAVE_SYSCALL_INTERN
    152  1.133   mycroft 	syscall_intern,	/* entry selected when __HAVE_SYSCALL_INTERN is defined */
    153  1.133   mycroft #else
    154  1.133   mycroft 	syscall,	/* entry used otherwise */
    155  1.133   mycroft #endif
    156  1.156      manu 	NULL,	/* NOTE(review): last two slots are left empty; confirm their meaning against struct emul */
    157  1.156      manu 	NULL,
    158  1.124  jdolecek };
    159  1.124  jdolecek 
    160  1.147  jdolecek #ifdef LKM
    161   1.55       cgd /*
    162  1.130  jdolecek  * Exec lock. Used to control access to execsw[] structures.
    163  1.130  jdolecek  * This must not be static so that netbsd32 can access it, too.
    164  1.130  jdolecek  */
    165  1.130  jdolecek struct lock exec_lock;	/* sys_execve() acquires it LK_SHARED before calling check_exec() */
    166  1.130  jdolecek 
    167  1.138     lukem static void link_es(struct execsw_entry **, const struct execsw *);	/* NOTE(review): definition is not in the visible part of the file */
    168  1.130  jdolecek #endif /* LKM */
    169  1.130  jdolecek 
    170  1.130  jdolecek /*
    171   1.55       cgd  * check exec:
    172   1.55       cgd  * given an "executable" described in the exec package's namei info,
    173   1.55       cgd  * see what we can do with it.
    174   1.55       cgd  *
    175   1.55       cgd  * ON ENTRY:
    176   1.55       cgd  *	exec package with appropriate namei info
    177   1.55       cgd  *	proc pointer of exec'ing proc
    178  1.160     blymn  *      iff verified exec enabled then flag indicating a direct exec or
    179  1.160     blymn  *        an indirect exec (i.e. for a shell script interpreter)
    180   1.55       cgd  *	NO SELF-LOCKED VNODES
    181   1.55       cgd  *
    182   1.55       cgd  * ON EXIT:
    183   1.55       cgd  *	error:	nothing held, etc.  exec header still allocated.
    184   1.77       cgd  *	ok:	filled exec package, executable's vnode (unlocked).
    185   1.55       cgd  *
    186   1.55       cgd  * EXEC SWITCH ENTRY:
    187   1.55       cgd  * 	Locked vnode to check, exec package, proc.
    188   1.55       cgd  *
    189   1.55       cgd  * EXEC SWITCH EXIT:
    190   1.77       cgd  *	ok:	return 0, filled exec package, executable's vnode (unlocked).
    191   1.55       cgd  *	error:	destructive:
    192   1.55       cgd  *			everything deallocated execept exec header.
    193   1.76       cgd  *		non-destructive:
    194   1.77       cgd  *			error code, executable's vnode (unlocked),
    195   1.76       cgd  *			exec header unmodified.
    196   1.55       cgd  */
    197   1.55       cgd int
    198  1.160     blymn #ifdef VERIFIED_EXEC
    199  1.160     blymn check_exec(struct proc *p, struct exec_package *epp, int direct_exec)
    200  1.160     blymn #else
    201  1.118   thorpej check_exec(struct proc *p, struct exec_package *epp)
    202  1.160     blymn #endif
    203   1.55       cgd {
    204  1.138     lukem 	int		error, i;
    205  1.138     lukem 	struct vnode	*vp;
    206   1.55       cgd 	struct nameidata *ndp;
    207  1.138     lukem 	size_t		resid;
    208   1.55       cgd 
    209   1.55       cgd 	ndp = epp->ep_ndp;
    210   1.55       cgd 	ndp->ni_cnd.cn_nameiop = LOOKUP;
    211   1.55       cgd 	ndp->ni_cnd.cn_flags = FOLLOW | LOCKLEAF | SAVENAME;
    212   1.55       cgd 	/* first get the vnode */
    213   1.74  christos 	if ((error = namei(ndp)) != 0)
    214   1.55       cgd 		return error;
    215   1.55       cgd 	epp->ep_vp = vp = ndp->ni_vp;
    216   1.55       cgd 
    217   1.84   mycroft 	/* check access and type */
    218   1.55       cgd 	if (vp->v_type != VREG) {
    219   1.81    kleink 		error = EACCES;
    220   1.55       cgd 		goto bad1;
    221   1.55       cgd 	}
    222   1.84   mycroft 	if ((error = VOP_ACCESS(vp, VEXEC, p->p_ucred, p)) != 0)
    223   1.84   mycroft 		goto bad1;
    224   1.55       cgd 
    225   1.55       cgd 	/* get attributes */
    226   1.74  christos 	if ((error = VOP_GETATTR(vp, epp->ep_vap, p->p_ucred, p)) != 0)
    227   1.55       cgd 		goto bad1;
    228   1.55       cgd 
    229   1.55       cgd 	/* Check mount point */
    230   1.55       cgd 	if (vp->v_mount->mnt_flag & MNT_NOEXEC) {
    231   1.55       cgd 		error = EACCES;
    232   1.55       cgd 		goto bad1;
    233   1.55       cgd 	}
    234  1.141   thorpej 	if (vp->v_mount->mnt_flag & MNT_NOSUID)
    235   1.83   mycroft 		epp->ep_vap->va_mode &= ~(S_ISUID | S_ISGID);
    236   1.55       cgd 
    237   1.55       cgd 	/* try to open it */
    238   1.74  christos 	if ((error = VOP_OPEN(vp, FREAD, p->p_ucred, p)) != 0)
    239   1.55       cgd 		goto bad1;
    240   1.55       cgd 
    241   1.99  wrstuden 	/* unlock vp, since we need it unlocked from here on out. */
    242   1.90      fvdl 	VOP_UNLOCK(vp, 0);
    243   1.77       cgd 
    244  1.160     blymn 
    245  1.160     blymn #ifdef VERIFIED_EXEC
    246  1.160     blymn         /* Evaluate signature for file... */
    247  1.160     blymn         if ((error = check_veriexec(p, vp, epp, direct_exec)) != 0)
    248  1.160     blymn                 goto bad2;
    249  1.160     blymn #endif
    250  1.160     blymn 
    251   1.55       cgd 	/* now we have the file, get the exec header */
    252  1.125       chs 	uvn_attach(vp, VM_PROT_READ);
    253   1.74  christos 	error = vn_rdwr(UIO_READ, vp, epp->ep_hdr, epp->ep_hdrlen, 0,
    254   1.77       cgd 			UIO_SYSSPACE, 0, p->p_ucred, &resid, p);
    255   1.74  christos 	if (error)
    256   1.55       cgd 		goto bad2;
    257   1.55       cgd 	epp->ep_hdrvalid = epp->ep_hdrlen - resid;
    258   1.55       cgd 
    259   1.55       cgd 	/*
    260  1.136       eeh 	 * Set up default address space limits.  Can be overridden
    261  1.136       eeh 	 * by individual exec packages.
    262  1.136       eeh 	 *
    263  1.136       eeh 	 * XXX probably shoul be all done in the exec pakages.
    264  1.136       eeh 	 */
    265  1.136       eeh 	epp->ep_vm_minaddr = VM_MIN_ADDRESS;
    266  1.136       eeh 	epp->ep_vm_maxaddr = VM_MAXUSER_ADDRESS;
    267  1.136       eeh 	/*
    268   1.55       cgd 	 * set up the vmcmds for creation of the process
    269   1.55       cgd 	 * address space
    270   1.55       cgd 	 */
    271   1.55       cgd 	error = ENOEXEC;
    272   1.55       cgd 	for (i = 0; i < nexecs && error != 0; i++) {
    273   1.68       cgd 		int newerror;
    274   1.68       cgd 
    275  1.130  jdolecek 		epp->ep_esch = execsw[i];
    276  1.130  jdolecek 		newerror = (*execsw[i]->es_check)(p, epp);
    277   1.68       cgd 		/* make sure the first "interesting" error code is saved. */
    278   1.68       cgd 		if (!newerror || error == ENOEXEC)
    279   1.68       cgd 			error = newerror;
    280  1.124  jdolecek 
    281  1.124  jdolecek 		/* if es_check call was successful, update epp->ep_es */
    282  1.124  jdolecek 		if (!newerror && (epp->ep_flags & EXEC_HASES) == 0)
    283  1.130  jdolecek 			epp->ep_es = execsw[i];
    284  1.124  jdolecek 
    285   1.55       cgd 		if (epp->ep_flags & EXEC_DESTR && error != 0)
    286   1.55       cgd 			return error;
    287   1.55       cgd 	}
    288   1.55       cgd 	if (!error) {
    289   1.55       cgd 		/* check that entry point is sane */
    290   1.55       cgd 		if (epp->ep_entry > VM_MAXUSER_ADDRESS)
    291   1.55       cgd 			error = ENOEXEC;
    292   1.55       cgd 
    293   1.55       cgd 		/* check limits */
    294   1.55       cgd 		if ((epp->ep_tsize > MAXTSIZ) ||
    295  1.153   thorpej 		    (epp->ep_dsize >
    296  1.153   thorpej 		     (u_quad_t)p->p_rlimit[RLIMIT_DATA].rlim_cur))
    297   1.55       cgd 			error = ENOMEM;
    298   1.55       cgd 
    299   1.55       cgd 		if (!error)
    300   1.55       cgd 			return (0);
    301   1.55       cgd 	}
    302   1.55       cgd 
    303   1.55       cgd 	/*
    304   1.55       cgd 	 * free any vmspace-creation commands,
    305   1.55       cgd 	 * and release their references
    306   1.55       cgd 	 */
    307   1.55       cgd 	kill_vmcmds(&epp->ep_vmcmds);
    308   1.55       cgd 
    309   1.55       cgd bad2:
    310   1.55       cgd 	/*
    311   1.99  wrstuden 	 * close and release the vnode, restore the old one, free the
    312   1.55       cgd 	 * pathname buf, and punt.
    313   1.55       cgd 	 */
    314   1.99  wrstuden 	vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
    315   1.77       cgd 	VOP_CLOSE(vp, FREAD, p->p_ucred, p);
    316   1.99  wrstuden 	vput(vp);
    317  1.120   thorpej 	PNBUF_PUT(ndp->ni_cnd.cn_pnbuf);
    318   1.55       cgd 	return error;
    319   1.55       cgd 
    320   1.55       cgd bad1:
    321   1.55       cgd 	/*
    322   1.55       cgd 	 * free the namei pathname buffer, and put the vnode
    323   1.55       cgd 	 * (which we don't yet have open).
    324   1.55       cgd 	 */
    325   1.77       cgd 	vput(vp);				/* was still locked */
    326  1.120   thorpej 	PNBUF_PUT(ndp->ni_cnd.cn_pnbuf);
    327   1.55       cgd 	return error;
    328   1.55       cgd }
    329   1.55       cgd 
    330   1.55       cgd /*
    331   1.55       cgd  * exec system call
    332   1.55       cgd  */
    333   1.55       cgd /* ARGSUSED */
    334   1.75  christos int
    335  1.118   thorpej sys_execve(struct proc *p, void *v, register_t *retval)
    336   1.71   thorpej {
    337  1.108  augustss 	struct sys_execve_args /* {
    338  1.138     lukem 		syscallarg(const char *)	path;
    339  1.138     lukem 		syscallarg(char * const *)	argp;
    340  1.138     lukem 		syscallarg(char * const *)	envp;
    341   1.71   thorpej 	} */ *uap = v;
    342  1.153   thorpej 	int			error;
    343  1.153   thorpej 	u_int			i;
    344  1.138     lukem 	struct exec_package	pack;
    345  1.138     lukem 	struct nameidata	nid;
    346  1.138     lukem 	struct vattr		attr;
    347  1.138     lukem 	struct ucred		*cred;
    348  1.138     lukem 	char			*argp;
    349  1.138     lukem 	char * const		*cpp;
    350  1.138     lukem 	char			*dp, *sp;
    351  1.138     lukem 	long			argc, envc;
    352  1.138     lukem 	size_t			len;
    353  1.138     lukem 	char			*stack;
    354  1.138     lukem 	struct ps_strings	arginfo;
    355  1.138     lukem 	struct vmspace		*vm;
    356  1.138     lukem 	char			**tmpfap;
    357  1.138     lukem 	int			szsigcode;
    358  1.138     lukem 	struct exec_vmcmd	*base_vcp;
    359   1.55       cgd 
    360  1.149  christos 	/*
    361  1.149  christos 	 * Lock the process and set the P_INEXEC flag to indicate that
    362  1.149  christos 	 * it should be left alone until we're done here.  This is
    363  1.149  christos 	 * necessary to avoid race conditions - e.g. in ptrace() -
    364  1.149  christos 	 * that might allow a local user to illicitly obtain elevated
    365  1.149  christos 	 * privileges.
    366  1.149  christos 	 */
    367  1.149  christos 	p->p_flag |= P_INEXEC;
    368  1.149  christos 
    369  1.138     lukem 	cred = p->p_ucred;
    370  1.138     lukem 	base_vcp = NULL;
    371   1.55       cgd 	/*
    372  1.129  jdolecek 	 * Init the namei data to point the file user's program name.
    373  1.129  jdolecek 	 * This is done here rather than in check_exec(), so that it's
    374  1.129  jdolecek 	 * possible to override this settings if any of makecmd/probe
    375  1.129  jdolecek 	 * functions call check_exec() recursively - for example,
    376  1.129  jdolecek 	 * see exec_script_makecmds().
    377  1.129  jdolecek 	 */
    378   1.56       cgd 	NDINIT(&nid, LOOKUP, NOFOLLOW, UIO_USERSPACE, SCARG(uap, path), p);
    379   1.55       cgd 
    380   1.55       cgd 	/*
    381   1.55       cgd 	 * initialize the fields of the exec package.
    382   1.55       cgd 	 */
    383   1.56       cgd 	pack.ep_name = SCARG(uap, path);
    384  1.119   thorpej 	pack.ep_hdr = malloc(exec_maxhdrsz, M_EXEC, M_WAITOK);
    385   1.55       cgd 	pack.ep_hdrlen = exec_maxhdrsz;
    386   1.55       cgd 	pack.ep_hdrvalid = 0;
    387   1.55       cgd 	pack.ep_ndp = &nid;
    388   1.67  christos 	pack.ep_emul_arg = NULL;
    389   1.55       cgd 	pack.ep_vmcmds.evs_cnt = 0;
    390   1.55       cgd 	pack.ep_vmcmds.evs_used = 0;
    391   1.55       cgd 	pack.ep_vap = &attr;
    392   1.55       cgd 	pack.ep_flags = 0;
    393   1.55       cgd 
    394  1.147  jdolecek #ifdef LKM
    395  1.130  jdolecek 	lockmgr(&exec_lock, LK_SHARED, NULL);
    396  1.147  jdolecek #endif
    397  1.130  jdolecek 
    398   1.55       cgd 	/* see if we can run it. */
    399  1.160     blymn #ifdef VERIFIED_EXEC
    400  1.160     blymn         if ((error = check_exec(p, &pack, 1)) != 0)
    401  1.160     blymn         //if ((error = check_exec(p, &pack, 0)) != 0)
    402  1.160     blymn #else
    403  1.160     blymn         if ((error = check_exec(p, &pack)) != 0)
    404  1.160     blymn #endif
    405   1.55       cgd 		goto freehdr;
    406   1.55       cgd 
    407   1.55       cgd 	/* XXX -- THE FOLLOWING SECTION NEEDS MAJOR CLEANUP */
    408   1.55       cgd 
    409   1.55       cgd 	/* allocate an argument buffer */
    410   1.88       mrg 	argp = (char *) uvm_km_valloc_wait(exec_map, NCARGS);
    411   1.55       cgd #ifdef DIAGNOSTIC
    412   1.95       eeh 	if (argp == (vaddr_t) 0)
    413   1.55       cgd 		panic("execve: argp == NULL");
    414   1.55       cgd #endif
    415   1.55       cgd 	dp = argp;
    416   1.55       cgd 	argc = 0;
    417   1.55       cgd 
    418   1.55       cgd 	/* copy the fake args list, if there's one, freeing it as we go */
    419   1.55       cgd 	if (pack.ep_flags & EXEC_HASARGL) {
    420   1.55       cgd 		tmpfap = pack.ep_fa;
    421   1.55       cgd 		while (*tmpfap != NULL) {
    422   1.55       cgd 			char *cp;
    423   1.55       cgd 
    424   1.55       cgd 			cp = *tmpfap;
    425   1.55       cgd 			while (*cp)
    426   1.55       cgd 				*dp++ = *cp++;
    427   1.74  christos 			dp++;
    428   1.55       cgd 
    429   1.55       cgd 			FREE(*tmpfap, M_EXEC);
    430   1.55       cgd 			tmpfap++; argc++;
    431   1.55       cgd 		}
    432   1.55       cgd 		FREE(pack.ep_fa, M_EXEC);
    433   1.55       cgd 		pack.ep_flags &= ~EXEC_HASARGL;
    434   1.55       cgd 	}
    435   1.55       cgd 
    436   1.55       cgd 	/* Now get argv & environment */
    437   1.56       cgd 	if (!(cpp = SCARG(uap, argp))) {
    438   1.55       cgd 		error = EINVAL;
    439   1.55       cgd 		goto bad;
    440   1.55       cgd 	}
    441   1.55       cgd 
    442   1.55       cgd 	if (pack.ep_flags & EXEC_SKIPARG)
    443   1.55       cgd 		cpp++;
    444   1.55       cgd 
    445   1.55       cgd 	while (1) {
    446   1.55       cgd 		len = argp + ARG_MAX - dp;
    447   1.74  christos 		if ((error = copyin(cpp, &sp, sizeof(sp))) != 0)
    448   1.55       cgd 			goto bad;
    449   1.55       cgd 		if (!sp)
    450   1.55       cgd 			break;
    451   1.74  christos 		if ((error = copyinstr(sp, dp, len, &len)) != 0) {
    452   1.55       cgd 			if (error == ENAMETOOLONG)
    453   1.55       cgd 				error = E2BIG;
    454   1.55       cgd 			goto bad;
    455   1.55       cgd 		}
    456   1.55       cgd 		dp += len;
    457   1.55       cgd 		cpp++;
    458   1.55       cgd 		argc++;
    459   1.55       cgd 	}
    460   1.55       cgd 
    461   1.55       cgd 	envc = 0;
    462   1.74  christos 	/* environment need not be there */
    463   1.74  christos 	if ((cpp = SCARG(uap, envp)) != NULL ) {
    464   1.55       cgd 		while (1) {
    465   1.55       cgd 			len = argp + ARG_MAX - dp;
    466   1.74  christos 			if ((error = copyin(cpp, &sp, sizeof(sp))) != 0)
    467   1.55       cgd 				goto bad;
    468   1.55       cgd 			if (!sp)
    469   1.55       cgd 				break;
    470   1.74  christos 			if ((error = copyinstr(sp, dp, len, &len)) != 0) {
    471   1.55       cgd 				if (error == ENAMETOOLONG)
    472   1.55       cgd 					error = E2BIG;
    473   1.55       cgd 				goto bad;
    474   1.55       cgd 			}
    475   1.55       cgd 			dp += len;
    476   1.55       cgd 			cpp++;
    477   1.55       cgd 			envc++;
    478   1.55       cgd 		}
    479   1.55       cgd 	}
    480   1.61   mycroft 
    481   1.61   mycroft 	dp = (char *) ALIGN(dp);
    482   1.55       cgd 
    483  1.126       mrg 	szsigcode = pack.ep_es->es_emul->e_esigcode -
    484  1.126       mrg 	    pack.ep_es->es_emul->e_sigcode;
    485   1.65      fvdl 
    486   1.55       cgd 	/* Now check if args & environ fit into new stack */
    487  1.105       eeh 	if (pack.ep_flags & EXEC_32)
    488  1.126       mrg 		len = ((argc + envc + 2 + pack.ep_es->es_arglen) *
    489  1.126       mrg 		    sizeof(int) + sizeof(int) + dp + STACKGAPLEN +
    490  1.126       mrg 		    szsigcode + sizeof(struct ps_strings)) - argp;
    491  1.105       eeh 	else
    492  1.126       mrg 		len = ((argc + envc + 2 + pack.ep_es->es_arglen) *
    493  1.126       mrg 		    sizeof(char *) + sizeof(int) + dp + STACKGAPLEN +
    494  1.126       mrg 		    szsigcode + sizeof(struct ps_strings)) - argp;
    495   1.67  christos 
    496   1.55       cgd 	len = ALIGN(len);	/* make the stack "safely" aligned */
    497   1.55       cgd 
    498   1.55       cgd 	if (len > pack.ep_ssize) { /* in effect, compare to initial limit */
    499   1.55       cgd 		error = ENOMEM;
    500   1.55       cgd 		goto bad;
    501   1.55       cgd 	}
    502   1.55       cgd 
    503   1.55       cgd 	/* adjust "active stack depth" for process VSZ */
    504   1.55       cgd 	pack.ep_ssize = len;	/* maybe should go elsewhere, but... */
    505   1.55       cgd 
    506   1.86   thorpej 	/*
    507   1.86   thorpej 	 * Do whatever is necessary to prepare the address space
    508   1.86   thorpej 	 * for remapping.  Note that this might replace the current
    509   1.86   thorpej 	 * vmspace with another!
    510   1.86   thorpej 	 */
    511  1.136       eeh 	uvmspace_exec(p, pack.ep_vm_minaddr, pack.ep_vm_maxaddr);
    512   1.55       cgd 
    513   1.55       cgd 	/* Now map address space */
    514   1.86   thorpej 	vm = p->p_vmspace;
    515  1.158  junyoung 	vm->vm_taddr = (caddr_t) pack.ep_taddr;
    516   1.55       cgd 	vm->vm_tsize = btoc(pack.ep_tsize);
    517  1.158  junyoung 	vm->vm_daddr = (caddr_t) pack.ep_daddr;
    518   1.55       cgd 	vm->vm_dsize = btoc(pack.ep_dsize);
    519   1.55       cgd 	vm->vm_ssize = btoc(pack.ep_ssize);
    520  1.158  junyoung 	vm->vm_maxsaddr = (caddr_t) pack.ep_maxsaddr;
    521  1.158  junyoung 	vm->vm_minsaddr = (caddr_t) pack.ep_minsaddr;
    522   1.55       cgd 
    523   1.55       cgd 	/* create the new process's VM space by running the vmcmds */
    524   1.55       cgd #ifdef DIAGNOSTIC
    525   1.55       cgd 	if (pack.ep_vmcmds.evs_used == 0)
    526   1.55       cgd 		panic("execve: no vmcmds");
    527   1.55       cgd #endif
    528   1.55       cgd 	for (i = 0; i < pack.ep_vmcmds.evs_used && !error; i++) {
    529   1.55       cgd 		struct exec_vmcmd *vcp;
    530   1.55       cgd 
    531   1.55       cgd 		vcp = &pack.ep_vmcmds.evs_cmds[i];
    532  1.114      matt 		if (vcp->ev_flags & VMCMD_RELATIVE) {
    533  1.114      matt #ifdef DIAGNOSTIC
    534  1.114      matt 			if (base_vcp == NULL)
    535  1.114      matt 				panic("execve: relative vmcmd with no base");
    536  1.114      matt 			if (vcp->ev_flags & VMCMD_BASE)
    537  1.114      matt 				panic("execve: illegal base & relative vmcmd");
    538  1.114      matt #endif
    539  1.114      matt 			vcp->ev_addr += base_vcp->ev_addr;
    540  1.114      matt 		}
    541   1.55       cgd 		error = (*vcp->ev_proc)(p, vcp);
    542  1.143  christos #ifdef DEBUG_EXEC
    543  1.111      matt 		if (error) {
    544  1.143  christos 			int j;
    545  1.143  christos 			struct exec_vmcmd *vp = &pack.ep_vmcmds.evs_cmds[0];
    546  1.143  christos 			for (j = 0; j <= i; j++)
    547  1.143  christos 				uprintf(
    548  1.143  christos 			    "vmcmd[%d] = %#lx/%#lx fd@%#lx prot=0%o flags=%d\n",
    549  1.143  christos 				    j, vp[j].ev_addr, vp[j].ev_len,
    550  1.143  christos 				    vp[j].ev_offset, vp[j].ev_prot,
    551  1.143  christos 				    vp[j].ev_flags);
    552  1.111      matt 		}
    553  1.143  christos #endif /* DEBUG_EXEC */
    554  1.114      matt 		if (vcp->ev_flags & VMCMD_BASE)
    555  1.114      matt 			base_vcp = vcp;
    556   1.55       cgd 	}
    557   1.55       cgd 
    558   1.55       cgd 	/* free the vmspace-creation commands, and release their references */
    559   1.55       cgd 	kill_vmcmds(&pack.ep_vmcmds);
    560   1.55       cgd 
    561   1.55       cgd 	/* if an error happened, deallocate and punt */
    562  1.111      matt 	if (error) {
    563  1.143  christos 		DPRINTF(("execve: vmcmd %i failed: %d\n", i - 1, error));
    564   1.55       cgd 		goto exec_abort;
    565  1.111      matt 	}
    566   1.55       cgd 
    567   1.55       cgd 	/* remember information about the process */
    568   1.55       cgd 	arginfo.ps_nargvstr = argc;
    569   1.55       cgd 	arginfo.ps_nenvstr = envc;
    570   1.55       cgd 
    571  1.121       eeh 	stack = (char *) (vm->vm_minsaddr - len);
    572   1.55       cgd 	/* Now copy argc, args & environ to new stack */
    573  1.154  christos 	error = (*pack.ep_es->es_copyargs)(p, &pack, &arginfo, &stack, argp);
    574  1.144  christos 	if (error) {
    575  1.144  christos 		DPRINTF(("execve: copyargs failed %d\n", error));
    576   1.55       cgd 		goto exec_abort;
    577  1.111      matt 	}
    578  1.144  christos 	/* Move the stack back to original point */
    579  1.144  christos 	stack = (char *) (vm->vm_minsaddr - len);
    580   1.55       cgd 
    581  1.121       eeh 	/* fill process ps_strings info */
    582  1.121       eeh 	p->p_psstr = (struct ps_strings *)(vm->vm_minsaddr
    583  1.121       eeh 		- sizeof(struct ps_strings));
    584  1.121       eeh 	p->p_psargv = offsetof(struct ps_strings, ps_argvstr);
    585  1.121       eeh 	p->p_psnargv = offsetof(struct ps_strings, ps_nargvstr);
    586  1.121       eeh 	p->p_psenv = offsetof(struct ps_strings, ps_envstr);
    587  1.121       eeh 	p->p_psnenv = offsetof(struct ps_strings, ps_nenvstr);
    588  1.121       eeh 
    589   1.55       cgd 	/* copy out the process's ps_strings structure */
    590  1.144  christos 	if ((error = copyout(&arginfo, (char *)p->p_psstr,
    591  1.144  christos 	    sizeof(arginfo))) != 0) {
    592  1.143  christos 		DPRINTF(("execve: ps_strings copyout %p->%p size %ld failed\n",
    593  1.143  christos 		       &arginfo, (char *)p->p_psstr, (long)sizeof(arginfo)));
    594   1.55       cgd 		goto exec_abort;
    595  1.111      matt 	}
    596  1.109    simonb 
    597  1.158  junyoung 	/* copy out the process's signal trampoline code */
    598   1.96   mycroft 	if (szsigcode) {
    599  1.144  christos 		if ((error = copyout((char *)pack.ep_es->es_emul->e_sigcode,
    600  1.134  jdolecek 		    p->p_sigctx.ps_sigcode = (char *)p->p_psstr - szsigcode,
    601  1.144  christos 		    szsigcode)) != 0) {
    602  1.143  christos 			DPRINTF(("execve: sig trampoline copyout failed\n"));
    603   1.97    kleink 			goto exec_abort;
    604  1.111      matt 		}
    605  1.104        is #ifdef PMAP_NEED_PROCWR
    606  1.104        is 		/* This is code. Let the pmap do what is needed. */
    607  1.134  jdolecek 		pmap_procwr(p, (vaddr_t)p->p_sigctx.ps_sigcode, szsigcode);
    608  1.104        is #endif
    609   1.96   mycroft 	}
    610   1.55       cgd 
    611  1.102      ross 	stopprofclock(p);	/* stop profiling */
    612   1.55       cgd 	fdcloseexec(p);		/* handle close on exec */
    613   1.55       cgd 	execsigs(p);		/* reset catched signals */
    614   1.98    kleink 	p->p_ctxlink = NULL;	/* reset ucontext link */
    615   1.55       cgd 
    616   1.55       cgd 	/* set command name & other accounting info */
    617   1.55       cgd 	len = min(nid.ni_cnd.cn_namelen, MAXCOMLEN);
    618   1.94     perry 	memcpy(p->p_comm, nid.ni_cnd.cn_nameptr, len);
    619   1.55       cgd 	p->p_comm[len] = 0;
    620   1.55       cgd 	p->p_acflag &= ~AFORK;
    621   1.55       cgd 
    622   1.55       cgd 	/* record proc's vnode, for use by procfs and others */
    623   1.55       cgd         if (p->p_textvp)
    624   1.55       cgd                 vrele(p->p_textvp);
    625   1.55       cgd 	VREF(pack.ep_vp);
    626   1.55       cgd 	p->p_textvp = pack.ep_vp;
    627   1.55       cgd 
    628   1.55       cgd 	p->p_flag |= P_EXEC;
    629   1.55       cgd 	if (p->p_flag & P_PPWAIT) {
    630   1.55       cgd 		p->p_flag &= ~P_PPWAIT;
    631   1.55       cgd 		wakeup((caddr_t) p->p_pptr);
    632   1.55       cgd 	}
    633   1.55       cgd 
    634   1.55       cgd 	/*
    635   1.55       cgd 	 * deal with set[ug]id.
    636  1.141   thorpej 	 * MNT_NOSUID has already been used to disable s[ug]id.
    637   1.55       cgd 	 */
    638  1.141   thorpej 	if ((p->p_flag & P_TRACED) == 0 &&
    639  1.141   thorpej 
    640  1.141   thorpej 	    (((attr.va_mode & S_ISUID) != 0 &&
    641  1.141   thorpej 	      p->p_ucred->cr_uid != attr.va_uid) ||
    642  1.141   thorpej 
    643  1.141   thorpej 	     ((attr.va_mode & S_ISGID) != 0 &&
    644  1.141   thorpej 	      p->p_ucred->cr_gid != attr.va_gid))) {
    645  1.141   thorpej 		/*
    646  1.141   thorpej 		 * Mark the process as SUGID before we do
    647  1.141   thorpej 		 * anything that might block.
    648  1.141   thorpej 		 */
    649  1.141   thorpej 		p_sugid(p);
    650  1.152  christos 
    651  1.152  christos 		/* Make sure file descriptors 0..2 are in use. */
    652  1.152  christos 		if ((error = fdcheckstd(p)) != 0)
    653  1.152  christos 			goto exec_abort;
    654  1.141   thorpej 
    655   1.55       cgd 		p->p_ucred = crcopy(cred);
    656   1.55       cgd #ifdef KTRACE
    657   1.55       cgd 		/*
    658   1.55       cgd 		 * If process is being ktraced, turn off - unless
    659   1.55       cgd 		 * root set it.
    660   1.55       cgd 		 */
    661   1.91  christos 		if (p->p_tracep && !(p->p_traceflag & KTRFAC_ROOT))
    662   1.91  christos 			ktrderef(p);
    663   1.55       cgd #endif
    664   1.83   mycroft 		if (attr.va_mode & S_ISUID)
    665   1.55       cgd 			p->p_ucred->cr_uid = attr.va_uid;
    666   1.83   mycroft 		if (attr.va_mode & S_ISGID)
    667   1.55       cgd 			p->p_ucred->cr_gid = attr.va_gid;
    668   1.79       mrg 	} else
    669   1.79       mrg 		p->p_flag &= ~P_SUGID;
    670   1.55       cgd 	p->p_cred->p_svuid = p->p_ucred->cr_uid;
    671   1.55       cgd 	p->p_cred->p_svgid = p->p_ucred->cr_gid;
    672  1.155  gmcgarry 
    673  1.155  gmcgarry #if defined(__HAVE_RAS)
    674  1.155  gmcgarry 	/*
    675  1.155  gmcgarry 	 * Remove all RASs from the address space.
    676  1.155  gmcgarry 	 */
    677  1.155  gmcgarry 	ras_purgeall(p);
    678  1.155  gmcgarry #endif
    679  1.107      fvdl 
    680  1.107      fvdl 	doexechooks(p);
    681   1.55       cgd 
    682   1.95       eeh 	uvm_km_free_wakeup(exec_map, (vaddr_t) argp, NCARGS);
    683   1.55       cgd 
    684  1.120   thorpej 	PNBUF_PUT(nid.ni_cnd.cn_pnbuf);
    685   1.99  wrstuden 	vn_lock(pack.ep_vp, LK_EXCLUSIVE | LK_RETRY);
    686   1.55       cgd 	VOP_CLOSE(pack.ep_vp, FREAD, cred, p);
    687   1.99  wrstuden 	vput(pack.ep_vp);
    688  1.159  jdolecek 
    689  1.159  jdolecek 	/* notify others that we exec'd */
    690  1.159  jdolecek 	KNOTE(&p->p_klist, NOTE_EXEC);
    691   1.55       cgd 
    692   1.55       cgd 	/* setup new registers and do misc. setup. */
    693  1.145  jdolecek 	(*pack.ep_es->es_emul->e_setregs)(p, &pack, (u_long) stack);
    694  1.145  jdolecek 	if (pack.ep_es->es_setregs)
    695  1.145  jdolecek 		(*pack.ep_es->es_setregs)(p, &pack, (u_long) stack);
    696   1.55       cgd 
    697   1.55       cgd 	if (p->p_flag & P_TRACED)
    698   1.55       cgd 		psignal(p, SIGTRAP);
    699   1.55       cgd 
    700  1.122  jdolecek 	free(pack.ep_hdr, M_EXEC);
    701  1.122  jdolecek 
    702  1.122  jdolecek 	/*
    703  1.122  jdolecek 	 * Call emulation specific exec hook. This can setup setup per-process
    704  1.122  jdolecek 	 * p->p_emuldata or do any other per-process stuff an emulation needs.
    705  1.122  jdolecek 	 *
    706  1.122  jdolecek 	 * If we are executing process of different emulation than the
    707  1.122  jdolecek 	 * original forked process, call e_proc_exit() of the old emulation
    708  1.122  jdolecek 	 * first, then e_proc_exec() of new emulation. If the emulation is
    709  1.122  jdolecek 	 * same, the exec hook code should deallocate any old emulation
    710  1.122  jdolecek 	 * resources held previously by this process.
    711  1.122  jdolecek 	 */
    712  1.124  jdolecek 	if (p->p_emul && p->p_emul->e_proc_exit
    713  1.124  jdolecek 	    && p->p_emul != pack.ep_es->es_emul)
    714  1.122  jdolecek 		(*p->p_emul->e_proc_exit)(p);
    715  1.122  jdolecek 
    716  1.123  jdolecek 	/*
    717  1.123  jdolecek 	 * Call exec hook. Emulation code may NOT store reference to anything
    718  1.123  jdolecek 	 * from &pack.
    719  1.123  jdolecek 	 */
    720  1.124  jdolecek         if (pack.ep_es->es_emul->e_proc_exec)
    721  1.124  jdolecek                 (*pack.ep_es->es_emul->e_proc_exec)(p, &pack);
    722  1.122  jdolecek 
    723  1.122  jdolecek 	/* update p_emul, the old value is no longer needed */
    724  1.124  jdolecek 	p->p_emul = pack.ep_es->es_emul;
    725  1.148   thorpej 
    726  1.148   thorpej 	/* ...and the same for p_execsw */
    727  1.148   thorpej 	p->p_execsw = pack.ep_es;
    728  1.148   thorpej 
    729  1.133   mycroft #ifdef __HAVE_SYSCALL_INTERN
    730  1.133   mycroft 	(*p->p_emul->e_syscall_intern)(p);
    731  1.133   mycroft #endif
    732   1.70  christos #ifdef KTRACE
    733   1.70  christos 	if (KTRPOINT(p, KTR_EMUL))
    734  1.110  sommerfe 		ktremul(p);
    735   1.70  christos #endif
    736   1.85   mycroft 
    737  1.147  jdolecek #ifdef LKM
    738  1.130  jdolecek 	lockmgr(&exec_lock, LK_RELEASE, NULL);
    739  1.147  jdolecek #endif
    740  1.149  christos 	p->p_flag &= ~P_INEXEC;
    741  1.162      manu 
    742  1.162      manu 	if (p->p_flag & P_STOPEXEC) {
    743  1.162      manu 		int s;
    744  1.162      manu 
    745  1.162      manu 		sigminusset(&contsigmask, &p->p_sigctx.ps_siglist);
    746  1.162      manu 		SCHED_LOCK(s);
    747  1.162      manu 		p->p_stat = SSTOP;
    748  1.162      manu 		mi_switch(p, NULL);
    749  1.162      manu 		SCHED_ASSERT_UNLOCKED();
    750  1.162      manu 		splx(s);
    751  1.162      manu 	}
    752  1.162      manu 
    753   1.85   mycroft 	return (EJUSTRETURN);
    754   1.55       cgd 
    755  1.138     lukem  bad:
    756  1.149  christos 	p->p_flag &= ~P_INEXEC;
    757   1.55       cgd 	/* free the vmspace-creation commands, and release their references */
    758   1.55       cgd 	kill_vmcmds(&pack.ep_vmcmds);
    759   1.55       cgd 	/* kill any opened file descriptor, if necessary */
    760   1.55       cgd 	if (pack.ep_flags & EXEC_HASFD) {
    761   1.55       cgd 		pack.ep_flags &= ~EXEC_HASFD;
    762   1.66   mycroft 		(void) fdrelease(p, pack.ep_fd);
    763   1.55       cgd 	}
    764   1.55       cgd 	/* close and put the exec'd file */
    765   1.99  wrstuden 	vn_lock(pack.ep_vp, LK_EXCLUSIVE | LK_RETRY);
    766   1.55       cgd 	VOP_CLOSE(pack.ep_vp, FREAD, cred, p);
    767   1.99  wrstuden 	vput(pack.ep_vp);
    768  1.120   thorpej 	PNBUF_PUT(nid.ni_cnd.cn_pnbuf);
    769   1.95       eeh 	uvm_km_free_wakeup(exec_map, (vaddr_t) argp, NCARGS);
    770   1.55       cgd 
    771  1.138     lukem  freehdr:
    772  1.150  christos 	p->p_flag &= ~P_INEXEC;
    773  1.147  jdolecek #ifdef LKM
    774  1.130  jdolecek 	lockmgr(&exec_lock, LK_RELEASE, NULL);
    775  1.147  jdolecek #endif
    776  1.130  jdolecek 
    777  1.119   thorpej 	free(pack.ep_hdr, M_EXEC);
    778   1.55       cgd 	return error;
    779   1.55       cgd 
    780  1.138     lukem  exec_abort:
    781  1.150  christos 	p->p_flag &= ~P_INEXEC;
    782  1.147  jdolecek #ifdef LKM
    783  1.130  jdolecek 	lockmgr(&exec_lock, LK_RELEASE, NULL);
    784  1.147  jdolecek #endif
    785  1.130  jdolecek 
    786   1.55       cgd 	/*
    787   1.55       cgd 	 * the old process doesn't exist anymore.  exit gracefully.
    788   1.55       cgd 	 * get rid of the (new) address space we have created, if any, get rid
    789   1.55       cgd 	 * of our namei data and vnode, and exit noting failure
    790   1.55       cgd 	 */
    791   1.88       mrg 	uvm_deallocate(&vm->vm_map, VM_MIN_ADDRESS,
    792   1.88       mrg 		VM_MAXUSER_ADDRESS - VM_MIN_ADDRESS);
    793   1.73   mycroft 	if (pack.ep_emul_arg)
    794  1.124  jdolecek 		FREE(pack.ep_emul_arg, M_TEMP);
    795  1.120   thorpej 	PNBUF_PUT(nid.ni_cnd.cn_pnbuf);
    796   1.99  wrstuden 	vn_lock(pack.ep_vp, LK_EXCLUSIVE | LK_RETRY);
    797   1.55       cgd 	VOP_CLOSE(pack.ep_vp, FREAD, cred, p);
    798   1.99  wrstuden 	vput(pack.ep_vp);
    799   1.95       eeh 	uvm_km_free_wakeup(exec_map, (vaddr_t) argp, NCARGS);
    800  1.119   thorpej 	free(pack.ep_hdr, M_EXEC);
    801  1.144  christos 	exit1(p, W_EXITCODE(error, SIGABRT));
    802   1.55       cgd 
    803   1.55       cgd 	/* NOTREACHED */
    804   1.55       cgd 	return 0;
    805   1.67  christos }
    806   1.67  christos 
    807   1.67  christos 
    808  1.144  christos int
    809  1.154  christos copyargs(struct proc *p, struct exec_package *pack, struct ps_strings *arginfo,
    810  1.144  christos     char **stackp, void *argp)
    811   1.67  christos {
    812  1.138     lukem 	char	**cpp, *dp, *sp;
    813  1.138     lukem 	size_t	len;
    814  1.138     lukem 	void	*nullp;
    815  1.138     lukem 	long	argc, envc;
    816  1.144  christos 	int	error;
    817  1.138     lukem 
    818  1.144  christos 	cpp = (char **)*stackp;
    819  1.138     lukem 	nullp = NULL;
    820  1.138     lukem 	argc = arginfo->ps_nargvstr;
    821  1.138     lukem 	envc = arginfo->ps_nenvstr;
    822  1.144  christos 	if ((error = copyout(&argc, cpp++, sizeof(argc))) != 0)
    823  1.144  christos 		return error;
    824   1.67  christos 
    825  1.124  jdolecek 	dp = (char *) (cpp + argc + envc + 2 + pack->ep_es->es_arglen);
    826   1.67  christos 	sp = argp;
    827   1.67  christos 
    828   1.67  christos 	/* XXX don't copy them out, remap them! */
    829   1.69   mycroft 	arginfo->ps_argvstr = cpp; /* remember location of argv for later */
    830   1.67  christos 
    831   1.67  christos 	for (; --argc >= 0; sp += len, dp += len)
    832  1.144  christos 		if ((error = copyout(&dp, cpp++, sizeof(dp))) != 0 ||
    833  1.144  christos 		    (error = copyoutstr(sp, dp, ARG_MAX, &len)) != 0)
    834  1.144  christos 			return error;
    835   1.67  christos 
    836  1.144  christos 	if ((error = copyout(&nullp, cpp++, sizeof(nullp))) != 0)
    837  1.144  christos 		return error;
    838   1.67  christos 
    839   1.69   mycroft 	arginfo->ps_envstr = cpp; /* remember location of envp for later */
    840   1.67  christos 
    841   1.67  christos 	for (; --envc >= 0; sp += len, dp += len)
    842  1.144  christos 		if ((error = copyout(&dp, cpp++, sizeof(dp))) != 0 ||
    843  1.144  christos 		    (error = copyoutstr(sp, dp, ARG_MAX, &len)) != 0)
    844  1.144  christos 			return error;
    845   1.67  christos 
    846  1.144  christos 	if ((error = copyout(&nullp, cpp++, sizeof(nullp))) != 0)
    847  1.144  christos 		return error;
    848   1.67  christos 
    849  1.144  christos 	*stackp = (char *)cpp;
    850  1.144  christos 	return 0;
    851   1.55       cgd }
    852  1.130  jdolecek 
    853  1.130  jdolecek #ifdef LKM
    854  1.130  jdolecek /*
    855  1.130  jdolecek  * Find an emulation of given name in list of emulations.
    856  1.151  jdolecek  * Needs to be called with the exec_lock held.
    857  1.130  jdolecek  */
    858  1.151  jdolecek const struct emul *
    859  1.138     lukem emul_search(const char *name)
    860  1.130  jdolecek {
    861  1.130  jdolecek 	struct emul_entry *it;
    862  1.130  jdolecek 
    863  1.130  jdolecek 	LIST_FOREACH(it, &el_head, el_list) {
    864  1.130  jdolecek 		if (strcmp(name, it->el_emul->e_name) == 0)
    865  1.130  jdolecek 			return it->el_emul;
    866  1.130  jdolecek 	}
    867  1.130  jdolecek 
    868  1.130  jdolecek 	return NULL;
    869  1.130  jdolecek }
    870  1.130  jdolecek 
    871  1.130  jdolecek /*
    872  1.130  jdolecek  * Add an emulation to list, if it's not there already.
    873  1.130  jdolecek  */
    874  1.130  jdolecek int
    875  1.138     lukem emul_register(const struct emul *emul, int ro_entry)
    876  1.130  jdolecek {
    877  1.138     lukem 	struct emul_entry	*ee;
    878  1.138     lukem 	int			error;
    879  1.130  jdolecek 
    880  1.138     lukem 	error = 0;
    881  1.130  jdolecek 	lockmgr(&exec_lock, LK_SHARED, NULL);
    882  1.130  jdolecek 
    883  1.130  jdolecek 	if (emul_search(emul->e_name)) {
    884  1.130  jdolecek 		error = EEXIST;
    885  1.130  jdolecek 		goto out;
    886  1.130  jdolecek 	}
    887  1.130  jdolecek 
    888  1.130  jdolecek 	MALLOC(ee, struct emul_entry *, sizeof(struct emul_entry),
    889  1.130  jdolecek 		M_EXEC, M_WAITOK);
    890  1.130  jdolecek 	ee->el_emul = emul;
    891  1.130  jdolecek 	ee->ro_entry = ro_entry;
    892  1.130  jdolecek 	LIST_INSERT_HEAD(&el_head, ee, el_list);
    893  1.130  jdolecek 
    894  1.138     lukem  out:
    895  1.130  jdolecek 	lockmgr(&exec_lock, LK_RELEASE, NULL);
    896  1.130  jdolecek 	return error;
    897  1.130  jdolecek }
    898  1.130  jdolecek 
    899  1.130  jdolecek /*
    900  1.130  jdolecek  * Remove emulation with name 'name' from list of supported emulations.
    901  1.130  jdolecek  */
    902  1.130  jdolecek int
    903  1.138     lukem emul_unregister(const char *name)
    904  1.130  jdolecek {
    905  1.130  jdolecek 	const struct proclist_desc *pd;
    906  1.138     lukem 	struct emul_entry	*it;
    907  1.138     lukem 	int			i, error;
    908  1.138     lukem 	struct proc		*ptmp;
    909  1.130  jdolecek 
    910  1.138     lukem 	error = 0;
    911  1.130  jdolecek 	lockmgr(&exec_lock, LK_SHARED, NULL);
    912  1.130  jdolecek 
    913  1.130  jdolecek 	LIST_FOREACH(it, &el_head, el_list) {
    914  1.130  jdolecek 		if (strcmp(it->el_emul->e_name, name) == 0)
    915  1.130  jdolecek 			break;
    916  1.130  jdolecek 	}
    917  1.130  jdolecek 
    918  1.130  jdolecek 	if (!it) {
    919  1.130  jdolecek 		error = ENOENT;
    920  1.130  jdolecek 		goto out;
    921  1.130  jdolecek 	}
    922  1.130  jdolecek 
    923  1.130  jdolecek 	if (it->ro_entry) {
    924  1.130  jdolecek 		error = EBUSY;
    925  1.130  jdolecek 		goto out;
    926  1.130  jdolecek 	}
    927  1.130  jdolecek 
    928  1.130  jdolecek 	/* test if any execw[] entry is still using this */
    929  1.132  jdolecek 	for(i=0; i < nexecs; i++) {
    930  1.130  jdolecek 		if (execsw[i]->es_emul == it->el_emul) {
    931  1.130  jdolecek 			error = EBUSY;
    932  1.130  jdolecek 			goto out;
    933  1.130  jdolecek 		}
    934  1.130  jdolecek 	}
    935  1.130  jdolecek 
    936  1.130  jdolecek 	/*
    937  1.130  jdolecek 	 * Test if any process is running under this emulation - since
    938  1.130  jdolecek 	 * emul_unregister() is running quite sendomly, it's better
    939  1.130  jdolecek 	 * to do expensive check here than to use any locking.
    940  1.130  jdolecek 	 */
    941  1.130  jdolecek 	proclist_lock_read();
    942  1.130  jdolecek 	for (pd = proclists; pd->pd_list != NULL && !error; pd++) {
    943  1.130  jdolecek 		LIST_FOREACH(ptmp, pd->pd_list, p_list) {
    944  1.130  jdolecek 			if (ptmp->p_emul == it->el_emul) {
    945  1.130  jdolecek 				error = EBUSY;
    946  1.130  jdolecek 				break;
    947  1.130  jdolecek 			}
    948  1.130  jdolecek 		}
    949  1.130  jdolecek 	}
    950  1.130  jdolecek 	proclist_unlock_read();
    951  1.130  jdolecek 
    952  1.130  jdolecek 	if (error)
    953  1.130  jdolecek 		goto out;
    954  1.130  jdolecek 
    955  1.130  jdolecek 
    956  1.130  jdolecek 	/* entry is not used, remove it */
    957  1.130  jdolecek 	LIST_REMOVE(it, el_list);
    958  1.130  jdolecek 	FREE(it, M_EXEC);
    959  1.130  jdolecek 
    960  1.138     lukem  out:
    961  1.130  jdolecek 	lockmgr(&exec_lock, LK_RELEASE, NULL);
    962  1.130  jdolecek 	return error;
    963  1.130  jdolecek }
    964  1.130  jdolecek 
    965  1.130  jdolecek /*
    966  1.130  jdolecek  * Add execsw[] entry.
    967  1.130  jdolecek  */
    968  1.130  jdolecek int
    969  1.138     lukem exec_add(struct execsw *esp, const char *e_name)
    970  1.130  jdolecek {
    971  1.138     lukem 	struct exec_entry	*it;
    972  1.138     lukem 	int			error;
    973  1.130  jdolecek 
    974  1.138     lukem 	error = 0;
    975  1.130  jdolecek 	lockmgr(&exec_lock, LK_EXCLUSIVE, NULL);
    976  1.130  jdolecek 
    977  1.130  jdolecek 	if (!esp->es_emul) {
    978  1.130  jdolecek 		esp->es_emul = emul_search(e_name);
    979  1.130  jdolecek 		if (!esp->es_emul) {
    980  1.130  jdolecek 			error = ENOENT;
    981  1.130  jdolecek 			goto out;
    982  1.130  jdolecek 		}
    983  1.130  jdolecek 	}
    984  1.130  jdolecek 
    985  1.130  jdolecek 	LIST_FOREACH(it, &ex_head, ex_list) {
    986  1.130  jdolecek 		/* assume tuple (makecmds, probe_func, emulation) is unique */
    987  1.130  jdolecek 		if (it->es->es_check == esp->es_check
    988  1.130  jdolecek 		    && it->es->u.elf_probe_func == esp->u.elf_probe_func
    989  1.130  jdolecek 		    && it->es->es_emul == esp->es_emul) {
    990  1.130  jdolecek 			error = EEXIST;
    991  1.130  jdolecek 			goto out;
    992  1.130  jdolecek 		}
    993  1.130  jdolecek 	}
    994  1.130  jdolecek 
    995  1.130  jdolecek 	/* if we got here, the entry doesn't exist yet */
    996  1.130  jdolecek 	MALLOC(it, struct exec_entry *, sizeof(struct exec_entry),
    997  1.130  jdolecek 		M_EXEC, M_WAITOK);
    998  1.130  jdolecek 	it->es = esp;
    999  1.130  jdolecek 	LIST_INSERT_HEAD(&ex_head, it, ex_list);
   1000  1.130  jdolecek 
   1001  1.130  jdolecek 	/* update execsw[] */
   1002  1.130  jdolecek 	exec_init(0);
   1003  1.130  jdolecek 
   1004  1.138     lukem  out:
   1005  1.130  jdolecek 	lockmgr(&exec_lock, LK_RELEASE, NULL);
   1006  1.130  jdolecek 	return error;
   1007  1.130  jdolecek }
   1008  1.130  jdolecek 
   1009  1.130  jdolecek /*
   1010  1.130  jdolecek  * Remove execsw[] entry.
   1011  1.130  jdolecek  */
   1012  1.130  jdolecek int
   1013  1.138     lukem exec_remove(const struct execsw *esp)
   1014  1.130  jdolecek {
   1015  1.138     lukem 	struct exec_entry	*it;
   1016  1.138     lukem 	int			error;
   1017  1.130  jdolecek 
   1018  1.138     lukem 	error = 0;
   1019  1.130  jdolecek 	lockmgr(&exec_lock, LK_EXCLUSIVE, NULL);
   1020  1.130  jdolecek 
   1021  1.130  jdolecek 	LIST_FOREACH(it, &ex_head, ex_list) {
   1022  1.130  jdolecek 		/* assume tuple (makecmds, probe_func, emulation) is unique */
   1023  1.130  jdolecek 		if (it->es->es_check == esp->es_check
   1024  1.130  jdolecek 		    && it->es->u.elf_probe_func == esp->u.elf_probe_func
   1025  1.130  jdolecek 		    && it->es->es_emul == esp->es_emul)
   1026  1.130  jdolecek 			break;
   1027  1.130  jdolecek 	}
   1028  1.130  jdolecek 	if (!it) {
   1029  1.130  jdolecek 		error = ENOENT;
   1030  1.130  jdolecek 		goto out;
   1031  1.130  jdolecek 	}
   1032  1.130  jdolecek 
   1033  1.130  jdolecek 	/* remove item from list and free resources */
   1034  1.130  jdolecek 	LIST_REMOVE(it, ex_list);
   1035  1.130  jdolecek 	FREE(it, M_EXEC);
   1036  1.130  jdolecek 
   1037  1.130  jdolecek 	/* update execsw[] */
   1038  1.130  jdolecek 	exec_init(0);
   1039  1.130  jdolecek 
   1040  1.138     lukem  out:
   1041  1.130  jdolecek 	lockmgr(&exec_lock, LK_RELEASE, NULL);
   1042  1.130  jdolecek 	return error;
   1043  1.130  jdolecek }
   1044  1.130  jdolecek 
   1045  1.130  jdolecek static void
   1046  1.138     lukem link_es(struct execsw_entry **listp, const struct execsw *esp)
   1047  1.130  jdolecek {
   1048  1.130  jdolecek 	struct execsw_entry *et, *e1;
   1049  1.130  jdolecek 
   1050  1.130  jdolecek 	MALLOC(et, struct execsw_entry *, sizeof(struct execsw_entry),
   1051  1.130  jdolecek 			M_TEMP, M_WAITOK);
   1052  1.130  jdolecek 	et->next = NULL;
   1053  1.130  jdolecek 	et->es = esp;
   1054  1.130  jdolecek 	if (*listp == NULL) {
   1055  1.130  jdolecek 		*listp = et;
   1056  1.130  jdolecek 		return;
   1057  1.130  jdolecek 	}
   1058  1.130  jdolecek 
   1059  1.130  jdolecek 	switch(et->es->es_prio) {
   1060  1.130  jdolecek 	case EXECSW_PRIO_FIRST:
   1061  1.130  jdolecek 		/* put new entry as the first */
   1062  1.130  jdolecek 		et->next = *listp;
   1063  1.130  jdolecek 		*listp = et;
   1064  1.130  jdolecek 		break;
   1065  1.130  jdolecek 	case EXECSW_PRIO_ANY:
   1066  1.130  jdolecek 		/* put new entry after all *_FIRST and *_ANY entries */
   1067  1.130  jdolecek 		for(e1 = *listp; e1->next
   1068  1.130  jdolecek 			&& e1->next->es->es_prio != EXECSW_PRIO_LAST;
   1069  1.130  jdolecek 			e1 = e1->next);
   1070  1.130  jdolecek 		et->next = e1->next;
   1071  1.130  jdolecek 		e1->next = et;
   1072  1.130  jdolecek 		break;
   1073  1.130  jdolecek 	case EXECSW_PRIO_LAST:
   1074  1.130  jdolecek 		/* put new entry as the last one */
   1075  1.130  jdolecek 		for(e1 = *listp; e1->next; e1 = e1->next);
   1076  1.130  jdolecek 		e1->next = et;
   1077  1.130  jdolecek 		break;
   1078  1.130  jdolecek 	default:
   1079  1.130  jdolecek #ifdef DIAGNOSTIC
   1080  1.157    provos 		panic("execw[] entry with unknown priority %d found",
   1081  1.130  jdolecek 			et->es->es_prio);
   1082  1.130  jdolecek #endif
   1083  1.130  jdolecek 		break;
   1084  1.130  jdolecek 	}
   1085  1.130  jdolecek }
   1086  1.130  jdolecek 
   1087  1.130  jdolecek /*
   1088  1.130  jdolecek  * Initialize exec structures. If init_boot is true, also does necessary
   1089  1.130  jdolecek  * one-time initialization (it's called from main() that way).
   1090  1.147  jdolecek  * Once system is multiuser, this should be called with exec_lock held,
   1091  1.130  jdolecek  * i.e. via exec_{add|remove}().
   1092  1.130  jdolecek  */
   1093  1.130  jdolecek int
   1094  1.138     lukem exec_init(int init_boot)
   1095  1.130  jdolecek {
   1096  1.138     lukem 	const struct execsw	**new_es, * const *old_es;
   1097  1.138     lukem 	struct execsw_entry	*list, *e1;
   1098  1.138     lukem 	struct exec_entry	*e2;
   1099  1.138     lukem 	int			i, es_sz;
   1100  1.130  jdolecek 
   1101  1.130  jdolecek 	if (init_boot) {
   1102  1.130  jdolecek 		/* do one-time initializations */
   1103  1.130  jdolecek 		lockinit(&exec_lock, PWAIT, "execlck", 0, 0);
   1104  1.130  jdolecek 
   1105  1.130  jdolecek 		/* register compiled-in emulations */
   1106  1.130  jdolecek 		for(i=0; i < nexecs_builtin; i++) {
   1107  1.130  jdolecek 			if (execsw_builtin[i].es_emul)
   1108  1.130  jdolecek 				emul_register(execsw_builtin[i].es_emul, 1);
   1109  1.130  jdolecek 		}
   1110  1.130  jdolecek #ifdef DIAGNOSTIC
   1111  1.130  jdolecek 		if (i == 0)
   1112  1.157    provos 			panic("no emulations found in execsw_builtin[]");
   1113  1.130  jdolecek #endif
   1114  1.130  jdolecek 	}
   1115  1.130  jdolecek 
   1116  1.130  jdolecek 	/*
   1117  1.130  jdolecek 	 * Build execsw[] array from builtin entries and entries added
   1118  1.130  jdolecek 	 * at runtime.
   1119  1.130  jdolecek 	 */
   1120  1.130  jdolecek 	list = NULL;
   1121  1.130  jdolecek 	for(i=0; i < nexecs_builtin; i++)
   1122  1.130  jdolecek 		link_es(&list, &execsw_builtin[i]);
   1123  1.130  jdolecek 
   1124  1.130  jdolecek 	/* Add dynamically loaded entries */
   1125  1.130  jdolecek 	es_sz = nexecs_builtin;
   1126  1.130  jdolecek 	LIST_FOREACH(e2, &ex_head, ex_list) {
   1127  1.130  jdolecek 		link_es(&list, e2->es);
   1128  1.130  jdolecek 		es_sz++;
   1129  1.130  jdolecek 	}
   1130  1.130  jdolecek 
   1131  1.130  jdolecek 	/*
   1132  1.130  jdolecek 	 * Now that we have sorted all execw entries, create new execsw[]
   1133  1.130  jdolecek 	 * and free no longer needed memory in the process.
   1134  1.130  jdolecek 	 */
   1135  1.130  jdolecek 	new_es = malloc(es_sz * sizeof(struct execsw *), M_EXEC, M_WAITOK);
   1136  1.130  jdolecek 	for(i=0; list; i++) {
   1137  1.130  jdolecek 		new_es[i] = list->es;
   1138  1.130  jdolecek 		e1 = list->next;
   1139  1.130  jdolecek 		FREE(list, M_TEMP);
   1140  1.130  jdolecek 		list = e1;
   1141  1.130  jdolecek 	}
   1142  1.130  jdolecek 
   1143  1.130  jdolecek 	/*
   1144  1.130  jdolecek 	 * New execsw[] array built, now replace old execsw[] and free
   1145  1.130  jdolecek 	 * used memory.
   1146  1.130  jdolecek 	 */
   1147  1.130  jdolecek 	old_es = execsw;
   1148  1.130  jdolecek 	execsw = new_es;
   1149  1.130  jdolecek 	nexecs = es_sz;
   1150  1.130  jdolecek 	if (old_es)
   1151  1.130  jdolecek 		free((void *)old_es, M_EXEC);
   1152  1.130  jdolecek 
   1153  1.130  jdolecek 	/*
   1154  1.130  jdolecek 	 * Figure out the maximum size of an exec header.
   1155  1.130  jdolecek 	 */
   1156  1.130  jdolecek 	exec_maxhdrsz = 0;
   1157  1.130  jdolecek 	for (i = 0; i < nexecs; i++) {
   1158  1.130  jdolecek 		if (execsw[i]->es_hdrsz > exec_maxhdrsz)
   1159  1.130  jdolecek 			exec_maxhdrsz = execsw[i]->es_hdrsz;
   1160  1.130  jdolecek 	}
   1161  1.130  jdolecek 
   1162  1.130  jdolecek 	return 0;
   1163  1.130  jdolecek }
   1164  1.130  jdolecek #endif
   1165  1.130  jdolecek 
   1166  1.130  jdolecek #ifndef LKM
   1167  1.130  jdolecek /*
   1168  1.130  jdolecek  * Simplified exec_init() for kernels without LKMs. Only initialize
   1169  1.130  jdolecek  * exec_maxhdrsz and execsw[].
   1170  1.130  jdolecek  */
   1171  1.130  jdolecek int
   1172  1.138     lukem exec_init(int init_boot)
   1173  1.130  jdolecek {
   1174  1.130  jdolecek 	int i;
   1175  1.130  jdolecek 
   1176  1.130  jdolecek #ifdef DIAGNOSTIC
   1177  1.130  jdolecek 	if (!init_boot)
   1178  1.130  jdolecek 		panic("exec_init(): called with init_boot == 0");
   1179  1.130  jdolecek #endif
   1180  1.130  jdolecek 
   1181  1.130  jdolecek 	/* do one-time initializations */
   1182  1.130  jdolecek 	nexecs = nexecs_builtin;
   1183  1.130  jdolecek 	execsw = malloc(nexecs*sizeof(struct execsw *), M_EXEC, M_WAITOK);
   1184  1.130  jdolecek 
   1185  1.130  jdolecek 	/*
   1186  1.130  jdolecek 	 * Fill in execsw[] and figure out the maximum size of an exec header.
   1187  1.130  jdolecek 	 */
   1188  1.130  jdolecek 	exec_maxhdrsz = 0;
   1189  1.130  jdolecek 	for(i=0; i < nexecs; i++) {
   1190  1.130  jdolecek 		execsw[i] = &execsw_builtin[i];
   1191  1.130  jdolecek 		if (execsw_builtin[i].es_hdrsz > exec_maxhdrsz)
   1192  1.130  jdolecek 			exec_maxhdrsz = execsw_builtin[i].es_hdrsz;
   1193  1.130  jdolecek 	}
   1194  1.130  jdolecek 
   1195  1.130  jdolecek 	return 0;
   1196  1.130  jdolecek 
   1197  1.130  jdolecek }
   1198  1.130  jdolecek #endif /* !LKM */
   1199