Home | History | Annotate | Line # | Download | only in common
linux_exec.c revision 1.83.16.1
      1  1.83.16.1   gdamore /*	$NetBSD: linux_exec.c,v 1.83.16.1 2006/07/13 17:49:13 gdamore Exp $	*/
      2       1.29  christos 
      3       1.29  christos /*-
      4       1.44   mycroft  * Copyright (c) 1994, 1995, 1998, 2000 The NetBSD Foundation, Inc.
      5       1.29  christos  * All rights reserved.
      6       1.29  christos  *
      7       1.29  christos  * This code is derived from software contributed to The NetBSD Foundation
      8       1.33      fvdl  * by Christos Zoulas, Frank van der Linden, Eric Haszlakiewicz and
      9       1.33      fvdl  * Thor Lancelot Simon.
     10       1.29  christos  *
     11       1.29  christos  * Redistribution and use in source and binary forms, with or without
     12       1.29  christos  * modification, are permitted provided that the following conditions
     13       1.29  christos  * are met:
     14       1.29  christos  * 1. Redistributions of source code must retain the above copyright
     15       1.29  christos  *    notice, this list of conditions and the following disclaimer.
     16       1.29  christos  * 2. Redistributions in binary form must reproduce the above copyright
     17       1.29  christos  *    notice, this list of conditions and the following disclaimer in the
     18       1.29  christos  *    documentation and/or other materials provided with the distribution.
     19       1.29  christos  * 3. All advertising materials mentioning features or use of this software
     20       1.29  christos  *    must display the following acknowledgement:
     21       1.29  christos  *        This product includes software developed by the NetBSD
     22       1.29  christos  *        Foundation, Inc. and its contributors.
     23       1.29  christos  * 4. Neither the name of The NetBSD Foundation nor the names of its
     24       1.29  christos  *    contributors may be used to endorse or promote products derived
     25       1.29  christos  *    from this software without specific prior written permission.
     26       1.29  christos  *
     27       1.29  christos  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     28       1.29  christos  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     29       1.29  christos  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     30       1.29  christos  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     31       1.29  christos  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     32       1.29  christos  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     33       1.29  christos  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     34       1.29  christos  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     35       1.29  christos  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     36       1.29  christos  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     37       1.29  christos  * POSSIBILITY OF SUCH DAMAGE.
     38        1.1      fvdl  */
     39       1.54     lukem 
     40       1.54     lukem #include <sys/cdefs.h>
     41  1.83.16.1   gdamore __KERNEL_RCSID(0, "$NetBSD: linux_exec.c,v 1.83.16.1 2006/07/13 17:49:13 gdamore Exp $");
     42        1.1      fvdl 
     43        1.1      fvdl #include <sys/param.h>
     44        1.1      fvdl #include <sys/systm.h>
     45        1.1      fvdl #include <sys/kernel.h>
     46        1.1      fvdl #include <sys/proc.h>
     47        1.1      fvdl #include <sys/malloc.h>
     48        1.1      fvdl #include <sys/namei.h>
     49        1.1      fvdl #include <sys/vnode.h>
     50       1.13  christos #include <sys/mount.h>
     51       1.25  christos #include <sys/exec.h>
     52        1.8      fvdl #include <sys/exec_elf.h>
     53        1.1      fvdl 
     54        1.1      fvdl #include <sys/mman.h>
     55       1.61   thorpej #include <sys/sa.h>
     56       1.13  christos #include <sys/syscallargs.h>
     57        1.1      fvdl 
     58       1.73      fvdl #include <uvm/uvm_extern.h>
     59       1.73      fvdl 
     60        1.1      fvdl #include <machine/cpu.h>
     61        1.1      fvdl #include <machine/reg.h>
     62        1.1      fvdl 
     63       1.32  christos #include <compat/linux/common/linux_types.h>
     64       1.32  christos #include <compat/linux/common/linux_signal.h>
     65       1.32  christos #include <compat/linux/common/linux_util.h>
     66       1.32  christos #include <compat/linux/common/linux_exec.h>
     67       1.32  christos #include <compat/linux/common/linux_machdep.h>
     68       1.78      manu #include <compat/linux/common/linux_futex.h>
     69       1.32  christos 
     70       1.32  christos #include <compat/linux/linux_syscallargs.h>
     71        1.4  christos #include <compat/linux/linux_syscall.h>
     72       1.38  jdolecek #include <compat/linux/common/linux_misc.h>
     73       1.38  jdolecek #include <compat/linux/common/linux_errno.h>
     74       1.39  jdolecek #include <compat/linux/common/linux_emuldata.h>
     75        1.8      fvdl 
      76       1.38  jdolecek extern struct sysent linux_sysent[];	/* defined elsewhere; installed in emul_linux below */
      77       1.38  jdolecek extern const char * const linux_syscallnames[];	/* defined elsewhere; installed in emul_linux below */
      78       1.38  jdolecek extern char linux_sigcode[], linux_esigcode[];	/* presumably start/end of the signal trampoline code -- confirm */
      79        1.1      fvdl 
      80       1.39  jdolecek static void linux_e_proc_exec __P((struct proc *, struct exec_package *));	/* exec hook stored in emul_linux */
      81       1.71  jdolecek static void linux_e_proc_fork __P((struct proc *, struct proc *, int));	/* fork hook stored in emul_linux */
      82       1.39  jdolecek static void linux_e_proc_exit __P((struct proc *));	/* exit hook stored in emul_linux */
      83       1.71  jdolecek static void linux_e_proc_init __P((struct proc *, struct proc *, int));	/* common emuldata setup used by the exec and fork hooks */
      84       1.39  jdolecek 
      85       1.79      manu #ifdef LINUX_NPTL
      86       1.79      manu static void linux_userret __P((struct lwp *, void *));	/* one-shot p_userret callback armed by the fork hook */
      87       1.79      manu #endif /* LINUX_NPTL */
     88       1.77      manu 
     89        1.1      fvdl /*
     90        1.1      fvdl  * Execve(2). Just check the alternate emulation path, and pass it on
     91        1.1      fvdl  * to the NetBSD execve().
     92        1.1      fvdl  */
     93        1.1      fvdl int
     94       1.61   thorpej linux_sys_execve(l, v, retval)
     95       1.61   thorpej 	struct lwp *l;
     96       1.11   thorpej 	void *v;
     97       1.11   thorpej 	register_t *retval;
     98       1.11   thorpej {
     99       1.12   mycroft 	struct linux_sys_execve_args /* {
    100       1.35  christos 		syscallarg(const char *) path;
    101        1.1      fvdl 		syscallarg(char **) argv;
    102        1.1      fvdl 		syscallarg(char **) envp;
    103       1.11   thorpej 	} */ *uap = v;
    104       1.61   thorpej 	struct proc *p = l->l_proc;
    105       1.16   mycroft 	struct sys_execve_args ap;
    106        1.1      fvdl 	caddr_t sg;
    107        1.1      fvdl 
    108       1.57  christos 	sg = stackgap_init(p, 0);
    109       1.83  christos 	CHECK_ALT_EXIST(l, &sg, SCARG(uap, path));
    110        1.1      fvdl 
    111       1.16   mycroft 	SCARG(&ap, path) = SCARG(uap, path);
    112       1.16   mycroft 	SCARG(&ap, argp) = SCARG(uap, argp);
    113       1.16   mycroft 	SCARG(&ap, envp) = SCARG(uap, envp);
    114       1.16   mycroft 
    115       1.61   thorpej 	return sys_execve(l, &ap, retval);
    116        1.1      fvdl }
    117       1.38  jdolecek 
     118       1.38  jdolecek /*
     119       1.38  jdolecek  * Emulation switch.
 *
 * emul_linux is a positional initializer of struct emul, whose
 * declaration is not in this file: the order of the entries must match
 * the member order of that struct exactly, so never add, drop or
 * reorder an entry without checking the declaration.
 * NOTE(review): the per-entry remarks below are inferred from the
 * initializer values, not from the member names -- confirm them
 * against struct emul.
     120       1.38  jdolecek  */
     121       1.65       chs 
     122       1.65       chs struct uvm_object *emul_linux_object;	/* referenced by address from emul_linux below */
     123       1.65       chs 
     124       1.38  jdolecek const struct emul emul_linux = {
     125       1.38  jdolecek 	"linux",	/* presumably the emulation name */
     126       1.40  jdolecek 	"/emul/linux",	/* presumably the alternate root used for path lookups -- confirm */
     127       1.44   mycroft #ifndef __HAVE_MINIMAL_EMUL
     128       1.51      manu 	0,
     129       1.76   tsutsui 	(const int *)native_to_linux_errno,
     130       1.38  jdolecek 	LINUX_SYS_syscall,
     131       1.60  jdolecek 	LINUX_SYS_NSYSENT,
     132       1.44   mycroft #endif /* !__HAVE_MINIMAL_EMUL: the four entries above are omitted otherwise */
     133       1.38  jdolecek 	linux_sysent,
     134       1.38  jdolecek 	linux_syscallnames,
     135       1.44   mycroft 	linux_sendsig,
     136       1.52  christos 	linux_trapsignal,
     137       1.70      fvdl 	NULL,
     138       1.38  jdolecek 	linux_sigcode,
     139       1.38  jdolecek 	linux_esigcode,
     140       1.65       chs 	&emul_linux_object,
     141       1.53  jdolecek 	linux_setregs,
     142       1.39  jdolecek 	linux_e_proc_exec,	/* exec hook, defined in this file */
     143       1.39  jdolecek 	linux_e_proc_fork,	/* fork hook, defined in this file */
     144       1.39  jdolecek 	linux_e_proc_exit,	/* exit hook, defined in this file */
     145       1.69      manu 	NULL,
     146       1.69      manu 	NULL,
     147       1.44   mycroft #ifdef __HAVE_SYSCALL_INTERN
     148       1.44   mycroft 	linux_syscall_intern,
     149       1.42  jdolecek #else
     150       1.62   thorpej #error Implement __HAVE_SYSCALL_INTERN for this platform
     151       1.41  jdolecek #endif /* __HAVE_SYSCALL_INTERN: the build fails on platforms lacking it */
     152       1.67    atatat 	NULL,
     153       1.59      manu 	NULL,
     154       1.73      fvdl 
     155       1.74  christos 	uvm_default_mapaddr,
     156       1.75      fvdl 
     157       1.75      fvdl 	linux_usertrap,
     158       1.38  jdolecek };
    159       1.39  jdolecek 
    160       1.39  jdolecek static void
    161       1.71  jdolecek linux_e_proc_init(p, parent, forkflags)
    162       1.71  jdolecek 	struct proc *p, *parent;
    163       1.71  jdolecek 	int forkflags;
    164       1.39  jdolecek {
    165       1.71  jdolecek 	struct linux_emuldata *e = p->p_emuldata;
    166       1.71  jdolecek 	struct linux_emuldata_shared *s;
    167       1.77      manu 	struct linux_emuldata *ep = NULL;
    168       1.71  jdolecek 
    169       1.71  jdolecek 	if (!e) {
    170       1.39  jdolecek 		/* allocate new Linux emuldata */
    171       1.71  jdolecek 		MALLOC(e, void *, sizeof(struct linux_emuldata),
    172       1.71  jdolecek 			M_EMULDATA, M_WAITOK);
    173       1.71  jdolecek 	} else  {
    174       1.72  jdolecek 		e->s->refs--;
    175       1.71  jdolecek 		if (e->s->refs == 0)
    176       1.71  jdolecek 			FREE(e->s, M_EMULDATA);
    177       1.71  jdolecek 	}
    178       1.71  jdolecek 
    179       1.71  jdolecek 	memset(e, '\0', sizeof(struct linux_emuldata));
    180       1.71  jdolecek 
    181  1.83.16.1   gdamore 	e->proc = p;
    182  1.83.16.1   gdamore 
    183       1.77      manu 	if (parent)
    184       1.77      manu 		ep = parent->p_emuldata;
    185       1.77      manu 
    186       1.72  jdolecek 	if (forkflags & FORK_SHAREVM) {
    187       1.77      manu #ifdef DIAGNOSTIC
    188       1.77      manu 		if (ep == NULL) {
    189       1.77      manu 			killproc(p, "FORK_SHAREVM while emuldata is NULL\n");
    190       1.77      manu 			return;
    191       1.77      manu 		}
    192       1.77      manu #endif
    193       1.77      manu 		s = ep->s;
    194       1.71  jdolecek 		s->refs++;
    195       1.71  jdolecek 	} else {
    196       1.71  jdolecek 		struct vmspace *vm;
    197       1.71  jdolecek 
    198       1.71  jdolecek 		MALLOC(s, void *, sizeof(struct linux_emuldata_shared),
    199       1.39  jdolecek 			M_EMULDATA, M_WAITOK);
    200       1.71  jdolecek 		s->refs = 1;
    201       1.71  jdolecek 
    202       1.71  jdolecek 		/*
    203       1.71  jdolecek 		 * Set the process idea of the break to the real value.
    204       1.71  jdolecek 		 * For fork, we use parent's vmspace since our's
    205       1.71  jdolecek 		 * is not setup at the time of this call and is going
    206       1.71  jdolecek 		 * to be copy of parent's anyway. For exec, just
    207       1.71  jdolecek 		 * use our own vmspace.
    208       1.71  jdolecek 		 */
    209       1.71  jdolecek 		vm = (parent) ? parent->p_vmspace : p->p_vmspace;
    210       1.71  jdolecek 		s->p_break = vm->vm_daddr + ctob(vm->vm_dsize);
    211       1.71  jdolecek 
    212       1.77      manu 		/*
    213       1.77      manu 		 * Linux threads are emulated as NetBSD processes (not lwp)
    214       1.77      manu 		 * We use native PID for Linux TID. The Linux TID is the
    215       1.77      manu 		 * PID of the first process in the group. It is stored
    216       1.77      manu 		 * here
    217       1.77      manu 		 */
    218       1.77      manu 		s->group_pid = p->p_pid;
    219  1.83.16.1   gdamore 
    220  1.83.16.1   gdamore 		/*
    221  1.83.16.1   gdamore 		 * Initialize the list of threads in the group
    222  1.83.16.1   gdamore 		 */
    223  1.83.16.1   gdamore 		LIST_INIT(&s->threads);
    224       1.39  jdolecek 	}
    225       1.39  jdolecek 
    226       1.71  jdolecek 	e->s = s;
    227       1.77      manu 
    228  1.83.16.1   gdamore 	/*
    229  1.83.16.1   gdamore 	 * Add this thread in the group thread list
    230  1.83.16.1   gdamore 	 */
    231  1.83.16.1   gdamore 	LIST_INSERT_HEAD(&s->threads, e, threads);
    232  1.83.16.1   gdamore 
    233       1.79      manu #ifdef LINUX_NPTL
    234       1.77      manu 	/*
    235       1.77      manu 	 * initialize TID pointers. ep->child_clear_tid and
    236       1.77      manu 	 * ep->child_set_tid will not be used beyond this point.
    237       1.77      manu 	 */
    238       1.77      manu 	e->child_clear_tid = NULL;
    239       1.77      manu 	e->child_set_tid = NULL;
    240       1.77      manu 	if (ep != NULL) {
    241       1.77      manu 		e->clear_tid = ep->child_clear_tid;
    242       1.77      manu 		e->set_tid = ep->child_set_tid;
    243       1.79      manu 		e->set_tls = ep->set_tls;
    244       1.77      manu 		ep->child_clear_tid = NULL;
    245       1.77      manu 		ep->child_set_tid = NULL;
    246       1.79      manu 		ep->set_tls = 0;
    247       1.77      manu 	} else {
    248       1.77      manu 		e->clear_tid = NULL;
    249       1.77      manu 		e->set_tid = NULL;
    250       1.79      manu 		e->set_tls = 0;
    251       1.77      manu 	}
    252       1.79      manu #endif /* LINUX_NPTL */
    253       1.77      manu 
    254       1.71  jdolecek 	p->p_emuldata = e;
    255       1.48  jdolecek }
    256       1.48  jdolecek 
    257       1.48  jdolecek /*
    258       1.71  jdolecek  * Allocate new per-process structures. Called when executing Linux
    259       1.48  jdolecek  * process. We can reuse the old emuldata - if it's not null,
    260       1.48  jdolecek  * the executed process is of same emulation as original forked one.
    261       1.48  jdolecek  */
    262       1.48  jdolecek static void
    263       1.48  jdolecek linux_e_proc_exec(p, epp)
    264       1.48  jdolecek 	struct proc *p;
    265       1.48  jdolecek 	struct exec_package *epp;
    266       1.48  jdolecek {
    267       1.48  jdolecek 	/* exec, use our vmspace */
    268       1.71  jdolecek 	linux_e_proc_init(p, NULL, 0);
    269       1.39  jdolecek }
    270       1.39  jdolecek 
    271       1.39  jdolecek /*
    272       1.39  jdolecek  * Emulation per-process exit hook.
    273       1.39  jdolecek  */
    274       1.39  jdolecek static void
    275       1.39  jdolecek linux_e_proc_exit(p)
    276       1.39  jdolecek 	struct proc *p;
    277       1.39  jdolecek {
    278       1.71  jdolecek 	struct linux_emuldata *e = p->p_emuldata;
    279       1.71  jdolecek 
    280       1.79      manu #ifdef LINUX_NPTL
    281       1.77      manu 	/* Emulate LINUX_CLONE_CHILD_CLEARTID */
    282       1.77      manu 	if (e->clear_tid != NULL) {
    283       1.77      manu 		int error;
    284       1.77      manu 		int null = 0;
    285       1.78      manu 		struct linux_sys_futex_args cup;
    286       1.78      manu 		register_t retval;
    287       1.78      manu 		struct lwp *l;
    288       1.77      manu 
    289  1.83.16.1   gdamore 		error = copyout(&null, e->clear_tid, sizeof(null));
    290  1.83.16.1   gdamore #ifdef DEBUG_LINUX
    291  1.83.16.1   gdamore 		if (error != 0)
    292       1.77      manu 			printf("linux_e_proc_exit: cannot clear TID\n");
    293  1.83.16.1   gdamore #endif
    294       1.77      manu 
    295       1.78      manu 		l = proc_representative_lwp(p);
    296       1.78      manu 		SCARG(&cup, uaddr) = e->clear_tid;
    297       1.78      manu 		SCARG(&cup, op) = LINUX_FUTEX_WAKE;
    298       1.82      manu 		SCARG(&cup, val) = 0x7fffffff; /* Awake everyone */
    299       1.78      manu 		SCARG(&cup, timeout) = NULL;
    300       1.78      manu 		SCARG(&cup, uaddr2) = NULL;
    301       1.78      manu 		SCARG(&cup, val3) = 0;
    302       1.78      manu 		if ((error = linux_sys_futex(l, &cup, &retval)) != 0)
    303       1.77      manu 			printf("linux_e_proc_exit: linux_sys_futex failed\n");
    304       1.77      manu 	}
    305       1.79      manu #endif /* LINUX_NPTL */
    306       1.77      manu 
    307  1.83.16.1   gdamore 	/* Remove the thread for the group thread list */
    308  1.83.16.1   gdamore 	LIST_REMOVE(e, threads);
    309  1.83.16.1   gdamore 
    310       1.39  jdolecek 	/* free Linux emuldata and set the pointer to null */
    311       1.71  jdolecek 	e->s->refs--;
    312       1.71  jdolecek 	if (e->s->refs == 0)
    313       1.71  jdolecek 		FREE(e->s, M_EMULDATA);
    314       1.71  jdolecek 	FREE(e, M_EMULDATA);
    315       1.39  jdolecek 	p->p_emuldata = NULL;
    316       1.39  jdolecek }
    317       1.39  jdolecek 
    318       1.39  jdolecek /*
    319       1.39  jdolecek  * Emulation fork hook.
    320       1.39  jdolecek  */
    321       1.39  jdolecek static void
    322       1.71  jdolecek linux_e_proc_fork(p, parent, forkflags)
    323       1.39  jdolecek 	struct proc *p, *parent;
    324       1.71  jdolecek 	int forkflags;
    325       1.39  jdolecek {
    326       1.80      manu #ifdef LINUX_NPTL
    327       1.77      manu 	struct linux_emuldata *e;
    328       1.80      manu #endif
    329       1.77      manu 
    330       1.39  jdolecek 	/*
    331       1.71  jdolecek 	 * The new process might share some vmspace-related stuff
    332       1.71  jdolecek 	 * with parent, depending on fork flags (CLONE_VM et.al).
    333       1.71  jdolecek 	 * Force allocation of new base emuldata, and share the
    334       1.71  jdolecek 	 * VM-related parts only if necessary.
    335       1.39  jdolecek 	 */
    336       1.39  jdolecek 	p->p_emuldata = NULL;
    337       1.71  jdolecek 	linux_e_proc_init(p, parent, forkflags);
    338       1.77      manu 
    339       1.79      manu #ifdef LINUX_NPTL
    340       1.77      manu 	/*
    341       1.79      manu 	 * Emulate LINUX_CLONE_CHILD_SETTID and LINUX_CLONE_TLS:
    342       1.79      manu 	 * This cannot be done right now because the child VM
    343       1.79      manu 	 * is not set up. We will do it at userret time.
    344       1.77      manu 	 */
    345       1.77      manu 	e = p->p_emuldata;
    346       1.79      manu 	if ((e->set_tid != NULL) || (e->set_tls != 0))
    347       1.79      manu 		p->p_userret = (*linux_userret);
    348       1.79      manu #endif
    349       1.77      manu 
    350       1.77      manu 	return;
    351       1.77      manu }
    352       1.77      manu 
#ifdef LINUX_NPTL
/*
 * One-shot p_userret callback armed by linux_e_proc_fork().
 *
 * Finishes the parts of the clone emulation that had to wait until
 * the child's address space was usable: storing the child's PID at the
 * registered set_tid address and installing the requested TLS.
 * Failures are only reported on the console.
 *
 *	l	the lwp for which the callback runs
 *	arg	unused
 */
static void
linux_userret(struct lwp *l, void *arg)
{
	struct proc *proc = l->l_proc;
	struct linux_emuldata *emul = proc->p_emuldata;

	/* Disarm first: this work must be done only once. */
	proc->p_userret = NULL;

	/* Emulate LINUX_CLONE_CHILD_SETTID */
	if (emul->set_tid != NULL &&
	    copyout(&proc->p_pid, emul->set_tid, sizeof(proc->p_pid)) != 0)
		printf("linux_userret: cannot set TID\n");

	/* Install the TLS that was requested at clone time, if any */
	if (emul->set_tls != 0 && linux_set_newtls(l, emul->set_tls) != 0)
		printf("linux_userret: cannot set TLS\n");
}
#endif /* LINUX_NPTL */
    381