Home | History | Annotate | Line # | Download | only in common
linux_exec.c revision 1.83
      1  1.83  christos /*	$NetBSD: linux_exec.c,v 1.83 2005/12/11 12:20:19 christos Exp $	*/
      2  1.29  christos 
      3  1.29  christos /*-
      4  1.44   mycroft  * Copyright (c) 1994, 1995, 1998, 2000 The NetBSD Foundation, Inc.
      5  1.29  christos  * All rights reserved.
      6  1.29  christos  *
      7  1.29  christos  * This code is derived from software contributed to The NetBSD Foundation
      8  1.33      fvdl  * by Christos Zoulas, Frank van der Linden, Eric Haszlakiewicz and
      9  1.33      fvdl  * Thor Lancelot Simon.
     10  1.29  christos  *
     11  1.29  christos  * Redistribution and use in source and binary forms, with or without
     12  1.29  christos  * modification, are permitted provided that the following conditions
     13  1.29  christos  * are met:
     14  1.29  christos  * 1. Redistributions of source code must retain the above copyright
     15  1.29  christos  *    notice, this list of conditions and the following disclaimer.
     16  1.29  christos  * 2. Redistributions in binary form must reproduce the above copyright
     17  1.29  christos  *    notice, this list of conditions and the following disclaimer in the
     18  1.29  christos  *    documentation and/or other materials provided with the distribution.
     19  1.29  christos  * 3. All advertising materials mentioning features or use of this software
     20  1.29  christos  *    must display the following acknowledgement:
     21  1.29  christos  *        This product includes software developed by the NetBSD
     22  1.29  christos  *        Foundation, Inc. and its contributors.
     23  1.29  christos  * 4. Neither the name of The NetBSD Foundation nor the names of its
     24  1.29  christos  *    contributors may be used to endorse or promote products derived
     25  1.29  christos  *    from this software without specific prior written permission.
     26  1.29  christos  *
     27  1.29  christos  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     28  1.29  christos  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     29  1.29  christos  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     30  1.29  christos  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     31  1.29  christos  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     32  1.29  christos  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     33  1.29  christos  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     34  1.29  christos  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     35  1.29  christos  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     36  1.29  christos  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     37  1.29  christos  * POSSIBILITY OF SUCH DAMAGE.
     38   1.1      fvdl  */
     39  1.54     lukem 
     40  1.54     lukem #include <sys/cdefs.h>
     41  1.83  christos __KERNEL_RCSID(0, "$NetBSD: linux_exec.c,v 1.83 2005/12/11 12:20:19 christos Exp $");
     42   1.1      fvdl 
     43   1.1      fvdl #include <sys/param.h>
     44   1.1      fvdl #include <sys/systm.h>
     45   1.1      fvdl #include <sys/kernel.h>
     46   1.1      fvdl #include <sys/proc.h>
     47   1.1      fvdl #include <sys/malloc.h>
     48   1.1      fvdl #include <sys/namei.h>
     49   1.1      fvdl #include <sys/vnode.h>
     50  1.13  christos #include <sys/mount.h>
     51  1.25  christos #include <sys/exec.h>
     52   1.8      fvdl #include <sys/exec_elf.h>
     53   1.1      fvdl 
     54   1.1      fvdl #include <sys/mman.h>
     55  1.61   thorpej #include <sys/sa.h>
     56  1.13  christos #include <sys/syscallargs.h>
     57   1.1      fvdl 
     58  1.73      fvdl #include <uvm/uvm_extern.h>
     59  1.73      fvdl 
     60   1.1      fvdl #include <machine/cpu.h>
     61   1.1      fvdl #include <machine/reg.h>
     62   1.1      fvdl 
     63  1.32  christos #include <compat/linux/common/linux_types.h>
     64  1.32  christos #include <compat/linux/common/linux_signal.h>
     65  1.32  christos #include <compat/linux/common/linux_util.h>
     66  1.32  christos #include <compat/linux/common/linux_exec.h>
     67  1.32  christos #include <compat/linux/common/linux_machdep.h>
     68  1.78      manu #include <compat/linux/common/linux_futex.h>
     69  1.32  christos 
     70  1.32  christos #include <compat/linux/linux_syscallargs.h>
     71   1.4  christos #include <compat/linux/linux_syscall.h>
     72  1.38  jdolecek #include <compat/linux/common/linux_misc.h>
     73  1.38  jdolecek #include <compat/linux/common/linux_errno.h>
     74  1.39  jdolecek #include <compat/linux/common/linux_emuldata.h>
     75   1.8      fvdl 
                        /*
                         * Linux system call table and system call name table.  Both are
                         * defined outside this file and referenced from emul_linux below.
                         */
     76  1.38  jdolecek extern struct sysent linux_sysent[];
     77  1.38  jdolecek extern const char * const linux_syscallnames[];
                        /*
                         * Also defined outside this file and referenced from emul_linux;
                         * presumably the start and end of the Linux signal trampoline
                         * code -- confirm against the machine-dependent sources.
                         */
     78  1.38  jdolecek extern char linux_sigcode[], linux_esigcode[];
     79   1.1      fvdl 
                        /*
                         * Per-process hooks.  linux_e_proc_exec, linux_e_proc_fork and
                         * linux_e_proc_exit are installed in emul_linux; linux_e_proc_init
                         * is the helper shared by the exec and fork hooks.
                         */
     80  1.39  jdolecek static void linux_e_proc_exec __P((struct proc *, struct exec_package *));
     81  1.71  jdolecek static void linux_e_proc_fork __P((struct proc *, struct proc *, int));
     82  1.39  jdolecek static void linux_e_proc_exit __P((struct proc *));
     83  1.71  jdolecek static void linux_e_proc_init __P((struct proc *, struct proc *, int));
     84  1.39  jdolecek 
                        /*
                         * Only built with LINUX_NPTL: linux_e_proc_fork installs this as
                         * p->p_userret when a TID or TLS update is pending for the child.
                         */
     85  1.79      manu #ifdef LINUX_NPTL
     86  1.79      manu static void linux_userret __P((struct lwp *, void *));
     87  1.79      manu #endif
     88  1.77      manu 
     89   1.1      fvdl /*
     90   1.1      fvdl  * Execve(2). Just check the alternate emulation path, and pass it on
     91   1.1      fvdl  * to the NetBSD execve().
                         *
                         * l is the calling lwp, v points to a struct linux_sys_execve_args
                         * and retval is handed to sys_execve() untouched.  The return value
                         * is whatever sys_execve() returns.
     92   1.1      fvdl  */
     93   1.1      fvdl int
     94  1.61   thorpej linux_sys_execve(l, v, retval)
     95  1.61   thorpej 	struct lwp *l;
     96  1.11   thorpej 	void *v;
     97  1.11   thorpej 	register_t *retval;
     98  1.11   thorpej {
     99  1.12   mycroft 	struct linux_sys_execve_args /* {
    100  1.35  christos 		syscallarg(const char *) path;
    101   1.1      fvdl 		syscallarg(char **) argp;
    102   1.1      fvdl 		syscallarg(char **) envp;
    103  1.11   thorpej 	} */ *uap = v;
    104  1.61   thorpej 	struct proc *p = l->l_proc;
                        	/* Native argument block, filled in below and passed to sys_execve(). */
    105  1.16   mycroft 	struct sys_execve_args ap;
    106   1.1      fvdl 	caddr_t sg;
    107   1.1      fvdl 
                        	/*
                        	 * CHECK_ALT_EXIST is a macro defined outside this file.  It is
                        	 * given the stackgap and the path argument; presumably it may
                        	 * replace the path with one found under the emulation root --
                        	 * confirm against its definition.
                        	 */
    108  1.57  christos 	sg = stackgap_init(p, 0);
    109  1.83  christos 	CHECK_ALT_EXIST(l, &sg, SCARG(uap, path));
    110   1.1      fvdl 
                        	/*
                        	 * Copy the arguments only after the check above, so that
                        	 * sys_execve() sees the path as CHECK_ALT_EXIST left it.
                        	 */
    111  1.16   mycroft 	SCARG(&ap, path) = SCARG(uap, path);
    112  1.16   mycroft 	SCARG(&ap, argp) = SCARG(uap, argp);
    113  1.16   mycroft 	SCARG(&ap, envp) = SCARG(uap, envp);
    114  1.16   mycroft 
    115  1.61   thorpej 	return sys_execve(l, &ap, retval);
    116   1.1      fvdl }
    117  1.38  jdolecek 
    118  1.38  jdolecek /*
    119  1.38  jdolecek  * Emulation switch.
                         *
                         * The initializer of emul_linux is positional: every entry has to
                         * line up with the corresponding member of struct emul, which is
                         * declared outside this file.  Entries therefore cannot be
                         * reordered or dropped, and the member meanings noted below are
                         * assumptions to be confirmed against that declaration.
    120  1.38  jdolecek  */
    121  1.65       chs 
                        /*
                         * Only its address is used in this file (stored in emul_linux);
                         * nothing here assigns it.
                         */
    122  1.65       chs struct uvm_object *emul_linux_object;
    123  1.65       chs 
    124  1.38  jdolecek const struct emul emul_linux = {
    125  1.38  jdolecek 	"linux",		/* presumably the emulation name */
    126  1.40  jdolecek 	"/emul/linux",		/* presumably the alternate root path */
                        	/* The next four entries are left out under __HAVE_MINIMAL_EMUL. */
    127  1.44   mycroft #ifndef __HAVE_MINIMAL_EMUL
    128  1.51      manu 	0,
    129  1.76   tsutsui 	(const int *)native_to_linux_errno,
    130  1.38  jdolecek 	LINUX_SYS_syscall,
    131  1.60  jdolecek 	LINUX_SYS_NSYSENT,
    132  1.44   mycroft #endif
    133  1.38  jdolecek 	linux_sysent,
    134  1.38  jdolecek 	linux_syscallnames,
    135  1.44   mycroft 	linux_sendsig,
    136  1.52  christos 	linux_trapsignal,
    137  1.70      fvdl 	NULL,
    138  1.38  jdolecek 	linux_sigcode,
    139  1.38  jdolecek 	linux_esigcode,
    140  1.65       chs 	&emul_linux_object,
    141  1.53  jdolecek 	linux_setregs,
                        	/* Per-process exec, fork and exit hooks defined in this file. */
    142  1.39  jdolecek 	linux_e_proc_exec,
    143  1.39  jdolecek 	linux_e_proc_fork,
    144  1.39  jdolecek 	linux_e_proc_exit,
    145  1.69      manu 	NULL,
    146  1.69      manu 	NULL,
                        	/* Platforms lacking __HAVE_SYSCALL_INTERN fail the build here. */
    147  1.44   mycroft #ifdef __HAVE_SYSCALL_INTERN
    148  1.44   mycroft 	linux_syscall_intern,
    149  1.42  jdolecek #else
    150  1.62   thorpej #error Implement __HAVE_SYSCALL_INTERN for this platform
    151  1.41  jdolecek #endif
    152  1.67    atatat 	NULL,
    153  1.59      manu 	NULL,
    154  1.73      fvdl 
    155  1.74  christos 	uvm_default_mapaddr,
    156  1.75      fvdl 
    157  1.75      fvdl 	linux_usertrap,
    158  1.38  jdolecek };
    159  1.39  jdolecek 
                        /*
                         * Set up the Linux emulation data of process p.
                         *
                         * The per-process struct linux_emuldata is allocated if p has none
                         * and reused otherwise; either way it is zeroed.  It is then given
                         * a struct linux_emuldata_shared: the parent's one when forkflags
                         * contains FORK_SHAREVM, a freshly allocated one otherwise.
                         *
                         * p:         process being initialized.
                         * parent:    parent process on fork; NULL on exec (see the callers
                         *            linux_e_proc_fork and linux_e_proc_exec).
                         * forkflags: fork flags; only FORK_SHAREVM is examined here.
                         */
    160  1.39  jdolecek static void
    161  1.71  jdolecek linux_e_proc_init(p, parent, forkflags)
    162  1.71  jdolecek 	struct proc *p, *parent;
    163  1.71  jdolecek 	int forkflags;
    164  1.39  jdolecek {
    165  1.71  jdolecek 	struct linux_emuldata *e = p->p_emuldata;
    166  1.71  jdolecek 	struct linux_emuldata_shared *s;
    167  1.77      manu 	struct linux_emuldata *ep = NULL;
    168  1.71  jdolecek 
    169  1.71  jdolecek 	if (!e) {
    170  1.39  jdolecek 		/* allocate new Linux emuldata */
    171  1.71  jdolecek 		MALLOC(e, void *, sizeof(struct linux_emuldata),
    172  1.71  jdolecek 			M_EMULDATA, M_WAITOK);
    173  1.71  jdolecek 	} else  {
                        		/*
                        		 * Reusing existing emuldata: drop its reference on the
                        		 * old shared part and free that part with the last
                        		 * reference.  A new shared part is attached below.
                        		 */
    174  1.72  jdolecek 		e->s->refs--;
    175  1.71  jdolecek 		if (e->s->refs == 0)
    176  1.71  jdolecek 			FREE(e->s, M_EMULDATA);
    177  1.71  jdolecek 	}
    178  1.71  jdolecek 
                        	/* Start from an all-zero structure in both cases. */
    179  1.71  jdolecek 	memset(e, '\0', sizeof(struct linux_emuldata));
    180  1.71  jdolecek 
    181  1.77      manu 	if (parent)
    182  1.77      manu 		ep = parent->p_emuldata;
    183  1.77      manu 
    184  1.72  jdolecek 	if (forkflags & FORK_SHAREVM) {
                        		/*
                        		 * NOTE(review): on this early return e has not been
                        		 * stored in p->p_emuldata.  If e was allocated above it
                        		 * is not freed here; if it was reused, it has already
                        		 * been zeroed, so its s pointer is gone.  Without
                        		 * DIAGNOSTIC a NULL ep is dereferenced just below.
                        		 */
    185  1.77      manu #ifdef DIAGNOSTIC
    186  1.77      manu 		if (ep == NULL) {
    187  1.77      manu 			killproc(p, "FORK_SHAREVM while emuldata is NULL\n");
    188  1.77      manu 			return;
    189  1.77      manu 		}
    190  1.77      manu #endif
                        		/* Share the parent's structure and take a reference. */
    191  1.77      manu 		s = ep->s;
    192  1.71  jdolecek 		s->refs++;
    193  1.71  jdolecek 	} else {
    194  1.71  jdolecek 		struct vmspace *vm;
    195  1.71  jdolecek 
                        		/*
                        		 * Only refs, p_break and group_pid are assigned below;
                        		 * the allocation itself is not zeroed here.
                        		 */
    196  1.71  jdolecek 		MALLOC(s, void *, sizeof(struct linux_emuldata_shared),
    197  1.39  jdolecek 			M_EMULDATA, M_WAITOK);
    198  1.71  jdolecek 		s->refs = 1;
    199  1.71  jdolecek 
    200  1.71  jdolecek 		/*
    201  1.71  jdolecek 		 * Set the process idea of the break to the real value.
    202  1.71  jdolecek 		 * For fork, we use parent's vmspace since ours
    203  1.71  jdolecek 		 * is not setup at the time of this call and is going
    204  1.71  jdolecek 		 * to be copy of parent's anyway. For exec, just
    205  1.71  jdolecek 		 * use our own vmspace.
    206  1.71  jdolecek 		 */
    207  1.71  jdolecek 		vm = (parent) ? parent->p_vmspace : p->p_vmspace;
    208  1.71  jdolecek 		s->p_break = vm->vm_daddr + ctob(vm->vm_dsize);
    209  1.71  jdolecek 
    210  1.77      manu 		/*
    211  1.77      manu 		 * Linux threads are emulated as NetBSD processes (not lwp)
    212  1.77      manu 		 * We use native PID for Linux TID. The Linux TID is the
    213  1.77      manu 		 * PID of the first process in the group. It is stored
    214  1.77      manu 		 * here
    215  1.77      manu 		 */
    216  1.77      manu 		s->group_pid = p->p_pid;
    217  1.39  jdolecek 	}
    218  1.39  jdolecek 
    219  1.71  jdolecek 	e->s = s;
    220  1.77      manu 
    221  1.79      manu #ifdef LINUX_NPTL
    222  1.77      manu 	/*
    223  1.77      manu 	 * initialize TID pointers. ep->child_clear_tid and
    224  1.77      manu 	 * ep->child_set_tid will not be used beyond this point.
                        	 *
                        	 * With a parent, the values the parent recorded for its child
                        	 * (child_clear_tid, child_set_tid, set_tls) are moved into the
                        	 * new emuldata and reset in the parent.  Without one, the
                        	 * fields are simply cleared.
    225  1.77      manu 	 */
    226  1.77      manu 	e->child_clear_tid = NULL;
    227  1.77      manu 	e->child_set_tid = NULL;
    228  1.77      manu 	if (ep != NULL) {
    229  1.77      manu 		e->clear_tid = ep->child_clear_tid;
    230  1.77      manu 		e->set_tid = ep->child_set_tid;
    231  1.79      manu 		e->set_tls = ep->set_tls;
    232  1.77      manu 		ep->child_clear_tid = NULL;
    233  1.77      manu 		ep->child_set_tid = NULL;
    234  1.79      manu 		ep->set_tls = 0;
    235  1.77      manu 	} else {
    236  1.77      manu 		e->clear_tid = NULL;
    237  1.77      manu 		e->set_tid = NULL;
    238  1.79      manu 		e->set_tls = 0;
    239  1.77      manu 	}
    240  1.79      manu #endif /* LINUX_NPTL */
    241  1.77      manu 
    242  1.71  jdolecek 	p->p_emuldata = e;
    243  1.48  jdolecek }
    244  1.48  jdolecek 
    245  1.48  jdolecek /*
    246  1.71  jdolecek  * Allocate new per-process structures. Called when executing Linux
    247  1.48  jdolecek  * process. We can reuse the old emuldata - if it's not null,
    248  1.48  jdolecek  * the executed process is of same emulation as original forked one.
                         *
                         * p is the process doing the exec.  epp is not used.  All the work
                         * is done by linux_e_proc_init(), called with no parent and no
                         * fork flags.
    249  1.48  jdolecek  */
    250  1.48  jdolecek static void
    251  1.48  jdolecek linux_e_proc_exec(p, epp)
    252  1.48  jdolecek 	struct proc *p;
    253  1.48  jdolecek 	struct exec_package *epp;
    254  1.48  jdolecek {
    255  1.48  jdolecek 	/* exec, use our vmspace */
    256  1.71  jdolecek 	linux_e_proc_init(p, NULL, 0);
    257  1.39  jdolecek }
    258  1.39  jdolecek 
    259  1.39  jdolecek /*
    260  1.39  jdolecek  * Emulation per-process exit hook.
                         *
                         * With LINUX_NPTL, a recorded clear_tid address is zeroed in user
                         * space and a futex wake is issued on it.  Afterwards the reference
                         * on the shared emuldata is dropped and the per-process emuldata is
                         * freed.  p->p_emuldata is dereferenced without a NULL check.
    261  1.39  jdolecek  */
    262  1.39  jdolecek static void
    263  1.39  jdolecek linux_e_proc_exit(p)
    264  1.39  jdolecek 	struct proc *p;
    265  1.39  jdolecek {
    266  1.71  jdolecek 	struct linux_emuldata *e = p->p_emuldata;
    267  1.71  jdolecek 
    268  1.79      manu #ifdef LINUX_NPTL
    269  1.77      manu 	/* Emulate LINUX_CLONE_CHILD_CLEARTID */
    270  1.77      manu 	if (e->clear_tid != NULL) {
    271  1.77      manu 		int error;
    272  1.77      manu 		int null = 0;
    273  1.78      manu 		struct linux_sys_futex_args cup;
    274  1.78      manu 		register_t retval;
    275  1.78      manu 		struct lwp *l;
    276  1.77      manu 
                        		/*
                        		 * Store 0 at the registered address.  A failure is
                        		 * only logged; the wakeup below is attempted anyway.
                        		 */
    277  1.77      manu 		if ((error = copyout(&null,
    278  1.77      manu 		    e->clear_tid,
    279  1.77      manu 		    sizeof(null))) != 0)
    280  1.77      manu 			printf("linux_e_proc_exit: cannot clear TID\n");
    281  1.77      manu 
                        		/*
                        		 * Build the futex arguments by hand and call
                        		 * linux_sys_futex() directly on behalf of an lwp of p.
                        		 * Its result is only logged as well.
                        		 */
    282  1.78      manu 		l = proc_representative_lwp(p);
    283  1.78      manu 		SCARG(&cup, uaddr) = e->clear_tid;
    284  1.78      manu 		SCARG(&cup, op) = LINUX_FUTEX_WAKE;
    285  1.82      manu 		SCARG(&cup, val) = 0x7fffffff; /* Awake everyone */
    286  1.78      manu 		SCARG(&cup, timeout) = NULL;
    287  1.78      manu 		SCARG(&cup, uaddr2) = NULL;
    288  1.78      manu 		SCARG(&cup, val3) = 0;
    289  1.78      manu 		if ((error = linux_sys_futex(l, &cup, &retval)) != 0)
    290  1.77      manu 			printf("linux_e_proc_exit: linux_sys_futex failed\n");
    291  1.77      manu 	}
    292  1.79      manu #endif /* LINUX_NPTL */
    293  1.77      manu 
    294  1.39  jdolecek 	/* free Linux emuldata and set the pointer to null */
                        	/* The shared part is freed only when its last reference goes. */
    295  1.71  jdolecek 	e->s->refs--;
    296  1.71  jdolecek 	if (e->s->refs == 0)
    297  1.71  jdolecek 		FREE(e->s, M_EMULDATA);
    298  1.71  jdolecek 	FREE(e, M_EMULDATA);
    299  1.39  jdolecek 	p->p_emuldata = NULL;
    300  1.39  jdolecek }
    301  1.39  jdolecek 
    302  1.39  jdolecek /*
    303  1.39  jdolecek  * Emulation fork hook.
                         *
                         * p is the new process, parent the process it was forked from and
                         * forkflags the fork flags, passed on to linux_e_proc_init().
    304  1.39  jdolecek  */
    305  1.39  jdolecek static void
    306  1.71  jdolecek linux_e_proc_fork(p, parent, forkflags)
    307  1.39  jdolecek 	struct proc *p, *parent;
    308  1.71  jdolecek 	int forkflags;
    309  1.39  jdolecek {
    310  1.80      manu #ifdef LINUX_NPTL
    311  1.77      manu 	struct linux_emuldata *e;
    312  1.80      manu #endif
    313  1.77      manu 
    314  1.39  jdolecek 	/*
    315  1.71  jdolecek 	 * The new process might share some vmspace-related stuff
    316  1.71  jdolecek 	 * with parent, depending on fork flags (CLONE_VM et.al).
    317  1.71  jdolecek 	 * Force allocation of new base emuldata, and share the
    318  1.71  jdolecek 	 * VM-related parts only if necessary.
                        	 *
                        	 * Clearing p_emuldata first is what makes linux_e_proc_init()
                        	 * take its allocation path instead of reusing a structure.
    319  1.39  jdolecek 	 */
    320  1.39  jdolecek 	p->p_emuldata = NULL;
    321  1.71  jdolecek 	linux_e_proc_init(p, parent, forkflags);
    322  1.77      manu 
    323  1.79      manu #ifdef LINUX_NPTL
    324  1.77      manu 	/*
    325  1.79      manu 	 * Emulate LINUX_CLONE_CHILD_SETTID and LINUX_CLONE_TLS:
    326  1.79      manu 	 * This cannot be done right now because the child VM
    327  1.79      manu 	 * is not set up. We will do it at userret time.
                        	 *
                        	 * NOTE(review): p->p_emuldata is dereferenced unconditionally
                        	 * here, but linux_e_proc_init() can return early under
                        	 * DIAGNOSTIC without setting it.
    328  1.77      manu 	 */
    329  1.77      manu 	e = p->p_emuldata;
    330  1.79      manu 	if ((e->set_tid != NULL) || (e->set_tls != 0))
    331  1.79      manu 		p->p_userret = (*linux_userret);
    332  1.79      manu #endif
    333  1.77      manu 
    334  1.77      manu 	return;
    335  1.77      manu }
    336  1.77      manu 
    337  1.79      manu #ifdef LINUX_NPTL
                        /*
                         * Deferred part of the fork hook, installed as p->p_userret by
                         * linux_e_proc_fork().  It writes the process ID to the recorded
                         * set_tid address and applies the recorded TLS value.  Failures
                         * are only logged.
                         *
                         * l is the lwp the hook runs for; arg is not used.
                         */
    338  1.77      manu static void
    339  1.79      manu linux_userret(l, arg)
    340  1.77      manu 	struct lwp *l;
    341  1.77      manu 	void *arg;
    342  1.77      manu {
    343  1.77      manu 	struct proc *p = l->l_proc;
    344  1.77      manu 	struct linux_emuldata *led = p->p_emuldata;
    345  1.77      manu 	int error;
    346  1.77      manu 
                        	/* Remove the hook first; presumably so that it runs only once. */
    347  1.77      manu 	p->p_userret = NULL;
    348  1.77      manu 
    349  1.77      manu 	/* Emulate LINUX_CLONE_CHILD_SETTID  */
    350  1.77      manu 	if (led->set_tid != NULL) {
    351  1.77      manu 		if ((error = copyout(&p->p_pid,
    352  1.77      manu 		    led->set_tid, sizeof(p->p_pid))) != 0)
    353  1.79      manu 			printf("linux_userret: cannot set TID\n");
    354  1.79      manu 	}
    355  1.79      manu 
                        	/*
                        	 * NOTE(review): the comment in linux_e_proc_fork() calls this
                        	 * flag LINUX_CLONE_TLS; confirm the actual constant name.
                        	 */
    356  1.79      manu 	/* Emulate LINUX_CLONE_NEWTLS */
    357  1.79      manu 	if (led->set_tls != 0) {
    358  1.79      manu 		if (linux_set_newtls(l, led->set_tls) != 0)
    359  1.79      manu 			printf("linux_userret: cannot set TLS\n");
    360  1.77      manu 	}
    361  1.77      manu 
    362  1.77      manu 	return;
    363  1.39  jdolecek }
    364  1.79      manu #endif /* LINUX_NPTL */
    365