Home | History | Annotate | Line # | Download | only in common
linux_exec.c revision 1.83.8.1
      1  1.83.8.1      yamt /*	$NetBSD: linux_exec.c,v 1.83.8.1 2006/06/26 12:46:18 yamt Exp $	*/
      2      1.29  christos 
      3      1.29  christos /*-
      4      1.44   mycroft  * Copyright (c) 1994, 1995, 1998, 2000 The NetBSD Foundation, Inc.
      5      1.29  christos  * All rights reserved.
      6      1.29  christos  *
      7      1.29  christos  * This code is derived from software contributed to The NetBSD Foundation
      8      1.33      fvdl  * by Christos Zoulas, Frank van der Linden, Eric Haszlakiewicz and
      9      1.33      fvdl  * Thor Lancelot Simon.
     10      1.29  christos  *
     11      1.29  christos  * Redistribution and use in source and binary forms, with or without
     12      1.29  christos  * modification, are permitted provided that the following conditions
     13      1.29  christos  * are met:
     14      1.29  christos  * 1. Redistributions of source code must retain the above copyright
     15      1.29  christos  *    notice, this list of conditions and the following disclaimer.
     16      1.29  christos  * 2. Redistributions in binary form must reproduce the above copyright
     17      1.29  christos  *    notice, this list of conditions and the following disclaimer in the
     18      1.29  christos  *    documentation and/or other materials provided with the distribution.
     19      1.29  christos  * 3. All advertising materials mentioning features or use of this software
     20      1.29  christos  *    must display the following acknowledgement:
     21      1.29  christos  *        This product includes software developed by the NetBSD
     22      1.29  christos  *        Foundation, Inc. and its contributors.
     23      1.29  christos  * 4. Neither the name of The NetBSD Foundation nor the names of its
     24      1.29  christos  *    contributors may be used to endorse or promote products derived
     25      1.29  christos  *    from this software without specific prior written permission.
     26      1.29  christos  *
     27      1.29  christos  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     28      1.29  christos  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     29      1.29  christos  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     30      1.29  christos  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     31      1.29  christos  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     32      1.29  christos  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     33      1.29  christos  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     34      1.29  christos  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     35      1.29  christos  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     36      1.29  christos  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     37      1.29  christos  * POSSIBILITY OF SUCH DAMAGE.
     38       1.1      fvdl  */
     39      1.54     lukem 
     40      1.54     lukem #include <sys/cdefs.h>
     41  1.83.8.1      yamt __KERNEL_RCSID(0, "$NetBSD: linux_exec.c,v 1.83.8.1 2006/06/26 12:46:18 yamt Exp $");
     42       1.1      fvdl 
     43       1.1      fvdl #include <sys/param.h>
     44       1.1      fvdl #include <sys/systm.h>
     45       1.1      fvdl #include <sys/kernel.h>
     46       1.1      fvdl #include <sys/proc.h>
     47       1.1      fvdl #include <sys/malloc.h>
     48       1.1      fvdl #include <sys/namei.h>
     49       1.1      fvdl #include <sys/vnode.h>
     50      1.13  christos #include <sys/mount.h>
     51      1.25  christos #include <sys/exec.h>
     52       1.8      fvdl #include <sys/exec_elf.h>
     53       1.1      fvdl 
     54       1.1      fvdl #include <sys/mman.h>
     55      1.61   thorpej #include <sys/sa.h>
     56      1.13  christos #include <sys/syscallargs.h>
     57       1.1      fvdl 
     58      1.73      fvdl #include <uvm/uvm_extern.h>
     59      1.73      fvdl 
     60       1.1      fvdl #include <machine/cpu.h>
     61       1.1      fvdl #include <machine/reg.h>
     62       1.1      fvdl 
     63      1.32  christos #include <compat/linux/common/linux_types.h>
     64      1.32  christos #include <compat/linux/common/linux_signal.h>
     65      1.32  christos #include <compat/linux/common/linux_util.h>
     66      1.32  christos #include <compat/linux/common/linux_exec.h>
     67      1.32  christos #include <compat/linux/common/linux_machdep.h>
     68      1.78      manu #include <compat/linux/common/linux_futex.h>
     69      1.32  christos 
     70      1.32  christos #include <compat/linux/linux_syscallargs.h>
     71       1.4  christos #include <compat/linux/linux_syscall.h>
     72      1.38  jdolecek #include <compat/linux/common/linux_misc.h>
     73      1.38  jdolecek #include <compat/linux/common/linux_errno.h>
     74      1.39  jdolecek #include <compat/linux/common/linux_emuldata.h>
     75       1.8      fvdl 
     76      1.38  jdolecek extern struct sysent linux_sysent[];
     77      1.38  jdolecek extern const char * const linux_syscallnames[];
     78      1.38  jdolecek extern char linux_sigcode[], linux_esigcode[];
     79       1.1      fvdl 
     80      1.39  jdolecek static void linux_e_proc_exec __P((struct proc *, struct exec_package *));
     81      1.71  jdolecek static void linux_e_proc_fork __P((struct proc *, struct proc *, int));
     82      1.39  jdolecek static void linux_e_proc_exit __P((struct proc *));
     83      1.71  jdolecek static void linux_e_proc_init __P((struct proc *, struct proc *, int));
     84      1.39  jdolecek 
     85      1.79      manu #ifdef LINUX_NPTL
     86      1.79      manu static void linux_userret __P((struct lwp *, void *));
     87      1.79      manu #endif
     88      1.77      manu 
     89       1.1      fvdl /*
     90       1.1      fvdl  * Execve(2). Just check the alternate emulation path, and pass it on
     91       1.1      fvdl  * to the NetBSD execve().
     92       1.1      fvdl  */
     93       1.1      fvdl int
     94      1.61   thorpej linux_sys_execve(l, v, retval)
     95      1.61   thorpej 	struct lwp *l;
     96      1.11   thorpej 	void *v;
     97      1.11   thorpej 	register_t *retval;
     98      1.11   thorpej {
     99      1.12   mycroft 	struct linux_sys_execve_args /* {
    100      1.35  christos 		syscallarg(const char *) path;
    101       1.1      fvdl 		syscallarg(char **) argv;
    102       1.1      fvdl 		syscallarg(char **) envp;
    103      1.11   thorpej 	} */ *uap = v;
    104      1.61   thorpej 	struct proc *p = l->l_proc;
    105      1.16   mycroft 	struct sys_execve_args ap;
    106       1.1      fvdl 	caddr_t sg;
    107       1.1      fvdl 
    108      1.57  christos 	sg = stackgap_init(p, 0);
    109      1.83  christos 	CHECK_ALT_EXIST(l, &sg, SCARG(uap, path));
    110       1.1      fvdl 
    111      1.16   mycroft 	SCARG(&ap, path) = SCARG(uap, path);
    112      1.16   mycroft 	SCARG(&ap, argp) = SCARG(uap, argp);
    113      1.16   mycroft 	SCARG(&ap, envp) = SCARG(uap, envp);
    114      1.16   mycroft 
    115      1.61   thorpej 	return sys_execve(l, &ap, retval);
    116       1.1      fvdl }
    117      1.38  jdolecek 
    118      1.38  jdolecek /*
    119      1.38  jdolecek  * Emulation switch.
    120      1.38  jdolecek  */
    121      1.65       chs 
    122      1.65       chs struct uvm_object *emul_linux_object;
    123      1.65       chs 
    124      1.38  jdolecek const struct emul emul_linux = {
    125      1.38  jdolecek 	"linux",
    126      1.40  jdolecek 	"/emul/linux",
    127      1.44   mycroft #ifndef __HAVE_MINIMAL_EMUL
    128      1.51      manu 	0,
    129      1.76   tsutsui 	(const int *)native_to_linux_errno,
    130      1.38  jdolecek 	LINUX_SYS_syscall,
    131      1.60  jdolecek 	LINUX_SYS_NSYSENT,
    132      1.44   mycroft #endif
    133      1.38  jdolecek 	linux_sysent,
    134      1.38  jdolecek 	linux_syscallnames,
    135      1.44   mycroft 	linux_sendsig,
    136      1.52  christos 	linux_trapsignal,
    137      1.70      fvdl 	NULL,
    138      1.38  jdolecek 	linux_sigcode,
    139      1.38  jdolecek 	linux_esigcode,
    140      1.65       chs 	&emul_linux_object,
    141      1.53  jdolecek 	linux_setregs,
    142      1.39  jdolecek 	linux_e_proc_exec,
    143      1.39  jdolecek 	linux_e_proc_fork,
    144      1.39  jdolecek 	linux_e_proc_exit,
    145      1.69      manu 	NULL,
    146      1.69      manu 	NULL,
    147      1.44   mycroft #ifdef __HAVE_SYSCALL_INTERN
    148      1.44   mycroft 	linux_syscall_intern,
    149      1.42  jdolecek #else
    150      1.62   thorpej #error Implement __HAVE_SYSCALL_INTERN for this platform
    151      1.41  jdolecek #endif
    152      1.67    atatat 	NULL,
    153      1.59      manu 	NULL,
    154      1.73      fvdl 
    155      1.74  christos 	uvm_default_mapaddr,
    156      1.75      fvdl 
    157      1.75      fvdl 	linux_usertrap,
    158      1.38  jdolecek };
    159      1.39  jdolecek 
    160      1.39  jdolecek static void
    161      1.71  jdolecek linux_e_proc_init(p, parent, forkflags)
    162      1.71  jdolecek 	struct proc *p, *parent;
    163      1.71  jdolecek 	int forkflags;
    164      1.39  jdolecek {
    165      1.71  jdolecek 	struct linux_emuldata *e = p->p_emuldata;
    166      1.71  jdolecek 	struct linux_emuldata_shared *s;
    167      1.77      manu 	struct linux_emuldata *ep = NULL;
    168      1.71  jdolecek 
    169      1.71  jdolecek 	if (!e) {
    170      1.39  jdolecek 		/* allocate new Linux emuldata */
    171      1.71  jdolecek 		MALLOC(e, void *, sizeof(struct linux_emuldata),
    172      1.71  jdolecek 			M_EMULDATA, M_WAITOK);
    173      1.71  jdolecek 	} else  {
    174      1.72  jdolecek 		e->s->refs--;
    175      1.71  jdolecek 		if (e->s->refs == 0)
    176      1.71  jdolecek 			FREE(e->s, M_EMULDATA);
    177      1.71  jdolecek 	}
    178      1.71  jdolecek 
    179      1.71  jdolecek 	memset(e, '\0', sizeof(struct linux_emuldata));
    180      1.71  jdolecek 
    181  1.83.8.1      yamt 	e->proc = p;
    182  1.83.8.1      yamt 
    183      1.77      manu 	if (parent)
    184      1.77      manu 		ep = parent->p_emuldata;
    185      1.77      manu 
    186      1.72  jdolecek 	if (forkflags & FORK_SHAREVM) {
    187      1.77      manu #ifdef DIAGNOSTIC
    188      1.77      manu 		if (ep == NULL) {
    189      1.77      manu 			killproc(p, "FORK_SHAREVM while emuldata is NULL\n");
    190      1.77      manu 			return;
    191      1.77      manu 		}
    192      1.77      manu #endif
    193      1.77      manu 		s = ep->s;
    194      1.71  jdolecek 		s->refs++;
    195      1.71  jdolecek 	} else {
    196      1.71  jdolecek 		struct vmspace *vm;
    197      1.71  jdolecek 
    198      1.71  jdolecek 		MALLOC(s, void *, sizeof(struct linux_emuldata_shared),
    199      1.39  jdolecek 			M_EMULDATA, M_WAITOK);
    200      1.71  jdolecek 		s->refs = 1;
    201      1.71  jdolecek 
    202      1.71  jdolecek 		/*
    203      1.71  jdolecek 		 * Set the process idea of the break to the real value.
    204      1.71  jdolecek 		 * For fork, we use parent's vmspace since our's
    205      1.71  jdolecek 		 * is not setup at the time of this call and is going
    206      1.71  jdolecek 		 * to be copy of parent's anyway. For exec, just
    207      1.71  jdolecek 		 * use our own vmspace.
    208      1.71  jdolecek 		 */
    209      1.71  jdolecek 		vm = (parent) ? parent->p_vmspace : p->p_vmspace;
    210      1.71  jdolecek 		s->p_break = vm->vm_daddr + ctob(vm->vm_dsize);
    211      1.71  jdolecek 
    212      1.77      manu 		/*
    213      1.77      manu 		 * Linux threads are emulated as NetBSD processes (not lwp)
    214      1.77      manu 		 * We use native PID for Linux TID. The Linux TID is the
    215      1.77      manu 		 * PID of the first process in the group. It is stored
    216      1.77      manu 		 * here
    217      1.77      manu 		 */
    218      1.77      manu 		s->group_pid = p->p_pid;
    219  1.83.8.1      yamt 
    220  1.83.8.1      yamt 		/*
    221  1.83.8.1      yamt 		 * Initialize the list of threads in the group
    222  1.83.8.1      yamt 		 */
    223  1.83.8.1      yamt 		LIST_INIT(&s->threads);
    224      1.39  jdolecek 	}
    225      1.39  jdolecek 
    226      1.71  jdolecek 	e->s = s;
    227      1.77      manu 
    228  1.83.8.1      yamt 	/*
    229  1.83.8.1      yamt 	 * Add this thread in the group thread list
    230  1.83.8.1      yamt 	 */
    231  1.83.8.1      yamt 	LIST_INSERT_HEAD(&s->threads, e, threads);
    232  1.83.8.1      yamt 
    233      1.79      manu #ifdef LINUX_NPTL
    234      1.77      manu 	/*
    235      1.77      manu 	 * initialize TID pointers. ep->child_clear_tid and
    236      1.77      manu 	 * ep->child_set_tid will not be used beyond this point.
    237      1.77      manu 	 */
    238      1.77      manu 	e->child_clear_tid = NULL;
    239      1.77      manu 	e->child_set_tid = NULL;
    240      1.77      manu 	if (ep != NULL) {
    241      1.77      manu 		e->clear_tid = ep->child_clear_tid;
    242      1.77      manu 		e->set_tid = ep->child_set_tid;
    243      1.79      manu 		e->set_tls = ep->set_tls;
    244      1.77      manu 		ep->child_clear_tid = NULL;
    245      1.77      manu 		ep->child_set_tid = NULL;
    246      1.79      manu 		ep->set_tls = 0;
    247      1.77      manu 	} else {
    248      1.77      manu 		e->clear_tid = NULL;
    249      1.77      manu 		e->set_tid = NULL;
    250      1.79      manu 		e->set_tls = 0;
    251      1.77      manu 	}
    252      1.79      manu #endif /* LINUX_NPTL */
    253      1.77      manu 
    254      1.71  jdolecek 	p->p_emuldata = e;
    255      1.48  jdolecek }
    256      1.48  jdolecek 
    257      1.48  jdolecek /*
    258      1.71  jdolecek  * Allocate new per-process structures. Called when executing Linux
    259      1.48  jdolecek  * process. We can reuse the old emuldata - if it's not null,
    260      1.48  jdolecek  * the executed process is of same emulation as original forked one.
    261      1.48  jdolecek  */
    262      1.48  jdolecek static void
    263      1.48  jdolecek linux_e_proc_exec(p, epp)
    264      1.48  jdolecek 	struct proc *p;
    265      1.48  jdolecek 	struct exec_package *epp;
    266      1.48  jdolecek {
    267      1.48  jdolecek 	/* exec, use our vmspace */
    268      1.71  jdolecek 	linux_e_proc_init(p, NULL, 0);
    269      1.39  jdolecek }
    270      1.39  jdolecek 
    271      1.39  jdolecek /*
    272      1.39  jdolecek  * Emulation per-process exit hook.
    273      1.39  jdolecek  */
    274      1.39  jdolecek static void
    275      1.39  jdolecek linux_e_proc_exit(p)
    276      1.39  jdolecek 	struct proc *p;
    277      1.39  jdolecek {
    278      1.71  jdolecek 	struct linux_emuldata *e = p->p_emuldata;
    279      1.71  jdolecek 
    280      1.79      manu #ifdef LINUX_NPTL
    281      1.77      manu 	/* Emulate LINUX_CLONE_CHILD_CLEARTID */
    282      1.77      manu 	if (e->clear_tid != NULL) {
    283      1.77      manu 		int error;
    284      1.77      manu 		int null = 0;
    285      1.78      manu 		struct linux_sys_futex_args cup;
    286      1.78      manu 		register_t retval;
    287      1.78      manu 		struct lwp *l;
    288      1.77      manu 
    289  1.83.8.1      yamt 		error = copyout(&null, e->clear_tid, sizeof(null));
    290  1.83.8.1      yamt #ifdef DEBUG_LINUX
    291  1.83.8.1      yamt 		if (error != 0)
    292      1.77      manu 			printf("linux_e_proc_exit: cannot clear TID\n");
    293  1.83.8.1      yamt #endif
    294      1.77      manu 
    295      1.78      manu 		l = proc_representative_lwp(p);
    296      1.78      manu 		SCARG(&cup, uaddr) = e->clear_tid;
    297      1.78      manu 		SCARG(&cup, op) = LINUX_FUTEX_WAKE;
    298      1.82      manu 		SCARG(&cup, val) = 0x7fffffff; /* Awake everyone */
    299      1.78      manu 		SCARG(&cup, timeout) = NULL;
    300      1.78      manu 		SCARG(&cup, uaddr2) = NULL;
    301      1.78      manu 		SCARG(&cup, val3) = 0;
    302      1.78      manu 		if ((error = linux_sys_futex(l, &cup, &retval)) != 0)
    303      1.77      manu 			printf("linux_e_proc_exit: linux_sys_futex failed\n");
    304      1.77      manu 	}
    305      1.79      manu #endif /* LINUX_NPTL */
    306      1.77      manu 
    307  1.83.8.1      yamt 	/* Remove the thread for the group thread list */
    308  1.83.8.1      yamt 	LIST_REMOVE(e, threads);
    309  1.83.8.1      yamt 
    310      1.39  jdolecek 	/* free Linux emuldata and set the pointer to null */
    311      1.71  jdolecek 	e->s->refs--;
    312      1.71  jdolecek 	if (e->s->refs == 0)
    313      1.71  jdolecek 		FREE(e->s, M_EMULDATA);
    314      1.71  jdolecek 	FREE(e, M_EMULDATA);
    315      1.39  jdolecek 	p->p_emuldata = NULL;
    316      1.39  jdolecek }
    317      1.39  jdolecek 
    318      1.39  jdolecek /*
    319      1.39  jdolecek  * Emulation fork hook.
    320      1.39  jdolecek  */
    321      1.39  jdolecek static void
    322      1.71  jdolecek linux_e_proc_fork(p, parent, forkflags)
    323      1.39  jdolecek 	struct proc *p, *parent;
    324      1.71  jdolecek 	int forkflags;
    325      1.39  jdolecek {
    326      1.80      manu #ifdef LINUX_NPTL
    327      1.77      manu 	struct linux_emuldata *e;
    328      1.80      manu #endif
    329      1.77      manu 
    330      1.39  jdolecek 	/*
    331      1.71  jdolecek 	 * The new process might share some vmspace-related stuff
    332      1.71  jdolecek 	 * with parent, depending on fork flags (CLONE_VM et.al).
    333      1.71  jdolecek 	 * Force allocation of new base emuldata, and share the
    334      1.71  jdolecek 	 * VM-related parts only if necessary.
    335      1.39  jdolecek 	 */
    336      1.39  jdolecek 	p->p_emuldata = NULL;
    337      1.71  jdolecek 	linux_e_proc_init(p, parent, forkflags);
    338      1.77      manu 
    339      1.79      manu #ifdef LINUX_NPTL
    340      1.77      manu 	/*
    341      1.79      manu 	 * Emulate LINUX_CLONE_CHILD_SETTID and LINUX_CLONE_TLS:
    342      1.79      manu 	 * This cannot be done right now because the child VM
    343      1.79      manu 	 * is not set up. We will do it at userret time.
    344      1.77      manu 	 */
    345      1.77      manu 	e = p->p_emuldata;
    346      1.79      manu 	if ((e->set_tid != NULL) || (e->set_tls != 0))
    347      1.79      manu 		p->p_userret = (*linux_userret);
    348      1.79      manu #endif
    349      1.77      manu 
    350      1.77      manu 	return;
    351      1.77      manu }
    352      1.77      manu 
    353      1.79      manu #ifdef LINUX_NPTL
    354      1.77      manu static void
    355      1.79      manu linux_userret(l, arg)
    356      1.77      manu 	struct lwp *l;
    357      1.77      manu 	void *arg;
    358      1.77      manu {
    359      1.77      manu 	struct proc *p = l->l_proc;
    360      1.77      manu 	struct linux_emuldata *led = p->p_emuldata;
    361      1.77      manu 	int error;
    362      1.77      manu 
    363      1.77      manu 	p->p_userret = NULL;
    364      1.77      manu 
    365      1.77      manu 	/* Emulate LINUX_CLONE_CHILD_SETTID  */
    366      1.77      manu 	if (led->set_tid != NULL) {
    367      1.77      manu 		if ((error = copyout(&p->p_pid,
    368      1.77      manu 		    led->set_tid, sizeof(p->p_pid))) != 0)
    369      1.79      manu 			printf("linux_userret: cannot set TID\n");
    370      1.79      manu 	}
    371      1.79      manu 
    372      1.79      manu 	/* Emulate LINUX_CLONE_NEWTLS */
    373      1.79      manu 	if (led->set_tls != 0) {
    374      1.79      manu 		if (linux_set_newtls(l, led->set_tls) != 0)
    375      1.79      manu 			printf("linux_userret: cannot set TLS\n");
    376      1.77      manu 	}
    377      1.77      manu 
    378      1.77      manu 	return;
    379      1.39  jdolecek }
    380      1.79      manu #endif /* LINUX_NPTL */
    381