Home | History | Annotate | Line # | Download | only in amd64
linux_exec_machdep.c revision 1.10.26.1
      1  1.10.26.1      haad /*	$NetBSD: linux_exec_machdep.c,v 1.10.26.1 2008/12/13 01:13:53 haad Exp $ */
      2        1.1      manu 
      3        1.1      manu /*-
      4        1.1      manu  * Copyright (c) 2005 Emmanuel Dreyfus, all rights reserved
      5        1.1      manu  *
      6        1.1      manu  * Redistribution and use in source and binary forms, with or without
      7        1.1      manu  * modification, are permitted provided that the following conditions
      8        1.1      manu  * are met:
      9        1.1      manu  * 1. Redistributions of source code must retain the above copyright
     10        1.1      manu  *    notice, this list of conditions and the following disclaimer.
     11        1.1      manu  * 2. Redistributions in binary form must reproduce the above copyright
     12        1.1      manu  *    notice, this list of conditions and the following disclaimer in the
     13        1.1      manu  *    documentation and/or other materials provided with the distribution.
     14        1.1      manu  * 3. All advertising materials mentioning features or use of this software
     15        1.1      manu  *    must display the following acknowledgement:
     16        1.1      manu  *	This product includes software developed by Emmanuel Dreyfus
     17        1.1      manu  * 4. The name of the author may not be used to endorse or promote
     18        1.1      manu  *    products derived from this software without specific prior written
     19        1.1      manu  *    permission.
     20        1.1      manu  *
     21        1.1      manu  * THIS SOFTWARE IS PROVIDED BY THE THE AUTHOR AND CONTRIBUTORS ``AS IS''
     22        1.1      manu  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
     23        1.1      manu  * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     24        1.1      manu  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS
     25        1.1      manu  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     26        1.1      manu  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     27        1.1      manu  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     28        1.1      manu  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     29        1.1      manu  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     30        1.1      manu  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     31        1.1      manu  * POSSIBILITY OF SUCH DAMAGE.
     32        1.1      manu  */
     33        1.1      manu 
     34        1.1      manu #include <sys/cdefs.h>
     35  1.10.26.1      haad __KERNEL_RCSID(0, "$NetBSD: linux_exec_machdep.c,v 1.10.26.1 2008/12/13 01:13:53 haad Exp $");
     36        1.1      manu 
     37        1.1      manu #ifdef __amd64__
     38        1.1      manu #define ELFSIZE 64
     39        1.1      manu #endif
     40        1.1      manu 
     41        1.1      manu #include <sys/param.h>
     42        1.1      manu #include <sys/systm.h>
     43        1.1      manu #include <sys/kernel.h>
     44        1.1      manu #include <sys/resource.h>
     45        1.1      manu #include <sys/proc.h>
     46        1.1      manu #include <sys/conf.h>
     47        1.1      manu #include <sys/malloc.h>
     48        1.1      manu #include <sys/exec_elf.h>
     49        1.1      manu #include <sys/vnode.h>
     50        1.1      manu #include <sys/lwp.h>
     51        1.1      manu #include <sys/exec.h>
     52        1.1      manu #include <sys/stat.h>
     53        1.7      yamt #include <sys/kauth.h>
     54        1.1      manu 
     55       1.10        ad #include <sys/cpu.h>
     56        1.1      manu #include <machine/vmparam.h>
     57  1.10.26.1      haad #include <sys/syscallargs.h>
     58        1.1      manu 
     59        1.1      manu #include <uvm/uvm.h>
     60        1.1      manu 
     61        1.1      manu #include <compat/linux/common/linux_types.h>
     62        1.1      manu #include <compat/linux/common/linux_signal.h>
     63  1.10.26.1      haad #include <compat/linux/common/linux_machdep.h>
     64        1.1      manu #include <compat/linux/common/linux_util.h>
     65        1.1      manu #include <compat/linux/common/linux_ioctl.h>
     66        1.1      manu #include <compat/linux/common/linux_hdio.h>
     67        1.1      manu #include <compat/linux/common/linux_exec.h>
     68        1.1      manu #include <compat/linux/common/linux_errno.h>
     69  1.10.26.1      haad #include <compat/linux/common/linux_prctl.h>
     70  1.10.26.1      haad #include <compat/linux/common/linux_ipc.h>
     71  1.10.26.1      haad #include <compat/linux/common/linux_sem.h>
     72  1.10.26.1      haad #include <compat/linux/linux_syscallargs.h>
     73        1.1      manu 
     74        1.1      manu int
     75        1.4  christos linux_exec_setup_stack(struct lwp *l, struct exec_package *epp)
     76        1.1      manu {
     77        1.1      manu 	u_long max_stack_size;
     78        1.1      manu 	u_long access_linear_min, access_size;
     79        1.1      manu 	u_long noaccess_linear_min, noaccess_size;
     80        1.1      manu 
     81        1.1      manu #ifndef USRSTACK32
     82        1.1      manu #define USRSTACK32      (0x00000000ffffffffL & ~PGOFSET)
     83        1.1      manu #endif
     84        1.1      manu 
     85        1.1      manu 	if (epp->ep_flags & EXEC_32) {
     86        1.1      manu 		epp->ep_minsaddr = USRSTACK32;
     87        1.1      manu 		max_stack_size = MAXSSIZ;
     88        1.1      manu 		if (epp->ep_minsaddr > LINUX_USRSTACK32)
     89        1.1      manu 			epp->ep_minsaddr = LINUX_USRSTACK32;
     90        1.1      manu 	} else {
     91        1.1      manu 		epp->ep_minsaddr = USRSTACK;
     92        1.1      manu 		max_stack_size = MAXSSIZ;
     93        1.1      manu 		if (epp->ep_minsaddr > LINUX_USRSTACK)
     94        1.1      manu 			epp->ep_minsaddr = LINUX_USRSTACK;
     95        1.1      manu 
     96        1.1      manu 	}
     97        1.1      manu 
     98        1.1      manu 	epp->ep_maxsaddr = (u_long)STACK_GROW(epp->ep_minsaddr,
     99        1.1      manu 		max_stack_size);
    100        1.4  christos 	epp->ep_ssize = l->l_proc->p_rlimit[RLIMIT_STACK].rlim_cur;
    101        1.1      manu 
    102        1.1      manu 	/*
    103        1.1      manu 	 * set up commands for stack.  note that this takes *two*, one to
    104        1.1      manu 	 * map the part of the stack which we can access, and one to map
    105        1.1      manu 	 * the part which we can't.
    106        1.1      manu 	 *
    107        1.1      manu 	 * arguably, it could be made into one, but that would require the
    108        1.1      manu 	 * addition of another mapping proc, which is unnecessary
    109        1.1      manu 	 */
    110        1.1      manu 	access_size = epp->ep_ssize;
    111        1.1      manu 	access_linear_min = (u_long)STACK_ALLOC(epp->ep_minsaddr, access_size);
    112        1.1      manu 	noaccess_size = max_stack_size - access_size;
    113        1.1      manu 	noaccess_linear_min = (u_long)STACK_ALLOC(STACK_GROW(epp->ep_minsaddr,
    114        1.1      manu 	    access_size), noaccess_size);
    115        1.1      manu 	if (noaccess_size > 0) {
    116        1.1      manu 		NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, noaccess_size,
    117        1.1      manu 		    noaccess_linear_min, NULLVP, 0, VM_PROT_NONE);
    118        1.1      manu 	}
    119        1.1      manu 	KASSERT(access_size > 0);
    120        1.1      manu 	NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, access_size,
    121        1.1      manu 	    access_linear_min, NULLVP, 0, VM_PROT_READ | VM_PROT_WRITE);
    122        1.1      manu 
    123        1.1      manu 	return 0;
    124        1.1      manu }
    125        1.1      manu 
    126        1.1      manu int
    127        1.5  christos ELFNAME2(linux,copyargs)(l, pack, arginfo, stackp, argp)
    128        1.5  christos 	struct lwp *l;
    129        1.1      manu 	struct exec_package *pack;
    130        1.1      manu 	struct ps_strings *arginfo;
    131        1.1      manu 	char **stackp;
    132        1.1      manu 	void *argp;
    133        1.1      manu {
    134        1.1      manu 	struct linux_extra_stack_data64 *esdp, esd;
    135        1.1      manu 	struct elf_args *ap;
    136        1.5  christos 	struct vattr *vap;
    137        1.1      manu 	Elf_Ehdr *eh;
    138        1.1      manu 	Elf_Phdr *ph;
    139        1.1      manu 	u_long phsize;
    140        1.1      manu 	Elf_Addr phdr = 0;
    141        1.1      manu 	int error;
    142        1.1      manu 	int i;
    143        1.1      manu 
    144        1.5  christos 	if ((error = copyargs(l, pack, arginfo, stackp, argp)) != 0)
    145        1.1      manu 		return error;
    146        1.1      manu 
    147        1.1      manu 	/*
    148        1.1      manu 	 * Push extra arguments on the stack needed by dynamically
    149        1.1      manu 	 * linked binaries and static binaries as well.
    150        1.1      manu 	 */
    151        1.1      manu 	memset(&esd, 0, sizeof(esd));
    152        1.1      manu 	esdp = (struct linux_extra_stack_data64 *)(*stackp);
    153        1.1      manu 	ap = (struct elf_args *)pack->ep_emul_arg;
    154        1.1      manu 	vap = pack->ep_vap;
    155        1.1      manu 	eh = (Elf_Ehdr *)pack->ep_hdr;
    156        1.1      manu 
    157        1.1      manu 	/*
    158        1.1      manu 	 * We forgot this, so we ned to reload it now. XXX keep track of it?
    159        1.1      manu 	 */
    160        1.1      manu 	if (ap == NULL) {
    161        1.1      manu 		phsize = eh->e_phnum * sizeof(Elf_Phdr);
    162        1.1      manu 		ph = (Elf_Phdr *)malloc(phsize, M_TEMP, M_WAITOK);
    163        1.5  christos 		error = exec_read_from(l, pack->ep_vp, eh->e_phoff, ph, phsize);
    164        1.1      manu 		if (error != 0) {
    165        1.1      manu 			for (i = 0; i < eh->e_phnum; i++) {
    166        1.1      manu 				if (ph[i].p_type == PT_PHDR) {
    167        1.1      manu 					phdr = ph[i].p_vaddr;
    168        1.1      manu 					break;
    169        1.1      manu 				}
    170        1.1      manu 			}
    171        1.1      manu 		}
    172        1.1      manu 		free(ph, M_TEMP);
    173        1.1      manu 	}
    174        1.1      manu 
    175        1.1      manu 
    176        1.1      manu 	/*
    177        1.1      manu 	 * The exec_package doesn't have a proc pointer and it's not
    178        1.1      manu 	 * exactly trivial to add one since the credentials are
    179        1.1      manu 	 * changing. XXX Linux uses curlwp's credentials.
    180        1.1      manu 	 * Why can't we use them too?
    181        1.1      manu 	 */
    182        1.1      manu 
    183        1.1      manu 	i = 0;
    184        1.1      manu 	esd.ai[i].a_type = LINUX_AT_HWCAP;
    185        1.1      manu 	esd.ai[i++].a_v = rcr4();
    186        1.1      manu 
    187        1.1      manu 	esd.ai[i].a_type = AT_PAGESZ;
    188        1.1      manu 	esd.ai[i++].a_v = PAGE_SIZE;
    189        1.1      manu 
    190        1.1      manu 	esd.ai[i].a_type = LINUX_AT_CLKTCK;
    191        1.1      manu 	esd.ai[i++].a_v = hz;
    192        1.1      manu 
    193        1.1      manu 	esd.ai[i].a_type = AT_PHDR;
    194        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_phaddr: phdr);
    195        1.1      manu 
    196        1.1      manu 	esd.ai[i].a_type = AT_PHENT;
    197        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_phentsize : eh->e_phentsize);
    198        1.1      manu 
    199        1.1      manu 	esd.ai[i].a_type = AT_PHNUM;
    200        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_phnum : eh->e_phnum);
    201        1.1      manu 
    202        1.1      manu 	esd.ai[i].a_type = AT_BASE;
    203        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_interp : 0);
    204        1.1      manu 
    205        1.1      manu 	esd.ai[i].a_type = AT_FLAGS;
    206        1.1      manu 	esd.ai[i++].a_v = 0;
    207        1.1      manu 
    208        1.1      manu 	esd.ai[i].a_type = AT_ENTRY;
    209        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_entry : eh->e_entry);
    210        1.1      manu 
    211        1.1      manu 	esd.ai[i].a_type = LINUX_AT_EGID;
    212        1.8        ad 	esd.ai[i++].a_v = ((vap->va_mode & S_ISGID) ?
    213        1.8        ad 	    vap->va_gid : kauth_cred_getegid(l->l_cred));
    214        1.1      manu 
    215        1.1      manu 	esd.ai[i].a_type = LINUX_AT_GID;
    216        1.8        ad 	esd.ai[i++].a_v = kauth_cred_getgid(l->l_cred);
    217        1.1      manu 
    218        1.1      manu 	esd.ai[i].a_type = LINUX_AT_EUID;
    219        1.8        ad 	esd.ai[i++].a_v = ((vap->va_mode & S_ISUID) ?
    220        1.8        ad 	    vap->va_uid : kauth_cred_geteuid(l->l_cred));
    221        1.1      manu 
    222        1.1      manu 	esd.ai[i].a_type = LINUX_AT_UID;
    223        1.8        ad 	esd.ai[i++].a_v = kauth_cred_getuid(l->l_cred);
    224        1.1      manu 
    225        1.1      manu 	esd.ai[i].a_type = LINUX_AT_SECURE;
    226        1.1      manu 	esd.ai[i++].a_v = 0;
    227        1.1      manu 
    228        1.1      manu 	esd.ai[i].a_type = LINUX_AT_PLATFORM;
    229        1.1      manu 	esd.ai[i++].a_v = (Elf_Addr)&esdp->hw_platform[0];
    230        1.1      manu 
    231        1.1      manu 	esd.ai[i].a_type = AT_NULL;
    232        1.1      manu 	esd.ai[i++].a_v = 0;
    233        1.1      manu 
    234        1.1      manu #ifdef DEBUG_LINUX
    235        1.1      manu 	if (i != LINUX_ELF_AUX_ENTRIES) {
    236        1.1      manu 		printf("linux_elf64_copyargs: %d Aux entries\n", i);
    237        1.1      manu 		return EINVAL;
    238        1.1      manu 	}
    239        1.1      manu #endif
    240        1.1      manu 
    241        1.1      manu 	strcpy(esd.hw_platform, LINUX_PLATFORM);
    242        1.1      manu 
    243        1.1      manu 	if (ap) {
    244        1.1      manu 		free((char *)ap, M_TEMP);
    245        1.1      manu 		pack->ep_emul_arg = NULL;
    246        1.1      manu 	}
    247        1.1      manu 
    248        1.1      manu 	/*
    249        1.1      manu 	 * Copy out the ELF auxiliary table and hw platform name
    250        1.1      manu 	 */
    251        1.1      manu 	if ((error = copyout(&esd, esdp, sizeof(esd))) != 0)
    252        1.1      manu 		return error;
    253        1.1      manu 	*stackp += sizeof(esd);
    254        1.1      manu 
    255        1.1      manu 	return 0;
    256        1.1      manu }
    257  1.10.26.1      haad 
    258  1.10.26.1      haad #ifdef LINUX_NPTL
    259  1.10.26.1      haad int
    260  1.10.26.1      haad linux_init_thread_area(struct lwp *l, struct lwp *l2)
    261  1.10.26.1      haad {
    262  1.10.26.1      haad 	register_t retval;
    263  1.10.26.1      haad 	struct linux_sys_arch_prctl_args uap;
    264  1.10.26.1      haad 	struct trapframe *tf = l2->l_md.md_regs;
    265  1.10.26.1      haad 
    266  1.10.26.1      haad 	SCARG(&uap, code) = LINUX_ARCH_SET_FS;
    267  1.10.26.1      haad 	SCARG(&uap, addr) = tf->tf_r8;
    268  1.10.26.1      haad 	return linux_sys_arch_prctl(l2, &uap, &retval);
    269  1.10.26.1      haad }
    270  1.10.26.1      haad #endif
    271