Home | History | Annotate | Line # | Download | only in i386
linux_exec_machdep.c revision 1.7
      1  1.7  christos /*	$NetBSD: linux_exec_machdep.c,v 1.7 2008/10/26 03:43:42 christos Exp $	*/
      2  1.1  christos 
      3  1.1  christos /*-
      4  1.1  christos  * Copyright (c) 2004 The NetBSD Foundation, Inc.
      5  1.1  christos  * All rights reserved.
      6  1.1  christos  *
      7  1.1  christos  * This code is derived from software contributed to The NetBSD Foundation
      8  1.1  christos  * by Christos Zoulas.
      9  1.1  christos  *
     10  1.1  christos  * Redistribution and use in source and binary forms, with or without
     11  1.1  christos  * modification, are permitted provided that the following conditions
     12  1.1  christos  * are met:
     13  1.1  christos  * 1. Redistributions of source code must retain the above copyright
     14  1.1  christos  *    notice, this list of conditions and the following disclaimer.
     15  1.1  christos  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.1  christos  *    notice, this list of conditions and the following disclaimer in the
     17  1.1  christos  *    documentation and/or other materials provided with the distribution.
     18  1.1  christos  *
     19  1.1  christos  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20  1.1  christos  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21  1.1  christos  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22  1.1  christos  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23  1.1  christos  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24  1.1  christos  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25  1.1  christos  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26  1.1  christos  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27  1.1  christos  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28  1.1  christos  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29  1.1  christos  * POSSIBILITY OF SUCH DAMAGE.
     30  1.1  christos  */
     31  1.1  christos 
     32  1.1  christos #include <sys/cdefs.h>
     33  1.7  christos __KERNEL_RCSID(0, "$NetBSD: linux_exec_machdep.c,v 1.7 2008/10/26 03:43:42 christos Exp $");
     34  1.1  christos 
     35  1.1  christos #if defined(_KERNEL_OPT)
     36  1.1  christos #include "opt_vm86.h"
     37  1.1  christos #include "opt_user_ldt.h"
     38  1.1  christos #endif
     39  1.1  christos 
     40  1.1  christos #include <sys/param.h>
     41  1.1  christos #include <sys/systm.h>
     42  1.1  christos #include <sys/resource.h>
     43  1.1  christos #include <sys/proc.h>
     44  1.1  christos #include <sys/conf.h>
     45  1.1  christos #include <sys/exec.h>
     46  1.1  christos #include <sys/exec_elf.h>
     47  1.1  christos #include <sys/vnode.h>
     48  1.1  christos #include <sys/lwp.h>
     49  1.1  christos 
     50  1.4        ad #include <sys/cpu.h>
     51  1.1  christos #include <machine/vmparam.h>
     52  1.1  christos 
     53  1.1  christos #include <uvm/uvm.h>
     54  1.1  christos 
     55  1.6  christos #include <sys/syscallargs.h>
     56  1.6  christos 
     57  1.6  christos #ifndef DEBUG_LINUX
     58  1.6  christos #define DPRINTF(a)
     59  1.6  christos #else
     60  1.6  christos #define DPRINTF(a)	uprintf a
     61  1.6  christos #endif
     62  1.6  christos 
     63  1.1  christos #include <compat/linux/common/linux_types.h>
     64  1.1  christos #include <compat/linux/common/linux_signal.h>
     65  1.6  christos #include <compat/linux/common/linux_machdep.h>
     66  1.1  christos #include <compat/linux/common/linux_util.h>
     67  1.1  christos #include <compat/linux/common/linux_ioctl.h>
     68  1.1  christos #include <compat/linux/common/linux_hdio.h>
     69  1.1  christos #include <compat/linux/common/linux_exec.h>
     70  1.1  christos #include <compat/linux/common/linux_errno.h>
     71  1.6  christos #include <compat/linux//linux_syscallargs.h>
     72  1.1  christos 
     73  1.7  christos 
     74  1.1  christos int
     75  1.3  christos linux_exec_setup_stack(struct lwp *l, struct exec_package *epp)
     76  1.1  christos {
     77  1.1  christos 	u_long max_stack_size;
     78  1.1  christos 	u_long access_linear_min, access_size;
     79  1.1  christos 	u_long noaccess_linear_min, noaccess_size;
     80  1.1  christos 
     81  1.1  christos #ifndef	USRSTACK32
     82  1.1  christos #define USRSTACK32	(0x00000000ffffffffL&~PGOFSET)
     83  1.1  christos #endif
     84  1.1  christos 
     85  1.1  christos 	if (epp->ep_flags & EXEC_32) {
     86  1.1  christos 		epp->ep_minsaddr = USRSTACK32;
     87  1.1  christos 		max_stack_size = MAXSSIZ;
     88  1.1  christos 	} else {
     89  1.1  christos 		epp->ep_minsaddr = USRSTACK;
     90  1.1  christos 		max_stack_size = MAXSSIZ;
     91  1.1  christos 	}
     92  1.1  christos 
     93  1.1  christos 	if (epp->ep_minsaddr > LINUX_USRSTACK)
     94  1.1  christos 		epp->ep_minsaddr = LINUX_USRSTACK;
     95  1.1  christos #ifdef DEBUG_LINUX
     96  1.1  christos 	else {
     97  1.1  christos 		/*
     98  1.1  christos 		 * Someone needs to make KERNBASE and TEXTADDR
     99  1.1  christos 		 * java versions < 1.4.2 need the stack to be
    100  1.1  christos 		 * at 0xC0000000
    101  1.1  christos 		 */
    102  1.1  christos 		uprintf("Cannot setup stack to 0xC0000000, "
    103  1.1  christos 		    "java will not work properly\n");
    104  1.1  christos 	}
    105  1.1  christos #endif
    106  1.2     perry 	epp->ep_maxsaddr = (u_long)STACK_GROW(epp->ep_minsaddr,
    107  1.1  christos 		max_stack_size);
    108  1.3  christos 	epp->ep_ssize = l->l_proc->p_rlimit[RLIMIT_STACK].rlim_cur;
    109  1.1  christos 
    110  1.1  christos 	/*
    111  1.1  christos 	 * set up commands for stack.  note that this takes *two*, one to
    112  1.1  christos 	 * map the part of the stack which we can access, and one to map
    113  1.1  christos 	 * the part which we can't.
    114  1.1  christos 	 *
    115  1.1  christos 	 * arguably, it could be made into one, but that would require the
    116  1.1  christos 	 * addition of another mapping proc, which is unnecessary
    117  1.1  christos 	 */
    118  1.1  christos 	access_size = epp->ep_ssize;
    119  1.1  christos 	access_linear_min = (u_long)STACK_ALLOC(epp->ep_minsaddr, access_size);
    120  1.1  christos 	noaccess_size = max_stack_size - access_size;
    121  1.2     perry 	noaccess_linear_min = (u_long)STACK_ALLOC(STACK_GROW(epp->ep_minsaddr,
    122  1.1  christos 	    access_size), noaccess_size);
    123  1.1  christos 	if (noaccess_size > 0) {
    124  1.1  christos 		NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, noaccess_size,
    125  1.1  christos 		    noaccess_linear_min, NULLVP, 0, VM_PROT_NONE);
    126  1.1  christos 	}
    127  1.1  christos 	KASSERT(access_size > 0);
    128  1.1  christos 	NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, access_size,
    129  1.1  christos 	    access_linear_min, NULLVP, 0, VM_PROT_READ | VM_PROT_WRITE);
    130  1.1  christos 
    131  1.1  christos 	return 0;
    132  1.1  christos }
    133  1.6  christos 
    134  1.6  christos 
    135  1.6  christos #ifdef LINUX_NPTL
    136  1.7  christos static __inline void
    137  1.7  christos load_gs(u_int sel)
    138  1.7  christos {
    139  1.7  christos         __asm __volatile("movl %0,%%gs" : : "rm" (sel));
    140  1.7  christos }
    141  1.7  christos 
    142  1.6  christos 
    143  1.6  christos int
    144  1.6  christos linux_init_thread_area(struct lwp *l, struct lwp *l2)
    145  1.6  christos {
    146  1.6  christos 	struct trapframe *tf = l->l_md.md_regs, *tf2 = l2->l_md.md_regs;
    147  1.6  christos 	struct pcb *pcb2 = &l2->l_addr->u_pcb;
    148  1.6  christos 	struct linux_user_desc info;
    149  1.6  christos 	struct segment_descriptor sd;
    150  1.6  christos 	int error, idx, a[2];
    151  1.6  christos 
    152  1.6  christos 	error = copyin((void *)tf->tf_esi, &info, sizeof(info));
    153  1.6  christos 	if (error)
    154  1.6  christos 		return error;
    155  1.6  christos 	idx = info.entry_number;
    156  1.6  christos 
    157  1.6  christos 	/*
    158  1.6  christos 	 * looks like we're getting the idx we returned
    159  1.6  christos 	 * in the set_thread_area() syscall
    160  1.6  christos 	 */
    161  1.6  christos 	if (idx != 6 && idx != 3) {
    162  1.6  christos 		printf("resetting idx %d to 3", idx);
    163  1.6  christos 		idx = 3;
    164  1.6  christos 	}
    165  1.6  christos 
    166  1.6  christos 	/* this doesnt happen in practice */
    167  1.6  christos 	if (idx == 6) {
    168  1.6  christos 		/* we might copy out the entry_number as 3 */
    169  1.6  christos 		info.entry_number = 3;
    170  1.6  christos 		error = copyout(&info, (void *)tf->tf_esi, sizeof(info));
    171  1.6  christos 		if (error)
    172  1.6  christos 			return error;
    173  1.6  christos 	}
    174  1.6  christos 
    175  1.6  christos 	a[0] = LINUX_LDT_entry_a(&info);
    176  1.6  christos 	a[1] = LINUX_LDT_entry_b(&info);
    177  1.6  christos 
    178  1.6  christos 	(void)memcpy(&sd, &a, sizeof(a));
    179  1.6  christos 	DPRINTF(("Segment created in clone with CLONE_SETTLS: lobase: %x, "
    180  1.6  christos 	    "hibase: %x, lolimit: %x, hilimit: %x, type: %i, dpl: %i, p: %i, "
    181  1.6  christos 	    "xx: %i, def32: %i, gran: %i\n", sd.sd_lobase,
    182  1.6  christos 	    sd.sd_hibase, sd.sd_lolimit, sd.sd_hilimit, sd.sd_type, sd.sd_dpl,
    183  1.6  christos 	    sd.sd_p, sd.sd_xx, sd.sd_def32, sd.sd_gran));
    184  1.6  christos 
    185  1.7  christos 	kpreempt_disable();
    186  1.7  christos 	(void)memcpy(&pcb2->pcb_gsd, &sd, sizeof(sd));
    187  1.7  christos 	(void)memcpy(&curcpu()->ci_gdt[GUGS_SEL], &sd, sizeof(sd));
    188  1.6  christos 	tf2->tf_gs = GSEL(GUGS_SEL, SEL_UPL);
    189  1.7  christos 	load_gs(tf2->tf_gs);
    190  1.7  christos 	kpreempt_enable();
    191  1.6  christos 	return 0;
    192  1.6  christos }
    193  1.6  christos 
    194  1.6  christos 
    195  1.6  christos int
    196  1.6  christos linux_sys_set_thread_area(struct lwp *l,
    197  1.6  christos     const struct linux_sys_set_thread_area_args *uap, register_t *retval)
    198  1.6  christos {
    199  1.6  christos 	struct trapframe *tf = l->l_md.md_regs;
    200  1.6  christos 	struct pcb *pcb = &l->l_addr->u_pcb;
    201  1.6  christos 	struct linux_user_desc info;
    202  1.6  christos 	struct segment_descriptor sd;
    203  1.6  christos 	int error, idx, a[2];
    204  1.6  christos 
    205  1.6  christos 	*retval = 0;
    206  1.6  christos 	error = copyin(SCARG(uap, desc), &info, sizeof(info));
    207  1.6  christos 	if (error)
    208  1.6  christos 		return error;
    209  1.6  christos 
    210  1.6  christos 	DPRINTF(("set thread area: %i, %x, %x, %i, %i, %i, %i, %i, %i\n",
    211  1.6  christos 	    info.entry_number, info.base_addr, info.limit, info.seg_32bit,
    212  1.6  christos 	    info.contents, info.read_exec_only, info.limit_in_pages,
    213  1.6  christos 	    info.seg_not_present, info.useable));
    214  1.6  christos 
    215  1.6  christos 	idx = info.entry_number;
    216  1.6  christos 	/*
    217  1.6  christos 	 * Semantics of linux version: every thread in the system has array of
    218  1.6  christos 	 * 3 tls descriptors. 1st is GLIBC TLS, 2nd is WINE, 3rd unknown. This
    219  1.6  christos 	 * syscall loads one of the selected tls decriptors with a value and
    220  1.6  christos 	 * also loads GDT descriptors 6, 7 and 8 with the content of the
    221  1.6  christos 	 * per-thread descriptors.
    222  1.6  christos 	 *
    223  1.6  christos 	 * Semantics of fbsd version: I think we can ignore that linux has 3
    224  1.6  christos 	 * per-thread descriptors and use just the 1st one. The tls_array[]
    225  1.6  christos 	 * is used only in set/get-thread_area() syscalls and for loading the
    226  1.6  christos 	 * GDT descriptors. In fbsd we use just one GDT descriptor for TLS so
    227  1.6  christos 	 * we will load just one.
    228  1.6  christos 	 *
    229  1.6  christos 	 * XXX: this doesn't work when a user space process tries to use more
    230  1.6  christos 	 * than 1 TLS segment. Comment in the linux sources says wine might do
    231  1.6  christos 	 * this.
    232  1.6  christos 	 */
    233  1.6  christos 
    234  1.6  christos 	/*
    235  1.6  christos 	 * we support just GLIBC TLS now
    236  1.6  christos 	 * we should let 3 proceed as well because we use this segment so
    237  1.6  christos 	 * if code does two subsequent calls it should succeed
    238  1.6  christos 	 */
    239  1.6  christos 	if (idx != 6 && idx != -1 && idx != 3)
    240  1.6  christos 		return EINVAL;
    241  1.6  christos 
    242  1.6  christos 	/*
    243  1.6  christos 	 * we have to copy out the GDT entry we use
    244  1.6  christos 	 * FreeBSD uses GDT entry #3 for storing %gs so load that
    245  1.6  christos 	 *
    246  1.6  christos 	 * XXX: what if a user space program doesn't check this value and tries
    247  1.6  christos 	 * to use 6, 7 or 8?
    248  1.6  christos 	 */
    249  1.6  christos 	idx = info.entry_number = 3;
    250  1.6  christos 	error = copyout(&info, SCARG(uap, desc), sizeof(info));
    251  1.6  christos 	if (error)
    252  1.6  christos 		return error;
    253  1.6  christos 
    254  1.6  christos 	if (LINUX_LDT_empty(&info)) {
    255  1.6  christos 		a[0] = 0;
    256  1.6  christos 		a[1] = 0;
    257  1.6  christos 	} else {
    258  1.6  christos 		a[0] = LINUX_LDT_entry_a(&info);
    259  1.6  christos 		a[1] = LINUX_LDT_entry_b(&info);
    260  1.6  christos 	}
    261  1.6  christos 
    262  1.6  christos 	(void)memcpy(&sd, &a, sizeof(a));
    263  1.6  christos 	DPRINTF(("Segment created in set_thread_area: lobase: %x, hibase: %x, "
    264  1.6  christos 	    "lolimit: %x, hilimit: %x, type: %i, dpl: %i, p: %i, xx: %i, "
    265  1.6  christos 	    "def32: %i, gran: %i\n", sd.sd_lobase, sd.sd_hibase, sd.sd_lolimit,
    266  1.6  christos 	    sd.sd_hilimit, sd.sd_type, sd.sd_dpl, sd.sd_p, sd.sd_xx,
    267  1.6  christos 	    sd.sd_def32, sd.sd_gran));
    268  1.6  christos 
    269  1.7  christos 	kpreempt_disable();
    270  1.7  christos 	(void)memcpy(&pcb->pcb_gsd, &sd, sizeof(sd));
    271  1.7  christos 	(void)memcpy(&curcpu()->ci_gdt[GUGS_SEL], &sd, sizeof(sd));
    272  1.6  christos 	tf->tf_gs = GSEL(GUGS_SEL, SEL_UPL);
    273  1.7  christos 	load_gs(tf->tf_gs);
    274  1.7  christos 	kpreempt_enable();
    275  1.6  christos 	return 0;
    276  1.6  christos }
    277  1.6  christos 
    278  1.6  christos int
    279  1.6  christos linux_sys_get_thread_area(struct lwp *l,
    280  1.6  christos     const struct linux_sys_get_thread_area_args *uap, register_t *retval)
    281  1.6  christos {
    282  1.6  christos 	struct pcb *pcb = &l->l_addr->u_pcb;
    283  1.6  christos 	struct linux_user_desc info;
    284  1.6  christos 	struct linux_desc_struct desc;
    285  1.6  christos 	struct segment_descriptor sd;
    286  1.6  christos 	int error, idx;
    287  1.6  christos 
    288  1.6  christos 	*retval = 0;
    289  1.6  christos 	error = copyin(SCARG(uap, desc), &info, sizeof(info));
    290  1.6  christos 	if (error)
    291  1.6  christos 		return error;
    292  1.6  christos 
    293  1.6  christos 	idx = info.entry_number;
    294  1.6  christos 	/* XXX: I am not sure if we want 3 to be allowed too. */
    295  1.6  christos 	if (idx != 6 && idx != 3)
    296  1.6  christos 		return EINVAL;
    297  1.6  christos 
    298  1.6  christos 	idx = 3;
    299  1.6  christos 
    300  1.6  christos 	(void)memset(&info, 0, sizeof(info));
    301  1.6  christos 	(void)memcpy(&sd, pcb->pcb_gsd, sizeof(sd));
    302  1.6  christos 	(void)memcpy(&desc, &sd, sizeof(desc));
    303  1.6  christos 
    304  1.6  christos 	info.entry_number = idx;
    305  1.6  christos 	info.base_addr = LINUX_GET_BASE(&desc);
    306  1.6  christos 	info.limit = LINUX_GET_LIMIT(&desc);
    307  1.6  christos 	info.seg_32bit = LINUX_GET_32BIT(&desc);
    308  1.6  christos 	info.contents = LINUX_GET_CONTENTS(&desc);
    309  1.6  christos 	info.read_exec_only = !LINUX_GET_WRITABLE(&desc);
    310  1.6  christos 	info.limit_in_pages = LINUX_GET_LIMIT_PAGES(&desc);
    311  1.6  christos 	info.seg_not_present = !LINUX_GET_PRESENT(&desc);
    312  1.6  christos 	info.useable = LINUX_GET_USEABLE(&desc);
    313  1.6  christos 
    314  1.6  christos 	return copyout(&info, SCARG(uap, desc), sizeof(info));
    315  1.6  christos }
    316  1.6  christos 
    317  1.6  christos #endif
    318