Home | History | Annotate | Line # | Download | only in amd64
      1  1.25  riastrad /*	$NetBSD: linux_exec_machdep.c,v 1.25 2024/10/01 16:35:42 riastradh Exp $ */
      2   1.1      manu 
      3   1.1      manu /*-
      4   1.1      manu  * Copyright (c) 2005 Emmanuel Dreyfus, all rights reserved
      5   1.1      manu  *
      6   1.1      manu  * Redistribution and use in source and binary forms, with or without
      7   1.1      manu  * modification, are permitted provided that the following conditions
      8   1.1      manu  * are met:
      9   1.1      manu  * 1. Redistributions of source code must retain the above copyright
     10   1.1      manu  *    notice, this list of conditions and the following disclaimer.
     11   1.1      manu  * 2. Redistributions in binary form must reproduce the above copyright
     12   1.1      manu  *    notice, this list of conditions and the following disclaimer in the
     13   1.1      manu  *    documentation and/or other materials provided with the distribution.
     14   1.1      manu  * 3. All advertising materials mentioning features or use of this software
     15   1.1      manu  *    must display the following acknowledgement:
     16   1.1      manu  *	This product includes software developed by Emmanuel Dreyfus
     17  1.25  riastrad  * 4. The name of the author may not be used to endorse or promote
     18  1.25  riastrad  *    products derived from this software without specific prior written
     19   1.1      manu  *    permission.
     20   1.1      manu  *
     21  1.25  riastrad  * THIS SOFTWARE IS PROVIDED BY THE THE AUTHOR AND CONTRIBUTORS ``AS IS''
     22  1.25  riastrad  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
     23   1.1      manu  * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     24  1.25  riastrad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS
     25   1.1      manu  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     26   1.1      manu  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     27   1.1      manu  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     28   1.1      manu  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     29   1.1      manu  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     30   1.1      manu  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     31   1.1      manu  * POSSIBILITY OF SUCH DAMAGE.
     32   1.1      manu  */
     33   1.1      manu 
     34   1.1      manu #include <sys/cdefs.h>
     35  1.25  riastrad __KERNEL_RCSID(0, "$NetBSD: linux_exec_machdep.c,v 1.25 2024/10/01 16:35:42 riastradh Exp $");
     36   1.1      manu 
     37   1.1      manu #define ELFSIZE 64
     38   1.1      manu 
     39   1.1      manu #include <sys/param.h>
     40   1.1      manu #include <sys/systm.h>
     41   1.1      manu #include <sys/kernel.h>
     42   1.1      manu #include <sys/resource.h>
     43   1.1      manu #include <sys/proc.h>
     44   1.1      manu #include <sys/conf.h>
     45  1.19      matt #include <sys/kmem.h>
     46   1.1      manu #include <sys/exec_elf.h>
     47   1.1      manu #include <sys/vnode.h>
     48   1.1      manu #include <sys/lwp.h>
     49   1.1      manu #include <sys/exec.h>
     50   1.1      manu #include <sys/stat.h>
     51   1.7      yamt #include <sys/kauth.h>
     52  1.22     njoly #include <sys/cprng.h>
     53   1.1      manu 
     54  1.10        ad #include <sys/cpu.h>
     55   1.1      manu #include <machine/vmparam.h>
     56  1.13  christos #include <sys/syscallargs.h>
     57   1.1      manu 
     58   1.1      manu #include <compat/linux/common/linux_types.h>
     59   1.1      manu #include <compat/linux/common/linux_signal.h>
     60  1.12  christos #include <compat/linux/common/linux_machdep.h>
     61   1.1      manu #include <compat/linux/common/linux_util.h>
     62   1.1      manu #include <compat/linux/common/linux_ioctl.h>
     63   1.1      manu #include <compat/linux/common/linux_hdio.h>
     64   1.1      manu #include <compat/linux/common/linux_exec.h>
     65   1.1      manu #include <compat/linux/common/linux_errno.h>
     66  1.13  christos #include <compat/linux/common/linux_prctl.h>
     67  1.14        ad #include <compat/linux/common/linux_ipc.h>
     68  1.14        ad #include <compat/linux/common/linux_sem.h>
     69  1.13  christos #include <compat/linux/linux_syscallargs.h>
     70   1.1      manu 
     71   1.1      manu int
     72   1.4  christos linux_exec_setup_stack(struct lwp *l, struct exec_package *epp)
     73   1.1      manu {
     74   1.1      manu 	u_long max_stack_size;
     75   1.1      manu 	u_long access_linear_min, access_size;
     76   1.1      manu 	u_long noaccess_linear_min, noaccess_size;
     77   1.1      manu 
     78   1.1      manu #ifndef USRSTACK32
     79   1.1      manu #define USRSTACK32      (0x00000000ffffffffL & ~PGOFSET)
     80   1.1      manu #endif
     81   1.1      manu 
     82   1.1      manu 	if (epp->ep_flags & EXEC_32) {
     83   1.1      manu 		epp->ep_minsaddr = USRSTACK32;
     84   1.1      manu 		max_stack_size = MAXSSIZ;
     85   1.1      manu 		if (epp->ep_minsaddr > LINUX_USRSTACK32)
     86   1.1      manu 			epp->ep_minsaddr = LINUX_USRSTACK32;
     87   1.1      manu 	} else {
     88   1.1      manu 		epp->ep_minsaddr = USRSTACK;
     89   1.1      manu 		max_stack_size = MAXSSIZ;
     90   1.1      manu 		if (epp->ep_minsaddr > LINUX_USRSTACK)
     91   1.1      manu 			epp->ep_minsaddr = LINUX_USRSTACK;
     92   1.1      manu 
     93   1.1      manu 	}
     94   1.1      manu 
     95   1.1      manu 	epp->ep_maxsaddr = (u_long)STACK_GROW(epp->ep_minsaddr,
     96   1.1      manu 		max_stack_size);
     97   1.4  christos 	epp->ep_ssize = l->l_proc->p_rlimit[RLIMIT_STACK].rlim_cur;
     98   1.1      manu 
     99   1.1      manu 	/*
    100   1.1      manu 	 * set up commands for stack.  note that this takes *two*, one to
    101   1.1      manu 	 * map the part of the stack which we can access, and one to map
    102   1.1      manu 	 * the part which we can't.
    103   1.1      manu 	 *
    104   1.1      manu 	 * arguably, it could be made into one, but that would require the
    105   1.1      manu 	 * addition of another mapping proc, which is unnecessary
    106   1.1      manu 	 */
    107   1.1      manu 	access_size = epp->ep_ssize;
    108   1.1      manu 	access_linear_min = (u_long)STACK_ALLOC(epp->ep_minsaddr, access_size);
    109   1.1      manu 	noaccess_size = max_stack_size - access_size;
    110   1.1      manu 	noaccess_linear_min = (u_long)STACK_ALLOC(STACK_GROW(epp->ep_minsaddr,
    111   1.1      manu 	    access_size), noaccess_size);
    112   1.1      manu 	if (noaccess_size > 0) {
    113  1.16       mrg 		NEW_VMCMD2(&epp->ep_vmcmds, vmcmd_map_zero, noaccess_size,
    114  1.16       mrg 		    noaccess_linear_min, NULLVP, 0, VM_PROT_NONE, VMCMD_STACK);
    115   1.1      manu 	}
    116   1.1      manu 	KASSERT(access_size > 0);
    117  1.16       mrg 	NEW_VMCMD2(&epp->ep_vmcmds, vmcmd_map_zero, access_size,
    118  1.16       mrg 	    access_linear_min, NULLVP, 0, VM_PROT_READ | VM_PROT_WRITE,
    119  1.16       mrg 	    VMCMD_STACK);
    120   1.1      manu 
    121   1.1      manu 	return 0;
    122   1.1      manu }
    123   1.1      manu 
    124   1.1      manu int
    125  1.15    cegger ELFNAME2(linux,copyargs)(struct lwp *l, struct exec_package *pack,
    126  1.15    cegger 	struct ps_strings *arginfo, char **stackp, void *argp)
    127   1.1      manu {
    128   1.1      manu 	struct linux_extra_stack_data64 *esdp, esd;
    129   1.1      manu 	struct elf_args *ap;
    130   1.5  christos 	struct vattr *vap;
    131   1.1      manu 	Elf_Ehdr *eh;
    132   1.1      manu 	Elf_Phdr *ph;
    133   1.1      manu 	u_long phsize;
    134   1.1      manu 	Elf_Addr phdr = 0;
    135   1.1      manu 	int error;
    136   1.1      manu 	int i;
    137   1.1      manu 
    138   1.5  christos 	if ((error = copyargs(l, pack, arginfo, stackp, argp)) != 0)
    139   1.1      manu 		return error;
    140   1.1      manu 
    141   1.1      manu 	/*
    142   1.1      manu 	 * Push extra arguments on the stack needed by dynamically
    143   1.1      manu 	 * linked binaries and static binaries as well.
    144   1.1      manu 	 */
    145   1.1      manu 	memset(&esd, 0, sizeof(esd));
    146   1.1      manu 	esdp = (struct linux_extra_stack_data64 *)(*stackp);
    147   1.1      manu 	ap = (struct elf_args *)pack->ep_emul_arg;
    148   1.1      manu 	vap = pack->ep_vap;
    149   1.1      manu 	eh = (Elf_Ehdr *)pack->ep_hdr;
    150   1.1      manu 
    151   1.1      manu 	/*
    152  1.17     njoly 	 * We forgot this, so we need to reload it now. XXX keep track of it?
    153   1.1      manu 	 */
    154   1.1      manu 	if (ap == NULL) {
    155   1.1      manu 		phsize = eh->e_phnum * sizeof(Elf_Phdr);
    156  1.19      matt 		ph = (Elf_Phdr *)kmem_alloc(phsize, KM_SLEEP);
    157  1.23        ad 		error = exec_read(l, pack->ep_vp, eh->e_phoff, ph, phsize, 0);
    158   1.1      manu 		if (error != 0) {
    159   1.1      manu 			for (i = 0; i < eh->e_phnum; i++) {
    160   1.1      manu 				if (ph[i].p_type == PT_PHDR) {
    161   1.1      manu 					phdr = ph[i].p_vaddr;
    162   1.1      manu 					break;
    163   1.1      manu 				}
    164   1.1      manu 			}
    165   1.1      manu 		}
    166  1.19      matt 		kmem_free(ph, phsize);
    167   1.1      manu 	}
    168   1.1      manu 
    169   1.1      manu 
    170   1.1      manu 	/*
    171   1.1      manu 	 * The exec_package doesn't have a proc pointer and it's not
    172   1.1      manu 	 * exactly trivial to add one since the credentials are
    173   1.1      manu 	 * changing. XXX Linux uses curlwp's credentials.
    174   1.1      manu 	 * Why can't we use them too?
    175   1.1      manu 	 */
    176   1.1      manu 
    177   1.1      manu 	i = 0;
    178   1.1      manu 	esd.ai[i].a_type = LINUX_AT_HWCAP;
    179   1.1      manu 	esd.ai[i++].a_v = rcr4();
    180   1.1      manu 
    181   1.1      manu 	esd.ai[i].a_type = AT_PAGESZ;
    182   1.1      manu 	esd.ai[i++].a_v = PAGE_SIZE;
    183   1.1      manu 
    184   1.1      manu 	esd.ai[i].a_type = LINUX_AT_CLKTCK;
    185   1.1      manu 	esd.ai[i++].a_v = hz;
    186   1.1      manu 
    187   1.1      manu 	esd.ai[i].a_type = AT_PHDR;
    188   1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_phaddr: phdr);
    189   1.1      manu 
    190   1.1      manu 	esd.ai[i].a_type = AT_PHENT;
    191   1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_phentsize : eh->e_phentsize);
    192   1.1      manu 
    193   1.1      manu 	esd.ai[i].a_type = AT_PHNUM;
    194   1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_phnum : eh->e_phnum);
    195   1.1      manu 
    196   1.1      manu 	esd.ai[i].a_type = AT_BASE;
    197   1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_interp : 0);
    198   1.1      manu 
    199   1.1      manu 	esd.ai[i].a_type = AT_FLAGS;
    200   1.1      manu 	esd.ai[i++].a_v = 0;
    201   1.1      manu 
    202   1.1      manu 	esd.ai[i].a_type = AT_ENTRY;
    203   1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_entry : eh->e_entry);
    204   1.1      manu 
    205   1.1      manu 	esd.ai[i].a_type = LINUX_AT_EGID;
    206   1.8        ad 	esd.ai[i++].a_v = ((vap->va_mode & S_ISGID) ?
    207   1.8        ad 	    vap->va_gid : kauth_cred_getegid(l->l_cred));
    208   1.1      manu 
    209   1.1      manu 	esd.ai[i].a_type = LINUX_AT_GID;
    210   1.8        ad 	esd.ai[i++].a_v = kauth_cred_getgid(l->l_cred);
    211   1.1      manu 
    212   1.1      manu 	esd.ai[i].a_type = LINUX_AT_EUID;
    213  1.25  riastrad 	esd.ai[i++].a_v = ((vap->va_mode & S_ISUID) ?
    214   1.8        ad 	    vap->va_uid : kauth_cred_geteuid(l->l_cred));
    215   1.1      manu 
    216   1.1      manu 	esd.ai[i].a_type = LINUX_AT_UID;
    217   1.8        ad 	esd.ai[i++].a_v = kauth_cred_getuid(l->l_cred);
    218   1.1      manu 
    219   1.1      manu 	esd.ai[i].a_type = LINUX_AT_SECURE;
    220   1.1      manu 	esd.ai[i++].a_v = 0;
    221   1.1      manu 
    222   1.1      manu 	esd.ai[i].a_type = LINUX_AT_PLATFORM;
    223   1.1      manu 	esd.ai[i++].a_v = (Elf_Addr)&esdp->hw_platform[0];
    224   1.1      manu 
    225  1.20       chs 	esd.ai[i].a_type = LINUX_AT_RANDOM;
    226  1.20       chs 	esd.ai[i++].a_v = (Elf_Addr)&esdp->randbytes[0];
    227  1.22     njoly 	esd.randbytes[0] = cprng_strong32();
    228  1.22     njoly 	esd.randbytes[1] = cprng_strong32();
    229  1.22     njoly 	esd.randbytes[2] = cprng_strong32();
    230  1.22     njoly 	esd.randbytes[3] = cprng_strong32();
    231  1.20       chs 
    232   1.1      manu 	esd.ai[i].a_type = AT_NULL;
    233   1.1      manu 	esd.ai[i++].a_v = 0;
    234   1.1      manu 
    235  1.21      maxv 	KASSERT(i == LINUX_ELF_AUX_ENTRIES);
    236  1.21      maxv 
    237  1.25  riastrad 	strcpy(esd.hw_platform, LINUX_PLATFORM);
    238   1.1      manu 
    239  1.19      matt 	exec_free_emul_arg(pack);
    240  1.19      matt 
    241   1.1      manu 	/*
    242   1.1      manu 	 * Copy out the ELF auxiliary table and hw platform name
    243   1.1      manu 	 */
    244   1.1      manu 	if ((error = copyout(&esd, esdp, sizeof(esd))) != 0)
    245   1.1      manu 		return error;
    246   1.1      manu 	*stackp += sizeof(esd);
    247   1.1      manu 
    248   1.1      manu 	return 0;
    249   1.1      manu }
    250