Home | History | Annotate | Line # | Download | only in amd64
linux_exec_machdep.c revision 1.24.26.1
      1  1.24.26.1  perseant /*	$NetBSD: linux_exec_machdep.c,v 1.24.26.1 2025/08/02 05:56:21 perseant Exp $ */
      2        1.1      manu 
      3        1.1      manu /*-
      4        1.1      manu  * Copyright (c) 2005 Emmanuel Dreyfus, all rights reserved
      5        1.1      manu  *
      6        1.1      manu  * Redistribution and use in source and binary forms, with or without
      7        1.1      manu  * modification, are permitted provided that the following conditions
      8        1.1      manu  * are met:
      9        1.1      manu  * 1. Redistributions of source code must retain the above copyright
     10        1.1      manu  *    notice, this list of conditions and the following disclaimer.
     11        1.1      manu  * 2. Redistributions in binary form must reproduce the above copyright
     12        1.1      manu  *    notice, this list of conditions and the following disclaimer in the
     13        1.1      manu  *    documentation and/or other materials provided with the distribution.
     14        1.1      manu  * 3. All advertising materials mentioning features or use of this software
     15        1.1      manu  *    must display the following acknowledgement:
     16        1.1      manu  *	This product includes software developed by Emmanuel Dreyfus
     17  1.24.26.1  perseant  * 4. The name of the author may not be used to endorse or promote
     18  1.24.26.1  perseant  *    products derived from this software without specific prior written
     19        1.1      manu  *    permission.
     20        1.1      manu  *
     21  1.24.26.1  perseant  * THIS SOFTWARE IS PROVIDED BY THE THE AUTHOR AND CONTRIBUTORS ``AS IS''
     22  1.24.26.1  perseant  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
     23        1.1      manu  * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     24  1.24.26.1  perseant  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS
     25        1.1      manu  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     26        1.1      manu  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     27        1.1      manu  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     28        1.1      manu  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     29        1.1      manu  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     30        1.1      manu  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     31        1.1      manu  * POSSIBILITY OF SUCH DAMAGE.
     32        1.1      manu  */
     33        1.1      manu 
     34        1.1      manu #include <sys/cdefs.h>
     35  1.24.26.1  perseant __KERNEL_RCSID(0, "$NetBSD: linux_exec_machdep.c,v 1.24.26.1 2025/08/02 05:56:21 perseant Exp $");
     36        1.1      manu 
     37        1.1      manu #define ELFSIZE 64
     38        1.1      manu 
     39        1.1      manu #include <sys/param.h>
     40        1.1      manu #include <sys/systm.h>
     41        1.1      manu #include <sys/kernel.h>
     42        1.1      manu #include <sys/resource.h>
     43        1.1      manu #include <sys/proc.h>
     44        1.1      manu #include <sys/conf.h>
     45       1.19      matt #include <sys/kmem.h>
     46        1.1      manu #include <sys/exec_elf.h>
     47        1.1      manu #include <sys/vnode.h>
     48        1.1      manu #include <sys/lwp.h>
     49        1.1      manu #include <sys/exec.h>
     50        1.1      manu #include <sys/stat.h>
     51        1.7      yamt #include <sys/kauth.h>
     52       1.22     njoly #include <sys/cprng.h>
     53        1.1      manu 
     54       1.10        ad #include <sys/cpu.h>
     55        1.1      manu #include <machine/vmparam.h>
     56       1.13  christos #include <sys/syscallargs.h>
     57        1.1      manu 
     58        1.1      manu #include <compat/linux/common/linux_types.h>
     59        1.1      manu #include <compat/linux/common/linux_signal.h>
     60       1.12  christos #include <compat/linux/common/linux_machdep.h>
     61        1.1      manu #include <compat/linux/common/linux_util.h>
     62        1.1      manu #include <compat/linux/common/linux_ioctl.h>
     63        1.1      manu #include <compat/linux/common/linux_hdio.h>
     64        1.1      manu #include <compat/linux/common/linux_exec.h>
     65        1.1      manu #include <compat/linux/common/linux_errno.h>
     66       1.13  christos #include <compat/linux/common/linux_prctl.h>
     67       1.14        ad #include <compat/linux/common/linux_ipc.h>
     68       1.14        ad #include <compat/linux/common/linux_sem.h>
     69       1.13  christos #include <compat/linux/linux_syscallargs.h>
     70        1.1      manu 
     71        1.1      manu int
     72        1.4  christos linux_exec_setup_stack(struct lwp *l, struct exec_package *epp)
     73        1.1      manu {
     74        1.1      manu 	u_long max_stack_size;
     75        1.1      manu 	u_long access_linear_min, access_size;
     76        1.1      manu 	u_long noaccess_linear_min, noaccess_size;
     77        1.1      manu 
     78        1.1      manu #ifndef USRSTACK32
     79        1.1      manu #define USRSTACK32      (0x00000000ffffffffL & ~PGOFSET)
     80        1.1      manu #endif
     81        1.1      manu 
     82        1.1      manu 	if (epp->ep_flags & EXEC_32) {
     83        1.1      manu 		epp->ep_minsaddr = USRSTACK32;
     84        1.1      manu 		max_stack_size = MAXSSIZ;
     85        1.1      manu 		if (epp->ep_minsaddr > LINUX_USRSTACK32)
     86        1.1      manu 			epp->ep_minsaddr = LINUX_USRSTACK32;
     87        1.1      manu 	} else {
     88        1.1      manu 		epp->ep_minsaddr = USRSTACK;
     89        1.1      manu 		max_stack_size = MAXSSIZ;
     90        1.1      manu 		if (epp->ep_minsaddr > LINUX_USRSTACK)
     91        1.1      manu 			epp->ep_minsaddr = LINUX_USRSTACK;
     92        1.1      manu 
     93        1.1      manu 	}
     94        1.1      manu 
     95        1.1      manu 	epp->ep_maxsaddr = (u_long)STACK_GROW(epp->ep_minsaddr,
     96        1.1      manu 		max_stack_size);
     97        1.4  christos 	epp->ep_ssize = l->l_proc->p_rlimit[RLIMIT_STACK].rlim_cur;
     98        1.1      manu 
     99        1.1      manu 	/*
    100        1.1      manu 	 * set up commands for stack.  note that this takes *two*, one to
    101        1.1      manu 	 * map the part of the stack which we can access, and one to map
    102        1.1      manu 	 * the part which we can't.
    103        1.1      manu 	 *
    104        1.1      manu 	 * arguably, it could be made into one, but that would require the
    105        1.1      manu 	 * addition of another mapping proc, which is unnecessary
    106        1.1      manu 	 */
    107        1.1      manu 	access_size = epp->ep_ssize;
    108        1.1      manu 	access_linear_min = (u_long)STACK_ALLOC(epp->ep_minsaddr, access_size);
    109        1.1      manu 	noaccess_size = max_stack_size - access_size;
    110        1.1      manu 	noaccess_linear_min = (u_long)STACK_ALLOC(STACK_GROW(epp->ep_minsaddr,
    111        1.1      manu 	    access_size), noaccess_size);
    112        1.1      manu 	if (noaccess_size > 0) {
    113       1.16       mrg 		NEW_VMCMD2(&epp->ep_vmcmds, vmcmd_map_zero, noaccess_size,
    114       1.16       mrg 		    noaccess_linear_min, NULLVP, 0, VM_PROT_NONE, VMCMD_STACK);
    115        1.1      manu 	}
    116        1.1      manu 	KASSERT(access_size > 0);
    117       1.16       mrg 	NEW_VMCMD2(&epp->ep_vmcmds, vmcmd_map_zero, access_size,
    118       1.16       mrg 	    access_linear_min, NULLVP, 0, VM_PROT_READ | VM_PROT_WRITE,
    119       1.16       mrg 	    VMCMD_STACK);
    120        1.1      manu 
    121        1.1      manu 	return 0;
    122        1.1      manu }
    123        1.1      manu 
    124        1.1      manu int
    125       1.15    cegger ELFNAME2(linux,copyargs)(struct lwp *l, struct exec_package *pack,
    126       1.15    cegger 	struct ps_strings *arginfo, char **stackp, void *argp)
    127        1.1      manu {
    128        1.1      manu 	struct linux_extra_stack_data64 *esdp, esd;
    129        1.1      manu 	struct elf_args *ap;
    130        1.5  christos 	struct vattr *vap;
    131        1.1      manu 	Elf_Ehdr *eh;
    132        1.1      manu 	Elf_Phdr *ph;
    133        1.1      manu 	u_long phsize;
    134        1.1      manu 	Elf_Addr phdr = 0;
    135        1.1      manu 	int error;
    136        1.1      manu 	int i;
    137        1.1      manu 
    138        1.5  christos 	if ((error = copyargs(l, pack, arginfo, stackp, argp)) != 0)
    139        1.1      manu 		return error;
    140        1.1      manu 
    141        1.1      manu 	/*
    142        1.1      manu 	 * Push extra arguments on the stack needed by dynamically
    143        1.1      manu 	 * linked binaries and static binaries as well.
    144        1.1      manu 	 */
    145        1.1      manu 	memset(&esd, 0, sizeof(esd));
    146        1.1      manu 	esdp = (struct linux_extra_stack_data64 *)(*stackp);
    147        1.1      manu 	ap = (struct elf_args *)pack->ep_emul_arg;
    148        1.1      manu 	vap = pack->ep_vap;
    149        1.1      manu 	eh = (Elf_Ehdr *)pack->ep_hdr;
    150        1.1      manu 
    151        1.1      manu 	/*
    152       1.17     njoly 	 * We forgot this, so we need to reload it now. XXX keep track of it?
    153        1.1      manu 	 */
    154        1.1      manu 	if (ap == NULL) {
    155        1.1      manu 		phsize = eh->e_phnum * sizeof(Elf_Phdr);
    156       1.19      matt 		ph = (Elf_Phdr *)kmem_alloc(phsize, KM_SLEEP);
    157       1.23        ad 		error = exec_read(l, pack->ep_vp, eh->e_phoff, ph, phsize, 0);
    158        1.1      manu 		if (error != 0) {
    159        1.1      manu 			for (i = 0; i < eh->e_phnum; i++) {
    160        1.1      manu 				if (ph[i].p_type == PT_PHDR) {
    161        1.1      manu 					phdr = ph[i].p_vaddr;
    162        1.1      manu 					break;
    163        1.1      manu 				}
    164        1.1      manu 			}
    165        1.1      manu 		}
    166       1.19      matt 		kmem_free(ph, phsize);
    167        1.1      manu 	}
    168        1.1      manu 
    169        1.1      manu 
    170        1.1      manu 	/*
    171        1.1      manu 	 * The exec_package doesn't have a proc pointer and it's not
    172        1.1      manu 	 * exactly trivial to add one since the credentials are
    173        1.1      manu 	 * changing. XXX Linux uses curlwp's credentials.
    174        1.1      manu 	 * Why can't we use them too?
    175        1.1      manu 	 */
    176        1.1      manu 
    177        1.1      manu 	i = 0;
    178        1.1      manu 	esd.ai[i].a_type = LINUX_AT_HWCAP;
    179        1.1      manu 	esd.ai[i++].a_v = rcr4();
    180        1.1      manu 
    181        1.1      manu 	esd.ai[i].a_type = AT_PAGESZ;
    182        1.1      manu 	esd.ai[i++].a_v = PAGE_SIZE;
    183        1.1      manu 
    184        1.1      manu 	esd.ai[i].a_type = LINUX_AT_CLKTCK;
    185        1.1      manu 	esd.ai[i++].a_v = hz;
    186        1.1      manu 
    187        1.1      manu 	esd.ai[i].a_type = AT_PHDR;
    188        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_phaddr: phdr);
    189        1.1      manu 
    190        1.1      manu 	esd.ai[i].a_type = AT_PHENT;
    191        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_phentsize : eh->e_phentsize);
    192        1.1      manu 
    193        1.1      manu 	esd.ai[i].a_type = AT_PHNUM;
    194        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_phnum : eh->e_phnum);
    195        1.1      manu 
    196        1.1      manu 	esd.ai[i].a_type = AT_BASE;
    197        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_interp : 0);
    198        1.1      manu 
    199        1.1      manu 	esd.ai[i].a_type = AT_FLAGS;
    200        1.1      manu 	esd.ai[i++].a_v = 0;
    201        1.1      manu 
    202        1.1      manu 	esd.ai[i].a_type = AT_ENTRY;
    203        1.1      manu 	esd.ai[i++].a_v = (ap ? ap->arg_entry : eh->e_entry);
    204        1.1      manu 
    205        1.1      manu 	esd.ai[i].a_type = LINUX_AT_EGID;
    206        1.8        ad 	esd.ai[i++].a_v = ((vap->va_mode & S_ISGID) ?
    207        1.8        ad 	    vap->va_gid : kauth_cred_getegid(l->l_cred));
    208        1.1      manu 
    209        1.1      manu 	esd.ai[i].a_type = LINUX_AT_GID;
    210        1.8        ad 	esd.ai[i++].a_v = kauth_cred_getgid(l->l_cred);
    211        1.1      manu 
    212        1.1      manu 	esd.ai[i].a_type = LINUX_AT_EUID;
    213  1.24.26.1  perseant 	esd.ai[i++].a_v = ((vap->va_mode & S_ISUID) ?
    214        1.8        ad 	    vap->va_uid : kauth_cred_geteuid(l->l_cred));
    215        1.1      manu 
    216        1.1      manu 	esd.ai[i].a_type = LINUX_AT_UID;
    217        1.8        ad 	esd.ai[i++].a_v = kauth_cred_getuid(l->l_cred);
    218        1.1      manu 
    219        1.1      manu 	esd.ai[i].a_type = LINUX_AT_SECURE;
    220        1.1      manu 	esd.ai[i++].a_v = 0;
    221        1.1      manu 
    222        1.1      manu 	esd.ai[i].a_type = LINUX_AT_PLATFORM;
    223        1.1      manu 	esd.ai[i++].a_v = (Elf_Addr)&esdp->hw_platform[0];
    224        1.1      manu 
    225       1.20       chs 	esd.ai[i].a_type = LINUX_AT_RANDOM;
    226       1.20       chs 	esd.ai[i++].a_v = (Elf_Addr)&esdp->randbytes[0];
    227       1.22     njoly 	esd.randbytes[0] = cprng_strong32();
    228       1.22     njoly 	esd.randbytes[1] = cprng_strong32();
    229       1.22     njoly 	esd.randbytes[2] = cprng_strong32();
    230       1.22     njoly 	esd.randbytes[3] = cprng_strong32();
    231       1.20       chs 
    232        1.1      manu 	esd.ai[i].a_type = AT_NULL;
    233        1.1      manu 	esd.ai[i++].a_v = 0;
    234        1.1      manu 
    235       1.21      maxv 	KASSERT(i == LINUX_ELF_AUX_ENTRIES);
    236       1.21      maxv 
    237  1.24.26.1  perseant 	strcpy(esd.hw_platform, LINUX_PLATFORM);
    238        1.1      manu 
    239       1.19      matt 	exec_free_emul_arg(pack);
    240       1.19      matt 
    241        1.1      manu 	/*
    242        1.1      manu 	 * Copy out the ELF auxiliary table and hw platform name
    243        1.1      manu 	 */
    244        1.1      manu 	if ((error = copyout(&esd, esdp, sizeof(esd))) != 0)
    245        1.1      manu 		return error;
    246        1.1      manu 	*stackp += sizeof(esd);
    247        1.1      manu 
    248        1.1      manu 	return 0;
    249        1.1      manu }
    250