Home | History | Annotate | Line # | Download | only in rumpkern
emul.c revision 1.191.2.1
      1  1.191.2.1    martin /*	$NetBSD: emul.c,v 1.191.2.1 2023/10/18 12:11:53 martin Exp $	*/
      2        1.1     pooka 
      3        1.1     pooka /*
      4      1.150     pooka  * Copyright (c) 2007-2011 Antti Kantee.  All Rights Reserved.
      5        1.1     pooka  *
      6        1.1     pooka  * Redistribution and use in source and binary forms, with or without
      7        1.1     pooka  * modification, are permitted provided that the following conditions
      8        1.1     pooka  * are met:
      9        1.1     pooka  * 1. Redistributions of source code must retain the above copyright
     10        1.1     pooka  *    notice, this list of conditions and the following disclaimer.
     11        1.1     pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12        1.1     pooka  *    notice, this list of conditions and the following disclaimer in the
     13        1.1     pooka  *    documentation and/or other materials provided with the distribution.
     14        1.1     pooka  *
     15        1.1     pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16        1.1     pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17        1.1     pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18        1.1     pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19        1.1     pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20        1.1     pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21        1.1     pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22        1.1     pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23        1.1     pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24        1.1     pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25        1.1     pooka  * SUCH DAMAGE.
     26        1.1     pooka  */
     27        1.1     pooka 
     28       1.61     pooka #include <sys/cdefs.h>
     29  1.191.2.1    martin __KERNEL_RCSID(0, "$NetBSD: emul.c,v 1.191.2.1 2023/10/18 12:11:53 martin Exp $");
     30        1.9     pooka 
     31        1.1     pooka #include <sys/param.h>
     32      1.176     pooka #include <sys/cprng.h>
     33      1.176     pooka #include <sys/filedesc.h>
     34      1.181   hannken #include <sys/fstrans.h>
     35        1.1     pooka #include <sys/kauth.h>
     36       1.66     pooka #include <sys/module.h>
     37       1.67     pooka #include <sys/reboot.h>
     38      1.154     pooka #include <sys/syscall.h>
     39      1.185     ozaki #include <sys/pserialize.h>
     40      1.178     ozaki #ifdef LOCKDEBUG
     41      1.178     ozaki #include <sys/sleepq.h>
     42      1.178     ozaki #endif
     43       1.67     pooka 
     44       1.67     pooka #include <dev/cons.h>
     45        1.1     pooka 
     46      1.179     pooka #include <rump-sys/kern.h>
     47      1.179     pooka 
     48       1.44     pooka #include <rump/rumpuser.h>
     49       1.44     pooka 
     50      1.165     pooka void (*rump_vfs_fini)(void) = (void *)nullop;
     51      1.165     pooka 
     52      1.149     pooka /*
     53      1.149     pooka  * physmem is largely unused (except for nmbcluster calculations),
     54      1.149     pooka  * so pick a default value which suits ZFS.  if an application wants
     55      1.149     pooka  * a very small memory footprint, it can still adjust this before
     56      1.149     pooka  * calling rump_init()
     57      1.149     pooka  */
     58      1.149     pooka #define PHYSMEM 512*256
     59      1.180    cherry psize_t physmem = PHYSMEM;
     60      1.149     pooka int nkmempages = PHYSMEM/2; /* from le chapeau */
     61      1.149     pooka #undef PHYSMEM
     62      1.149     pooka 
     63        1.1     pooka struct vnode *rootvp;
     64      1.124     pooka dev_t rootdev = NODEV;
     65      1.149     pooka 
     66       1.19     pooka const int schedppq = 1;
     67       1.53     pooka bool mp_online = false;
     68      1.175     pooka struct timespec boottime;
     69       1.66     pooka int cold = 1;
     70       1.95     pooka int boothowto = AB_SILENT;
     71       1.67     pooka struct tty *constty;
     72        1.1     pooka 
/*
 * Device switch tables.  Both the block and the character table have
 * the same fixed number of slots; the size is named once and scoped
 * to this group of definitions.  Each table is kept together with its
 * own sys_* / max_* counters.
 */
#define RUMP_NDEVSW 255

/* block devices */
const struct bdevsw *bdevsw0[RUMP_NDEVSW];
const struct bdevsw **bdevsw = bdevsw0;
const int sys_bdevsws = RUMP_NDEVSW;
int max_bdevsws = RUMP_NDEVSW;

/* character devices */
const struct cdevsw *cdevsw0[RUMP_NDEVSW];
const struct cdevsw **cdevsw = cdevsw0;
const int sys_cdevsws = RUMP_NDEVSW;
int max_cdevsws = RUMP_NDEVSW;

#undef RUMP_NDEVSW
     82       1.64     pooka 
     83       1.76     pooka int mem_no = 2;
     84       1.76     pooka 
     85      1.151       chs device_t booted_device;
     86      1.151       chs device_t booted_wedge;
     87  1.191.2.1    martin daddr_t booted_startblk;
     88  1.191.2.1    martin uint64_t booted_nblks;
     89       1.92     pooka int booted_partition;
     90      1.183  christos const char *booted_method;
     91       1.92     pooka 
     92      1.120     pooka /* XXX: unused */
     93       1.76     pooka kmutex_t tty_lock;
     94      1.120     pooka krwlock_t exec_lock;
     95       1.64     pooka 
     96      1.139     pooka /* sparc doesn't sport constant page size, pretend we have 4k pages */
     97      1.109     pooka #ifdef __sparc__
     98      1.109     pooka int nbpg = 4096;
     99      1.139     pooka int pgofset = 4096-1;
    100      1.139     pooka int pgshift = 12;
    101      1.109     pooka #endif
    102      1.109     pooka 
    103      1.146   tsutsui /* on sun3 VM_MAX_ADDRESS is a const variable */
    104      1.146   tsutsui /* XXX: should be moved into rump.c and initialize for sun3 and sun3x? */
    105      1.141     pooka #ifdef sun3
    106      1.146   tsutsui const vaddr_t kernbase = KERNBASE3;
    107      1.140     pooka #endif
    108      1.140     pooka 
    109      1.117     pooka struct loadavg averunnable = {
    110      1.117     pooka 	{ 0 * FSCALE,
    111      1.117     pooka 	  1 * FSCALE,
    112      1.117     pooka 	  11 * FSCALE, },
    113      1.117     pooka 	FSCALE,
    114      1.117     pooka };
    115      1.117     pooka 
    116      1.174  pgoyette /*
    117      1.174  pgoyette  * Include the autogenerated list of auto-loadable syscalls
    118      1.174  pgoyette  */
    119      1.174  pgoyette #include <kern/syscalls_autoload.c>
    120      1.174  pgoyette 
    121      1.126     pooka struct emul emul_netbsd = {
    122      1.126     pooka 	.e_name = "netbsd-rump",
    123      1.126     pooka 	.e_sysent = rump_sysent,
    124      1.186  pgoyette 	.e_nomodbits = rump_sysent_nomodbits,
    125      1.154     pooka #ifndef __HAVE_MINIMAL_EMUL
    126      1.154     pooka 	.e_nsysent = SYS_NSYSENT,
    127      1.154     pooka #endif
    128      1.128     pooka 	.e_vm_default_addr = uvm_default_mapaddr,
    129      1.138     pooka #ifdef __HAVE_SYSCALL_INTERN
    130      1.138     pooka 	.e_syscall_intern = syscall_intern,
    131      1.138     pooka #endif
    132      1.174  pgoyette 	.e_sc_autoload = netbsd_syscalls_autoload,
    133      1.126     pooka };
    134      1.126     pooka 
    135      1.161     pooka cprng_strong_t *kern_cprng;
    136      1.161     pooka 
    137      1.164     pooka /* not used, but need the symbols for pointer comparisons */
    138      1.164     pooka syncobj_t mutex_syncobj, rw_syncobj;
    139      1.164     pooka 
    140       1.20     pooka int
    141       1.20     pooka kpause(const char *wmesg, bool intr, int timeo, kmutex_t *mtx)
    142       1.20     pooka {
    143       1.20     pooka 	extern int hz;
    144      1.166    justin 	int rv __diagused;
    145       1.78     pooka 	uint64_t sec, nsec;
    146      1.127     pooka 
    147       1.20     pooka 	if (mtx)
    148       1.20     pooka 		mutex_exit(mtx);
    149       1.40     pooka 
    150       1.78     pooka 	sec = timeo / hz;
    151       1.78     pooka 	nsec = (timeo % hz) * (1000000000 / hz);
    152      1.158     pooka 	rv = rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, sec, nsec);
    153      1.156     pooka 	KASSERT(rv == 0);
    154      1.156     pooka 
    155       1.20     pooka 	if (mtx)
    156       1.20     pooka 		mutex_enter(mtx);
    157       1.20     pooka 
    158       1.20     pooka 	return 0;
    159       1.20     pooka }
    160       1.27     pooka 
    161       1.34      yamt vaddr_t
    162      1.155      para calc_cache_size(vsize_t vasz, int pct, int va_pct)
    163       1.34      yamt {
    164       1.34      yamt 	paddr_t t;
    165       1.34      yamt 
    166       1.34      yamt 	t = (paddr_t)physmem * pct / 100 * PAGE_SIZE;
    167       1.34      yamt 	if ((vaddr_t)t != t) {
    168       1.34      yamt 		panic("%s: needs tweak", __func__);
    169       1.34      yamt 	}
    170       1.34      yamt 	return t;
    171       1.34      yamt }
    172       1.35    martin 
/*
 * Return address of the current function as an integer.  The whole
 * expansion is parenthesized so that it behaves as a single operand.
 */
#define	RETURN_ADDRESS	((uintptr_t)__builtin_return_address(0))

/*
 * Panic if the caller is in a context in which it must not sleep.
 *
 * The only condition checked is being inside a pserialize read
 * section; everything else is considered sleepable.  The panic message
 * names the reason and the address of the caller.
 */
void
assert_sleepable(void)
{
	const char *reason = NULL;

	/* always sleepable, although we should improve this */

	if (!pserialize_not_in_read_section()) {
		reason = "pserialize";
	}

	if (reason != NULL) {
		panic("%s: %s caller=%p", __func__, reason,
		    (void *)RETURN_ADDRESS);
	}
}
    191       1.43     pooka 
/*
 * Machine-dependent module initialization hook.
 *
 * Intentionally empty for now, although the librump symbol table
 * should eventually be loaded from here.
 */
void
module_init_md(void)
{

	/* nothing yet */
}
    201       1.67     pooka 
    202      1.167     pooka /*
    203      1.167     pooka  * Try to emulate all the MD definitions of DELAY() / delay().
    204      1.167     pooka  * Would be nice to fix the #defines in MD headers, but this quicker.
    205      1.168     pooka  *
    206      1.168     pooka  * XXX: we'd need a rumpuser_clock_sleep_nowrap() here.  Since we
    207      1.168     pooka  * don't have it in the current hypercall revision, busyloop.
    208      1.168     pooka  * Note that rather than calibrate a loop delay and work with that,
    209      1.168     pooka  * get call gettime (which does not block) in a loop to make sure
    210      1.168     pooka  * we didn't get virtual ghosttime.  That might be slightly inaccurate
    211      1.168     pooka  * for very small delays ...
    212      1.168     pooka  *
    213      1.168     pooka  * The other option would be to run a thread in the hypervisor which
    214      1.168     pooka  * sleeps for us and we can wait for it using rumpuser_cv_wait_nowrap()
    215      1.168     pooka  * Probably too fussy.  Better just wait for hypercall rev 18 ;)
    216      1.167     pooka  */
    217       1.69     pooka static void
    218       1.69     pooka rump_delay(unsigned int us)
    219       1.67     pooka {
    220      1.168     pooka 	struct timespec target, tmp;
    221      1.168     pooka 	uint64_t sec, sec_ini, sec_now;
    222      1.168     pooka 	long nsec, nsec_ini, nsec_now;
    223      1.168     pooka 	int loops;
    224      1.168     pooka 
    225      1.168     pooka 	rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO, &sec_ini, &nsec_ini);
    226       1.67     pooka 
    227      1.167     pooka #ifdef __mac68k__
    228      1.167     pooka 	sec = us / 1000;
    229      1.167     pooka 	nsec = (us % 1000) * 1000000;
    230      1.167     pooka #else
    231       1.78     pooka 	sec = us / 1000000;
    232       1.78     pooka 	nsec = (us % 1000000) * 1000;
    233      1.167     pooka #endif
    234       1.67     pooka 
    235      1.168     pooka 	target.tv_sec = sec_ini;
    236      1.168     pooka 	tmp.tv_sec = sec;
    237      1.168     pooka 	target.tv_nsec = nsec_ini;
    238      1.168     pooka 	tmp.tv_nsec = nsec;
    239      1.168     pooka 	timespecadd(&target, &tmp, &target);
    240      1.168     pooka 
    241       1.78     pooka 	if (__predict_false(sec != 0))
    242       1.67     pooka 		printf("WARNING: over 1s delay\n");
    243       1.67     pooka 
    244      1.168     pooka 	for (loops = 0; loops < 1000*1000*100; loops++) {
    245      1.168     pooka 		struct timespec cur;
    246      1.168     pooka 
    247      1.168     pooka 		rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO,
    248      1.168     pooka 		    &sec_now, &nsec_now);
    249      1.168     pooka 		cur.tv_sec = sec_now;
    250      1.168     pooka 		cur.tv_nsec = nsec_now;
    251      1.168     pooka 		if (timespeccmp(&cur, &target, >=)) {
    252      1.168     pooka 			return;
    253      1.168     pooka 		}
    254      1.168     pooka 	}
    255      1.168     pooka 	printf("WARNING: DELAY ESCAPED\n");
    256       1.67     pooka }
    257       1.69     pooka void (*delay_func)(unsigned int) = rump_delay;
    258      1.167     pooka __strong_alias(delay,rump_delay);
    259      1.167     pooka __strong_alias(_delay,rump_delay);
    260       1.67     pooka 
    261      1.191       kre /* Weak alias for getcwd_common to be used unless librumpvfs is present. */
    262      1.191       kre 
    263      1.191       kre int rump_getcwd_common(struct vnode *, struct vnode *, char **, char *,
    264      1.191       kre     int, int, struct lwp *);
    265      1.191       kre int
    266      1.191       kre rump_getcwd_common(struct vnode *lvp, struct vnode *rvp, char **bpp, char *bufp,
    267      1.191       kre     int limit, int flags, struct lwp *l)
    268      1.191       kre {
    269      1.191       kre 
    270      1.191       kre 	return ENOENT;
    271      1.191       kre }
    272      1.191       kre __weak_alias(getcwd_common,rump_getcwd_common);
    273      1.191       kre 
    274      1.181   hannken /* Weak aliases for fstrans to be used unless librumpvfs is present. */
    275      1.181   hannken 
    276      1.182   hannken void rump_fstrans_start(struct mount *);
    277      1.182   hannken void
    278      1.182   hannken rump_fstrans_start(struct mount *mp)
    279      1.182   hannken {
    280      1.182   hannken 
    281      1.182   hannken }
    282      1.182   hannken __weak_alias(fstrans_start,rump_fstrans_start);
    283      1.182   hannken 
    284      1.182   hannken int rump_fstrans_start_nowait(struct mount *);
    285      1.181   hannken int
    286      1.182   hannken rump_fstrans_start_nowait(struct mount *mp)
    287      1.181   hannken {
    288      1.181   hannken 
    289      1.181   hannken 	return 0;
    290      1.181   hannken }
    291      1.182   hannken __weak_alias(fstrans_start_nowait,rump_fstrans_start_nowait);
    292      1.181   hannken 
    293      1.187   hannken void rump_fstrans_start_lazy(struct mount *);
    294      1.187   hannken void
    295      1.187   hannken rump_fstrans_start_lazy(struct mount *mp)
    296      1.187   hannken {
    297      1.187   hannken 
    298      1.187   hannken }
    299      1.187   hannken __weak_alias(fstrans_start_lazy,rump_fstrans_start_lazy);
    300      1.187   hannken 
    301      1.187   hannken 
    302      1.181   hannken void rump_fstrans_done(struct mount *);
    303      1.181   hannken void
    304      1.181   hannken rump_fstrans_done(struct mount *mp)
    305      1.181   hannken {
    306      1.181   hannken 
    307      1.181   hannken }
    308      1.181   hannken __weak_alias(fstrans_done,rump_fstrans_done);
    309      1.181   hannken 
    310      1.190   hannken 
    311      1.190   hannken void rump_fstrans_lwp_dtor(struct lwp *);
    312      1.190   hannken void
    313      1.190   hannken rump_fstrans_lwp_dtor(struct lwp *l)
    314      1.190   hannken {
    315      1.190   hannken 
    316      1.190   hannken }
    317      1.190   hannken __weak_alias(fstrans_lwp_dtor,rump_fstrans_lwp_dtor);
    318      1.190   hannken 
    319      1.142     pooka /*
    320      1.142     pooka  * Provide weak aliases for tty routines used by printf.
    321      1.142     pooka  * They will be used unless the rumpkern_tty component is present.
    322      1.142     pooka  */
    323      1.142     pooka 
    324      1.142     pooka int rump_ttycheckoutq(struct tty *, int);
    325      1.105     pooka int
    326      1.142     pooka rump_ttycheckoutq(struct tty *tp, int wait)
    327       1.67     pooka {
    328       1.67     pooka 
    329       1.67     pooka 	return 1;
    330       1.67     pooka }
    331      1.142     pooka __weak_alias(ttycheckoutq,rump_ttycheckoutq);
    332       1.67     pooka 
    333      1.142     pooka int rump_tputchar(int, int, struct tty *);
    334      1.142     pooka int
    335      1.142     pooka rump_tputchar(int c, int flags, struct tty *tp)
    336      1.142     pooka {
    337      1.142     pooka 
    338      1.142     pooka 	cnputc(c);
    339      1.142     pooka 	return 0;
    340      1.142     pooka }
    341      1.142     pooka __weak_alias(tputchar,rump_tputchar);
    342      1.142     pooka 
/* Console output: hand the character straight to the hypervisor. */
void
cnputc(int c)
{

	rumpuser_putchar(c);
}
    349       1.67     pooka 
/* Console flush: nothing is done here, so this is a no-op. */
void
cnflush(void)
{

	/* done */
}
    356       1.67     pooka 
/*
 * Time-of-day clock reset hook: deliberately a no-op, because setting
 * clocks is not in the jurisdiction of rump kernels.
 */
void
resettodr(void)
{

	/* intentionally empty */
}
    363      1.163     pooka 
#ifdef __HAVE_SYSCALL_INTERN
/*
 * Per-process syscall setup hook, only built on ports that define
 * __HAVE_SYSCALL_INTERN.  All it does is clear the process's
 * emulation-private data pointer.
 */
void
syscall_intern(struct proc *p)
{

	p->p_emuldata = NULL;
}
#endif
    372      1.144     pooka 
#ifdef LOCKDEBUG
/*
 * Turnstile dump hook, only built with LOCKDEBUG.  It prints nothing
 * and ignores both arguments.
 */
void
turnstile_print(volatile void *obj, void (*pr)(const char *, ...))
{

	/* nada */
}
#endif
    381      1.165     pooka 
    382      1.165     pooka void
    383      1.165     pooka cpu_reboot(int howto, char *bootstr)
    384      1.165     pooka {
    385      1.165     pooka 	int ruhow = 0;
    386      1.165     pooka 	void *finiarg;
    387      1.165     pooka 
    388      1.165     pooka 	printf("rump kernel halting...\n");
    389      1.165     pooka 
    390      1.165     pooka 	if (!RUMP_LOCALPROC_P(curproc))
    391      1.170     pooka 		finiarg = RUMP_SPVM2CTL(curproc->p_vmspace);
    392      1.165     pooka 	else
    393      1.165     pooka 		finiarg = NULL;
    394      1.165     pooka 
    395      1.165     pooka 	/* dump means we really take the dive here */
    396      1.165     pooka 	if ((howto & RB_DUMP) || panicstr) {
    397      1.165     pooka 		ruhow = RUMPUSER_PANIC;
    398      1.165     pooka 		goto out;
    399      1.165     pooka 	}
    400      1.165     pooka 
    401      1.165     pooka 	/* try to sync */
    402      1.165     pooka 	if (!((howto & RB_NOSYNC) || panicstr)) {
    403      1.165     pooka 		rump_vfs_fini();
    404      1.165     pooka 	}
    405      1.165     pooka 
    406      1.165     pooka 	doshutdownhooks();
    407      1.165     pooka 
    408      1.165     pooka 	/* your wish is my command */
    409      1.165     pooka 	if (howto & RB_HALT) {
    410      1.172     pooka 		printf("rump kernel halted (with RB_HALT, not exiting)\n");
    411      1.169     pooka 		rump_sysproxy_fini(finiarg);
    412      1.165     pooka 		for (;;) {
    413      1.165     pooka 			rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, 10, 0);
    414      1.165     pooka 		}
    415      1.165     pooka 	}
    416      1.165     pooka 
    417      1.165     pooka 	/* this function is __dead, we must exit */
    418      1.165     pooka  out:
    419      1.169     pooka 	rump_sysproxy_fini(finiarg);
    420      1.165     pooka 	rumpuser_exit(ruhow);
    421      1.165     pooka }
    422      1.173     pooka 
/* Return the fixed CPU model string of the rump kernel. */
const char *
cpu_getmodel(void)
{
	static const char model[] = "rumpcore (virtual)";

	return model;
}
    429