Home | History | Annotate | Line # | Download | only in rumpkern
emul.c revision 1.195
      1  1.195   thorpej /*	$NetBSD: emul.c,v 1.195 2020/01/02 15:42:27 thorpej Exp $	*/
      2    1.1     pooka 
      3    1.1     pooka /*
      4  1.150     pooka  * Copyright (c) 2007-2011 Antti Kantee.  All Rights Reserved.
      5    1.1     pooka  *
      6    1.1     pooka  * Redistribution and use in source and binary forms, with or without
      7    1.1     pooka  * modification, are permitted provided that the following conditions
      8    1.1     pooka  * are met:
      9    1.1     pooka  * 1. Redistributions of source code must retain the above copyright
     10    1.1     pooka  *    notice, this list of conditions and the following disclaimer.
     11    1.1     pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12    1.1     pooka  *    notice, this list of conditions and the following disclaimer in the
     13    1.1     pooka  *    documentation and/or other materials provided with the distribution.
     14    1.1     pooka  *
     15    1.1     pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16    1.1     pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17    1.1     pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18    1.1     pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19    1.1     pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20    1.1     pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21    1.1     pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22    1.1     pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23    1.1     pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24    1.1     pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25    1.1     pooka  * SUCH DAMAGE.
     26    1.1     pooka  */
     27    1.1     pooka 
     28   1.61     pooka #include <sys/cdefs.h>
     29  1.195   thorpej __KERNEL_RCSID(0, "$NetBSD: emul.c,v 1.195 2020/01/02 15:42:27 thorpej Exp $");
     30    1.9     pooka 
     31    1.1     pooka #include <sys/param.h>
     32  1.176     pooka #include <sys/cprng.h>
     33  1.176     pooka #include <sys/filedesc.h>
     34  1.181   hannken #include <sys/fstrans.h>
     35    1.1     pooka #include <sys/kauth.h>
     36   1.66     pooka #include <sys/module.h>
     37   1.67     pooka #include <sys/reboot.h>
     38  1.154     pooka #include <sys/syscall.h>
     39  1.185     ozaki #include <sys/pserialize.h>
     40  1.178     ozaki #ifdef LOCKDEBUG
     41  1.178     ozaki #include <sys/sleepq.h>
     42  1.178     ozaki #endif
     43   1.67     pooka 
     44   1.67     pooka #include <dev/cons.h>
     45    1.1     pooka 
     46  1.179     pooka #include <rump-sys/kern.h>
     47  1.179     pooka 
     48   1.44     pooka #include <rump/rumpuser.h>
     49   1.44     pooka 
     50  1.165     pooka void (*rump_vfs_fini)(void) = (void *)nullop;
     51  1.165     pooka 
     52  1.149     pooka /*
     53  1.149     pooka  * physmem is largely unused (except for nmbcluster calculations),
     54  1.149     pooka  * so pick a default value which suits ZFS.  if an application wants
     55  1.149     pooka  * a very small memory footprint, it can still adjust this before
     56  1.149     pooka  * calling rump_init()
     57  1.149     pooka  */
     58  1.149     pooka #define PHYSMEM 512*256
     59  1.180    cherry psize_t physmem = PHYSMEM;
     60  1.149     pooka int nkmempages = PHYSMEM/2; /* from le chapeau */
     61  1.149     pooka #undef PHYSMEM
     62  1.149     pooka 
     63    1.1     pooka struct vnode *rootvp;
     64  1.124     pooka dev_t rootdev = NODEV;
     65  1.149     pooka 
     66   1.19     pooka const int schedppq = 1;
     67   1.66     pooka int cold = 1;
     68  1.195   thorpej int shutting_down;
     69   1.95     pooka int boothowto = AB_SILENT;
     70   1.67     pooka struct tty *constty;
     71    1.1     pooka 
/*
 * Statically sized device switch tables.  Both the block and the
 * character table have room for 255 entries, and the sys_/max_ counters
 * advertise that same size.
 */

/* block devices */
const struct bdevsw *bdevsw0[255];
const struct bdevsw **bdevsw = bdevsw0;
const int sys_bdevsws = 255;
int max_bdevsws = 255;

/* character devices */
const struct cdevsw *cdevsw0[255];
const struct cdevsw **cdevsw = cdevsw0;
const int sys_cdevsws = 255;
int max_cdevsws = 255;
     81   1.64     pooka 
     82   1.76     pooka int mem_no = 2;
     83   1.76     pooka 
     84  1.151       chs device_t booted_device;
     85  1.151       chs device_t booted_wedge;
     86   1.92     pooka int booted_partition;
     87  1.183  christos const char *booted_method;
     88   1.92     pooka 
     89  1.120     pooka /* XXX: unused */
     90   1.76     pooka kmutex_t tty_lock;
     91  1.120     pooka krwlock_t exec_lock;
     92   1.64     pooka 
/* sparc doesn't sport a constant page size, so pretend we have 4k pages */
#ifdef __sparc__
int pgshift = 12;
int nbpg = 1 << 12;		/* 4096 */
int pgofset = (1 << 12) - 1;	/* 4095 */
#endif
     99  1.109     pooka 
/*
 * On sun3 VM_MAX_ADDRESS is a const variable, so provide kernbase here.
 * XXX: should this be moved into rump.c and initialized for both sun3
 * and sun3x?
 */
#ifdef sun3
const vaddr_t kernbase = KERNBASE3;
#endif
    105  1.140     pooka 
    106  1.117     pooka struct loadavg averunnable = {
    107  1.117     pooka 	{ 0 * FSCALE,
    108  1.117     pooka 	  1 * FSCALE,
    109  1.117     pooka 	  11 * FSCALE, },
    110  1.117     pooka 	FSCALE,
    111  1.117     pooka };
    112  1.117     pooka 
    113  1.174  pgoyette /*
    114  1.174  pgoyette  * Include the autogenerated list of auto-loadable syscalls
    115  1.174  pgoyette  */
    116  1.174  pgoyette #include <kern/syscalls_autoload.c>
    117  1.174  pgoyette 
    118  1.126     pooka struct emul emul_netbsd = {
    119  1.126     pooka 	.e_name = "netbsd-rump",
    120  1.126     pooka 	.e_sysent = rump_sysent,
    121  1.186  pgoyette 	.e_nomodbits = rump_sysent_nomodbits,
    122  1.154     pooka #ifndef __HAVE_MINIMAL_EMUL
    123  1.154     pooka 	.e_nsysent = SYS_NSYSENT,
    124  1.154     pooka #endif
    125  1.128     pooka 	.e_vm_default_addr = uvm_default_mapaddr,
    126  1.138     pooka #ifdef __HAVE_SYSCALL_INTERN
    127  1.138     pooka 	.e_syscall_intern = syscall_intern,
    128  1.138     pooka #endif
    129  1.174  pgoyette 	.e_sc_autoload = netbsd_syscalls_autoload,
    130  1.126     pooka };
    131  1.126     pooka 
    132  1.161     pooka cprng_strong_t *kern_cprng;
    133  1.161     pooka 
    134  1.164     pooka /* not used, but need the symbols for pointer comparisons */
    135  1.164     pooka syncobj_t mutex_syncobj, rw_syncobj;
    136  1.164     pooka 
    137   1.20     pooka int
    138   1.20     pooka kpause(const char *wmesg, bool intr, int timeo, kmutex_t *mtx)
    139   1.20     pooka {
    140   1.20     pooka 	extern int hz;
    141  1.166    justin 	int rv __diagused;
    142   1.78     pooka 	uint64_t sec, nsec;
    143  1.127     pooka 
    144   1.20     pooka 	if (mtx)
    145   1.20     pooka 		mutex_exit(mtx);
    146   1.40     pooka 
    147   1.78     pooka 	sec = timeo / hz;
    148   1.78     pooka 	nsec = (timeo % hz) * (1000000000 / hz);
    149  1.158     pooka 	rv = rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, sec, nsec);
    150  1.156     pooka 	KASSERT(rv == 0);
    151  1.156     pooka 
    152   1.20     pooka 	if (mtx)
    153   1.20     pooka 		mutex_enter(mtx);
    154   1.20     pooka 
    155   1.20     pooka 	return 0;
    156   1.20     pooka }
    157   1.27     pooka 
    158   1.34      yamt vaddr_t
    159  1.155      para calc_cache_size(vsize_t vasz, int pct, int va_pct)
    160   1.34      yamt {
    161   1.34      yamt 	paddr_t t;
    162   1.34      yamt 
    163   1.34      yamt 	t = (paddr_t)physmem * pct / 100 * PAGE_SIZE;
    164   1.34      yamt 	if ((vaddr_t)t != t) {
    165   1.34      yamt 		panic("%s: needs tweak", __func__);
    166   1.34      yamt 	}
    167   1.34      yamt 	return t;
    168   1.34      yamt }
    169   1.35    martin 
/* Parenthesized so the cast binds as a unit wherever the macro is used. */
#define	RETURN_ADDRESS	((uintptr_t)__builtin_return_address(0))

/*
 * Panic, reporting the caller's return address, if called from inside a
 * pserialize read section.  Any other context is treated as sleepable.
 */
void
assert_sleepable(void)
{
	const char *reason = NULL;

	/* always sleepable, although we should improve this */

	if (!pserialize_not_in_read_section()) {
		reason = "pserialize";
	}

	if (reason) {
		panic("%s: %s caller=%p", __func__, reason,
		    (void *)RETURN_ADDRESS);
	}
}
    188   1.43     pooka 
/*
 * Machine-dependent module initialization: intentionally a no-op.
 */
void
module_init_md(void)
{

	/*
	 * Nothing to do for now.  Eventually the librump symbol table
	 * should be loaded here.
	 */
}
    198   1.67     pooka 
    199  1.167     pooka /*
    200  1.167     pooka  * Try to emulate all the MD definitions of DELAY() / delay().
    201  1.167     pooka  * Would be nice to fix the #defines in MD headers, but this quicker.
    202  1.168     pooka  *
    203  1.168     pooka  * XXX: we'd need a rumpuser_clock_sleep_nowrap() here.  Since we
    204  1.168     pooka  * don't have it in the current hypercall revision, busyloop.
    205  1.168     pooka  * Note that rather than calibrate a loop delay and work with that,
    206  1.168     pooka  * get call gettime (which does not block) in a loop to make sure
    207  1.168     pooka  * we didn't get virtual ghosttime.  That might be slightly inaccurate
    208  1.168     pooka  * for very small delays ...
    209  1.168     pooka  *
    210  1.168     pooka  * The other option would be to run a thread in the hypervisor which
    211  1.168     pooka  * sleeps for us and we can wait for it using rumpuser_cv_wait_nowrap()
    212  1.168     pooka  * Probably too fussy.  Better just wait for hypercall rev 18 ;)
    213  1.167     pooka  */
    214   1.69     pooka static void
    215   1.69     pooka rump_delay(unsigned int us)
    216   1.67     pooka {
    217  1.168     pooka 	struct timespec target, tmp;
    218  1.168     pooka 	uint64_t sec, sec_ini, sec_now;
    219  1.168     pooka 	long nsec, nsec_ini, nsec_now;
    220  1.168     pooka 	int loops;
    221  1.168     pooka 
    222  1.168     pooka 	rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO, &sec_ini, &nsec_ini);
    223   1.67     pooka 
    224  1.167     pooka #ifdef __mac68k__
    225  1.167     pooka 	sec = us / 1000;
    226  1.167     pooka 	nsec = (us % 1000) * 1000000;
    227  1.167     pooka #else
    228   1.78     pooka 	sec = us / 1000000;
    229   1.78     pooka 	nsec = (us % 1000000) * 1000;
    230  1.167     pooka #endif
    231   1.67     pooka 
    232  1.168     pooka 	target.tv_sec = sec_ini;
    233  1.168     pooka 	tmp.tv_sec = sec;
    234  1.168     pooka 	target.tv_nsec = nsec_ini;
    235  1.168     pooka 	tmp.tv_nsec = nsec;
    236  1.168     pooka 	timespecadd(&target, &tmp, &target);
    237  1.168     pooka 
    238   1.78     pooka 	if (__predict_false(sec != 0))
    239   1.67     pooka 		printf("WARNING: over 1s delay\n");
    240   1.67     pooka 
    241  1.168     pooka 	for (loops = 0; loops < 1000*1000*100; loops++) {
    242  1.168     pooka 		struct timespec cur;
    243  1.168     pooka 
    244  1.168     pooka 		rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO,
    245  1.168     pooka 		    &sec_now, &nsec_now);
    246  1.168     pooka 		cur.tv_sec = sec_now;
    247  1.168     pooka 		cur.tv_nsec = nsec_now;
    248  1.168     pooka 		if (timespeccmp(&cur, &target, >=)) {
    249  1.168     pooka 			return;
    250  1.168     pooka 		}
    251  1.168     pooka 	}
    252  1.168     pooka 	printf("WARNING: DELAY ESCAPED\n");
    253   1.67     pooka }
    254   1.69     pooka void (*delay_func)(unsigned int) = rump_delay;
    255  1.167     pooka __strong_alias(delay,rump_delay);
    256  1.167     pooka __strong_alias(_delay,rump_delay);
    257   1.67     pooka 
    258  1.191       kre /* Weak alias for getcwd_common to be used unless librumpvfs is present. */
    259  1.191       kre 
    260  1.191       kre int rump_getcwd_common(struct vnode *, struct vnode *, char **, char *,
    261  1.191       kre     int, int, struct lwp *);
    262  1.191       kre int
    263  1.191       kre rump_getcwd_common(struct vnode *lvp, struct vnode *rvp, char **bpp, char *bufp,
    264  1.191       kre     int limit, int flags, struct lwp *l)
    265  1.191       kre {
    266  1.191       kre 
    267  1.191       kre 	return ENOENT;
    268  1.191       kre }
    269  1.191       kre __weak_alias(getcwd_common,rump_getcwd_common);
    270  1.191       kre 
    271  1.192       bad /* Weak alias for vnode_to_path to be used unless librumpvfs is present. */
    272  1.192       bad 
    273  1.192       bad int rump_vnode_to_path(char *, size_t, struct vnode *, struct lwp *,
    274  1.192       bad     struct proc *);
    275  1.192       bad int
    276  1.192       bad rump_vnode_to_path(char *path, size_t len, struct vnode *vp, struct lwp *curl,
    277  1.192       bad     struct proc *p)
    278  1.192       bad {
    279  1.192       bad 
    280  1.192       bad 	return ENOENT; /* pretend getcwd_common() failed. */
    281  1.192       bad }
    282  1.192       bad __weak_alias(vnode_to_path,rump_vnode_to_path);
    283  1.192       bad 
    284  1.192       bad 
    285  1.181   hannken /* Weak aliases for fstrans to be used unless librumpvfs is present. */
    286  1.181   hannken 
    287  1.182   hannken void rump_fstrans_start(struct mount *);
    288  1.182   hannken void
    289  1.182   hannken rump_fstrans_start(struct mount *mp)
    290  1.182   hannken {
    291  1.182   hannken 
    292  1.182   hannken }
    293  1.182   hannken __weak_alias(fstrans_start,rump_fstrans_start);
    294  1.182   hannken 
    295  1.182   hannken int rump_fstrans_start_nowait(struct mount *);
    296  1.181   hannken int
    297  1.182   hannken rump_fstrans_start_nowait(struct mount *mp)
    298  1.181   hannken {
    299  1.181   hannken 
    300  1.181   hannken 	return 0;
    301  1.181   hannken }
    302  1.182   hannken __weak_alias(fstrans_start_nowait,rump_fstrans_start_nowait);
    303  1.181   hannken 
    304  1.187   hannken void rump_fstrans_start_lazy(struct mount *);
    305  1.187   hannken void
    306  1.187   hannken rump_fstrans_start_lazy(struct mount *mp)
    307  1.187   hannken {
    308  1.187   hannken 
    309  1.187   hannken }
    310  1.187   hannken __weak_alias(fstrans_start_lazy,rump_fstrans_start_lazy);
    311  1.187   hannken 
    312  1.187   hannken 
    313  1.181   hannken void rump_fstrans_done(struct mount *);
    314  1.181   hannken void
    315  1.181   hannken rump_fstrans_done(struct mount *mp)
    316  1.181   hannken {
    317  1.181   hannken 
    318  1.181   hannken }
    319  1.181   hannken __weak_alias(fstrans_done,rump_fstrans_done);
    320  1.181   hannken 
    321  1.190   hannken 
    322  1.190   hannken void rump_fstrans_lwp_dtor(struct lwp *);
    323  1.190   hannken void
    324  1.190   hannken rump_fstrans_lwp_dtor(struct lwp *l)
    325  1.190   hannken {
    326  1.190   hannken 
    327  1.190   hannken }
    328  1.190   hannken __weak_alias(fstrans_lwp_dtor,rump_fstrans_lwp_dtor);
    329  1.190   hannken 
    330  1.142     pooka /*
    331  1.142     pooka  * Provide weak aliases for tty routines used by printf.
    332  1.142     pooka  * They will be used unless the rumpkern_tty component is present.
    333  1.142     pooka  */
    334  1.142     pooka 
    335  1.142     pooka int rump_ttycheckoutq(struct tty *, int);
    336  1.105     pooka int
    337  1.142     pooka rump_ttycheckoutq(struct tty *tp, int wait)
    338   1.67     pooka {
    339   1.67     pooka 
    340   1.67     pooka 	return 1;
    341   1.67     pooka }
    342  1.142     pooka __weak_alias(ttycheckoutq,rump_ttycheckoutq);
    343   1.67     pooka 
    344  1.142     pooka int rump_tputchar(int, int, struct tty *);
    345  1.142     pooka int
    346  1.142     pooka rump_tputchar(int c, int flags, struct tty *tp)
    347  1.142     pooka {
    348  1.142     pooka 
    349  1.142     pooka 	cnputc(c);
    350  1.142     pooka 	return 0;
    351  1.142     pooka }
    352  1.142     pooka __weak_alias(tputchar,rump_tputchar);
    353  1.142     pooka 
/* Console output: hand the character to the rumpuser_putchar() hypercall. */
void
cnputc(int c)
{

	rumpuser_putchar(c);
}
    360   1.67     pooka 
/* Console flush: there is nothing to do here. */
void
cnflush(void)
{

	/* done */
}
    367   1.67     pooka 
/* Intentionally empty. */
void
resettodr(void)
{

	/* setting clocks is not in the jurisdiction of rump kernels */
}
    374  1.163     pooka 
#ifdef __HAVE_SYSCALL_INTERN
/* Per-process syscall setup hook: just clears p->p_emuldata. */
void
syscall_intern(struct proc *p)
{

	p->p_emuldata = NULL;
}
#endif
    383  1.144     pooka 
#ifdef LOCKDEBUG
/* LOCKDEBUG-only stub: ignores obj and pr and prints nothing. */
void
turnstile_print(volatile void *obj, void (*pr)(const char *, ...))
{

	/* nada */
}
#endif
    392  1.165     pooka 
    393  1.165     pooka void
    394  1.165     pooka cpu_reboot(int howto, char *bootstr)
    395  1.165     pooka {
    396  1.165     pooka 	int ruhow = 0;
    397  1.165     pooka 	void *finiarg;
    398  1.165     pooka 
    399  1.165     pooka 	printf("rump kernel halting...\n");
    400  1.165     pooka 
    401  1.165     pooka 	if (!RUMP_LOCALPROC_P(curproc))
    402  1.170     pooka 		finiarg = RUMP_SPVM2CTL(curproc->p_vmspace);
    403  1.165     pooka 	else
    404  1.165     pooka 		finiarg = NULL;
    405  1.165     pooka 
    406  1.165     pooka 	/* dump means we really take the dive here */
    407  1.165     pooka 	if ((howto & RB_DUMP) || panicstr) {
    408  1.165     pooka 		ruhow = RUMPUSER_PANIC;
    409  1.165     pooka 		goto out;
    410  1.165     pooka 	}
    411  1.165     pooka 
    412  1.165     pooka 	/* try to sync */
    413  1.165     pooka 	if (!((howto & RB_NOSYNC) || panicstr)) {
    414  1.165     pooka 		rump_vfs_fini();
    415  1.165     pooka 	}
    416  1.165     pooka 
    417  1.165     pooka 	doshutdownhooks();
    418  1.165     pooka 
    419  1.165     pooka 	/* your wish is my command */
    420  1.165     pooka 	if (howto & RB_HALT) {
    421  1.172     pooka 		printf("rump kernel halted (with RB_HALT, not exiting)\n");
    422  1.169     pooka 		rump_sysproxy_fini(finiarg);
    423  1.165     pooka 		for (;;) {
    424  1.165     pooka 			rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, 10, 0);
    425  1.165     pooka 		}
    426  1.165     pooka 	}
    427  1.165     pooka 
    428  1.165     pooka 	/* this function is __dead, we must exit */
    429  1.165     pooka  out:
    430  1.169     pooka 	rump_sysproxy_fini(finiarg);
    431  1.165     pooka 	rumpuser_exit(ruhow);
    432  1.165     pooka }
    433