Home | History | Annotate | Line # | Download | only in rumpkern
emul.c revision 1.173
      1  1.173    pooka /*	$NetBSD: emul.c,v 1.173 2015/08/25 14:47:26 pooka Exp $	*/
      2    1.1    pooka 
      3    1.1    pooka /*
      4  1.150    pooka  * Copyright (c) 2007-2011 Antti Kantee.  All Rights Reserved.
      5    1.1    pooka  *
      6    1.1    pooka  * Redistribution and use in source and binary forms, with or without
      7    1.1    pooka  * modification, are permitted provided that the following conditions
      8    1.1    pooka  * are met:
      9    1.1    pooka  * 1. Redistributions of source code must retain the above copyright
     10    1.1    pooka  *    notice, this list of conditions and the following disclaimer.
     11    1.1    pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12    1.1    pooka  *    notice, this list of conditions and the following disclaimer in the
     13    1.1    pooka  *    documentation and/or other materials provided with the distribution.
     14    1.1    pooka  *
     15    1.1    pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16    1.1    pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17    1.1    pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18    1.1    pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19    1.1    pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20    1.1    pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21    1.1    pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22    1.1    pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23    1.1    pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24    1.1    pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25    1.1    pooka  * SUCH DAMAGE.
     26    1.1    pooka  */
     27    1.1    pooka 
     28   1.61    pooka #include <sys/cdefs.h>
     29  1.173    pooka __KERNEL_RCSID(0, "$NetBSD: emul.c,v 1.173 2015/08/25 14:47:26 pooka Exp $");
     30    1.9    pooka 
     31    1.1    pooka #include <sys/param.h>
     32    1.1    pooka #include <sys/null.h>
     33    1.1    pooka #include <sys/vnode.h>
     34    1.1    pooka #include <sys/stat.h>
     35   1.35   martin #include <sys/select.h>
     36    1.1    pooka #include <sys/syslog.h>
     37    1.1    pooka #include <sys/namei.h>
     38    1.1    pooka #include <sys/kauth.h>
     39    1.1    pooka #include <sys/conf.h>
     40    1.1    pooka #include <sys/device.h>
     41    1.1    pooka #include <sys/queue.h>
     42   1.20    pooka #include <sys/file.h>
     43  1.162    pooka #include <sys/filedesc.h>
     44   1.15       ad #include <sys/cpu.h>
     45   1.17    pooka #include <sys/kmem.h>
     46   1.20    pooka #include <sys/poll.h>
     47   1.66    pooka #include <sys/timetc.h>
     48   1.53    pooka #include <sys/tprintf.h>
     49   1.66    pooka #include <sys/module.h>
     50   1.67    pooka #include <sys/tty.h>
     51   1.67    pooka #include <sys/reboot.h>
     52  1.154    pooka #include <sys/syscall.h>
     53  1.109    pooka #include <sys/syscallvar.h>
     54  1.109    pooka #include <sys/xcall.h>
     55  1.148    pooka #include <sys/sleepq.h>
     56  1.161    pooka #include <sys/cprng.h>
     57   1.67    pooka 
     58   1.67    pooka #include <dev/cons.h>
     59    1.1    pooka 
     60   1.44    pooka #include <rump/rumpuser.h>
     61   1.44    pooka 
     62    1.8    pooka #include <uvm/uvm_map.h>
     63    1.8    pooka 
     64   1.10    pooka #include "rump_private.h"
     65    1.1    pooka 
     66  1.165    pooka void (*rump_vfs_fini)(void) = (void *)nullop;
     67  1.165    pooka 
/*
 * physmem is largely unused (except for nmbcluster calculations),
 * so pick a default value which suits ZFS.  If an application wants
 * a very small memory footprint, it can still adjust this before
 * calling rump_init().
 *
 * The macro body is parenthesized so that it always expands as one
 * value, regardless of the operators surrounding it at the use site.
 */
#define PHYSMEM (512 * 256)
int physmem = PHYSMEM;
int nkmempages = PHYSMEM / 2; /* from le chapeau */
#undef PHYSMEM
     78  1.149    pooka 
     79  1.162    pooka struct lwp lwp0 = {
     80  1.162    pooka 	.l_lid = 1,
     81  1.162    pooka 	.l_proc = &proc0,
     82  1.162    pooka 	.l_fd = &filedesc0,
     83  1.162    pooka };
     84    1.1    pooka struct vnode *rootvp;
     85  1.124    pooka dev_t rootdev = NODEV;
     86  1.149    pooka 
     87   1.19    pooka const int schedppq = 1;
     88   1.53    pooka bool mp_online = false;
     89   1.56    pooka struct timeval boottime;
     90   1.66    pooka int cold = 1;
     91   1.95    pooka int boothowto = AB_SILENT;
     92   1.67    pooka struct tty *constty;
     93    1.1    pooka 
/*
 * Block and character device switch tables.  Both backing arrays have
 * RUMP_DEVSW_SLOTS entries, and the "sys" and "max" counts of each
 * table are initialized to that same number.
 */
#define RUMP_DEVSW_SLOTS 255

const struct bdevsw *bdevsw0[RUMP_DEVSW_SLOTS];
const struct bdevsw **bdevsw = bdevsw0;
const int sys_bdevsws = RUMP_DEVSW_SLOTS;
int max_bdevsws = RUMP_DEVSW_SLOTS;

const struct cdevsw *cdevsw0[RUMP_DEVSW_SLOTS];
const struct cdevsw **cdevsw = cdevsw0;
const int sys_cdevsws = RUMP_DEVSW_SLOTS;
int max_cdevsws = RUMP_DEVSW_SLOTS;

#undef RUMP_DEVSW_SLOTS
    103   1.64    pooka 
    104   1.76    pooka int mem_no = 2;
    105   1.76    pooka 
    106  1.151      chs device_t booted_device;
    107  1.151      chs device_t booted_wedge;
    108   1.92    pooka int booted_partition;
    109   1.92    pooka 
    110  1.120    pooka /* XXX: unused */
    111   1.76    pooka kmutex_t tty_lock;
    112  1.120    pooka krwlock_t exec_lock;
    113   1.64    pooka 
    114  1.125    pooka struct lwplist alllwp = LIST_HEAD_INITIALIZER(alllwp);
    115  1.125    pooka 
/*
 * sparc doesn't sport a constant page size, so pretend we have 4k pages:
 * nbpg is 4096, pgofset is nbpg - 1 and pgshift is 12 (1 << 12 == 4096).
 */
#ifdef __sparc__
int pgshift = 12;
int nbpg = 1 << 12;
int pgofset = (1 << 12) - 1;
#endif
    122  1.109    pooka 
/*
 * On sun3 VM_MAX_ADDRESS is a const variable, so provide kernbase here.
 * XXX: should this be moved into rump.c and initialized for both sun3
 * and sun3x?
 */
#ifdef sun3
const vaddr_t kernbase = KERNBASE3;
#endif
    128  1.140    pooka 
    129  1.117    pooka struct loadavg averunnable = {
    130  1.117    pooka 	{ 0 * FSCALE,
    131  1.117    pooka 	  1 * FSCALE,
    132  1.117    pooka 	  11 * FSCALE, },
    133  1.117    pooka 	FSCALE,
    134  1.117    pooka };
    135  1.117    pooka 
    136  1.126    pooka struct emul emul_netbsd = {
    137  1.126    pooka 	.e_name = "netbsd-rump",
    138  1.126    pooka 	.e_sysent = rump_sysent,
    139  1.154    pooka #ifndef __HAVE_MINIMAL_EMUL
    140  1.154    pooka 	.e_nsysent = SYS_NSYSENT,
    141  1.154    pooka #endif
    142  1.128    pooka 	.e_vm_default_addr = uvm_default_mapaddr,
    143  1.138    pooka #ifdef __HAVE_SYSCALL_INTERN
    144  1.138    pooka 	.e_syscall_intern = syscall_intern,
    145  1.138    pooka #endif
    146  1.126    pooka };
    147  1.126    pooka 
    148  1.138    pooka u_int nprocs = 1;
    149   1.20    pooka 
    150  1.161    pooka cprng_strong_t *kern_cprng;
    151  1.161    pooka 
    152  1.164    pooka /* not used, but need the symbols for pointer comparisons */
    153  1.164    pooka syncobj_t mutex_syncobj, rw_syncobj;
    154  1.164    pooka 
    155   1.20    pooka int
    156   1.20    pooka kpause(const char *wmesg, bool intr, int timeo, kmutex_t *mtx)
    157   1.20    pooka {
    158   1.20    pooka 	extern int hz;
    159  1.166   justin 	int rv __diagused;
    160   1.78    pooka 	uint64_t sec, nsec;
    161  1.127    pooka 
    162   1.20    pooka 	if (mtx)
    163   1.20    pooka 		mutex_exit(mtx);
    164   1.40    pooka 
    165   1.78    pooka 	sec = timeo / hz;
    166   1.78    pooka 	nsec = (timeo % hz) * (1000000000 / hz);
    167  1.158    pooka 	rv = rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, sec, nsec);
    168  1.156    pooka 	KASSERT(rv == 0);
    169  1.156    pooka 
    170   1.20    pooka 	if (mtx)
    171   1.20    pooka 		mutex_enter(mtx);
    172   1.20    pooka 
    173   1.20    pooka 	return 0;
    174   1.20    pooka }
    175   1.27    pooka 
    176   1.27    pooka void
    177   1.32      bjs lwp_unsleep(lwp_t *l, bool cleanup)
    178   1.32      bjs {
    179   1.32      bjs 
    180   1.32      bjs 	KASSERT(mutex_owned(l->l_mutex));
    181   1.32      bjs 
    182  1.104    rmind 	(*l->l_syncobj->sobj_unsleep)(l, cleanup);
    183   1.32      bjs }
    184   1.34     yamt 
    185  1.145    pooka void
    186  1.145    pooka lwp_update_creds(struct lwp *l)
    187  1.145    pooka {
    188  1.145    pooka 	struct proc *p;
    189  1.145    pooka 	kauth_cred_t oldcred;
    190  1.145    pooka 
    191  1.145    pooka 	p = l->l_proc;
    192  1.145    pooka 	oldcred = l->l_cred;
    193  1.145    pooka 	l->l_prflag &= ~LPR_CRMOD;
    194  1.145    pooka 
    195  1.145    pooka 	mutex_enter(p->p_lock);
    196  1.145    pooka 	kauth_cred_hold(p->p_cred);
    197  1.145    pooka 	l->l_cred = p->p_cred;
    198  1.145    pooka 	mutex_exit(p->p_lock);
    199  1.145    pooka 
    200  1.145    pooka 	if (oldcred != NULL)
    201  1.145    pooka 		kauth_cred_free(oldcred);
    202  1.145    pooka }
    203  1.145    pooka 
    204   1.34     yamt vaddr_t
    205  1.155     para calc_cache_size(vsize_t vasz, int pct, int va_pct)
    206   1.34     yamt {
    207   1.34     yamt 	paddr_t t;
    208   1.34     yamt 
    209   1.34     yamt 	t = (paddr_t)physmem * pct / 100 * PAGE_SIZE;
    210   1.34     yamt 	if ((vaddr_t)t != t) {
    211   1.34     yamt 		panic("%s: needs tweak", __func__);
    212   1.34     yamt 	}
    213   1.34     yamt 	return t;
    214   1.34     yamt }
    215   1.35   martin 
/*
 * Sleepability check.  Every context is currently treated as
 * sleepable, so nothing is verified; this should be improved.
 */
void
assert_sleepable(void)
{
}
    222   1.43    pooka 
/*
 * Machine-dependent module initialization.  Nothing is done for now;
 * eventually the librump symbol table should be loaded here.
 */
void
module_init_md(void)
{
}
    232   1.67    pooka 
    233  1.167    pooka /*
    234  1.167    pooka  * Try to emulate all the MD definitions of DELAY() / delay().
    235  1.167    pooka  * Would be nice to fix the #defines in MD headers, but this quicker.
    236  1.168    pooka  *
    237  1.168    pooka  * XXX: we'd need a rumpuser_clock_sleep_nowrap() here.  Since we
    238  1.168    pooka  * don't have it in the current hypercall revision, busyloop.
    239  1.168    pooka  * Note that rather than calibrate a loop delay and work with that,
    240  1.168    pooka  * get call gettime (which does not block) in a loop to make sure
    241  1.168    pooka  * we didn't get virtual ghosttime.  That might be slightly inaccurate
    242  1.168    pooka  * for very small delays ...
    243  1.168    pooka  *
    244  1.168    pooka  * The other option would be to run a thread in the hypervisor which
    245  1.168    pooka  * sleeps for us and we can wait for it using rumpuser_cv_wait_nowrap()
    246  1.168    pooka  * Probably too fussy.  Better just wait for hypercall rev 18 ;)
    247  1.167    pooka  */
    248   1.69    pooka static void
    249   1.69    pooka rump_delay(unsigned int us)
    250   1.67    pooka {
    251  1.168    pooka 	struct timespec target, tmp;
    252  1.168    pooka 	uint64_t sec, sec_ini, sec_now;
    253  1.168    pooka 	long nsec, nsec_ini, nsec_now;
    254  1.168    pooka 	int loops;
    255  1.168    pooka 
    256  1.168    pooka 	rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO, &sec_ini, &nsec_ini);
    257   1.67    pooka 
    258  1.167    pooka #ifdef __mac68k__
    259  1.167    pooka 	sec = us / 1000;
    260  1.167    pooka 	nsec = (us % 1000) * 1000000;
    261  1.167    pooka #else
    262   1.78    pooka 	sec = us / 1000000;
    263   1.78    pooka 	nsec = (us % 1000000) * 1000;
    264  1.167    pooka #endif
    265   1.67    pooka 
    266  1.168    pooka 	target.tv_sec = sec_ini;
    267  1.168    pooka 	tmp.tv_sec = sec;
    268  1.168    pooka 	target.tv_nsec = nsec_ini;
    269  1.168    pooka 	tmp.tv_nsec = nsec;
    270  1.168    pooka 	timespecadd(&target, &tmp, &target);
    271  1.168    pooka 
    272   1.78    pooka 	if (__predict_false(sec != 0))
    273   1.67    pooka 		printf("WARNING: over 1s delay\n");
    274   1.67    pooka 
    275  1.168    pooka 	for (loops = 0; loops < 1000*1000*100; loops++) {
    276  1.168    pooka 		struct timespec cur;
    277  1.168    pooka 
    278  1.168    pooka 		rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO,
    279  1.168    pooka 		    &sec_now, &nsec_now);
    280  1.168    pooka 		cur.tv_sec = sec_now;
    281  1.168    pooka 		cur.tv_nsec = nsec_now;
    282  1.168    pooka 		if (timespeccmp(&cur, &target, >=)) {
    283  1.168    pooka 			return;
    284  1.168    pooka 		}
    285  1.168    pooka 	}
    286  1.168    pooka 	printf("WARNING: DELAY ESCAPED\n");
    287   1.67    pooka }
    288   1.69    pooka void (*delay_func)(unsigned int) = rump_delay;
    289  1.167    pooka __strong_alias(delay,rump_delay);
    290  1.167    pooka __strong_alias(_delay,rump_delay);
    291   1.67    pooka 
    292  1.142    pooka /*
    293  1.142    pooka  * Provide weak aliases for tty routines used by printf.
    294  1.142    pooka  * They will be used unless the rumpkern_tty component is present.
    295  1.142    pooka  */
    296  1.142    pooka 
    297  1.142    pooka int rump_ttycheckoutq(struct tty *, int);
    298  1.105    pooka int
    299  1.142    pooka rump_ttycheckoutq(struct tty *tp, int wait)
    300   1.67    pooka {
    301   1.67    pooka 
    302   1.67    pooka 	return 1;
    303   1.67    pooka }
    304  1.142    pooka __weak_alias(ttycheckoutq,rump_ttycheckoutq);
    305   1.67    pooka 
    306  1.142    pooka int rump_tputchar(int, int, struct tty *);
    307  1.142    pooka int
    308  1.142    pooka rump_tputchar(int c, int flags, struct tty *tp)
    309  1.142    pooka {
    310  1.142    pooka 
    311  1.142    pooka 	cnputc(c);
    312  1.142    pooka 	return 0;
    313  1.142    pooka }
    314  1.142    pooka __weak_alias(tputchar,rump_tputchar);
    315  1.142    pooka 
/* Console output: pass the character on to rumpuser_putchar(). */
void
cnputc(int c)
{
	rumpuser_putchar(c);
}
    322   1.67    pooka 
/* Console flush: there is nothing to do here, so this is a no-op. */
void
cnflush(void)
{
}
    329   1.67    pooka 
/*
 * Setting clocks is not in the jurisdiction of rump kernels, so this
 * deliberately does nothing.
 */
void
resettodr(void)
{
}
    336  1.163    pooka 
#ifdef __HAVE_SYSCALL_INTERN
/*
 * Per-process syscall setup hook, referenced from emul_netbsd.
 * The only action is to reset the process's emulation data pointer.
 */
void
syscall_intern(struct proc *p)
{
	p->p_emuldata = NULL;
}
#endif
    345  1.144    pooka 
#ifdef LOCKDEBUG
/*
 * Built only under LOCKDEBUG.  Prints nothing: both the object and the
 * print callback are ignored.
 */
void
turnstile_print(volatile void *obj, void (*pr)(const char *, ...))
{
}
#endif
    354  1.165    pooka 
    355  1.165    pooka void
    356  1.165    pooka cpu_reboot(int howto, char *bootstr)
    357  1.165    pooka {
    358  1.165    pooka 	int ruhow = 0;
    359  1.165    pooka 	void *finiarg;
    360  1.165    pooka 
    361  1.165    pooka 	printf("rump kernel halting...\n");
    362  1.165    pooka 
    363  1.165    pooka 	if (!RUMP_LOCALPROC_P(curproc))
    364  1.170    pooka 		finiarg = RUMP_SPVM2CTL(curproc->p_vmspace);
    365  1.165    pooka 	else
    366  1.165    pooka 		finiarg = NULL;
    367  1.165    pooka 
    368  1.165    pooka 	/* dump means we really take the dive here */
    369  1.165    pooka 	if ((howto & RB_DUMP) || panicstr) {
    370  1.165    pooka 		ruhow = RUMPUSER_PANIC;
    371  1.165    pooka 		goto out;
    372  1.165    pooka 	}
    373  1.165    pooka 
    374  1.165    pooka 	/* try to sync */
    375  1.165    pooka 	if (!((howto & RB_NOSYNC) || panicstr)) {
    376  1.165    pooka 		rump_vfs_fini();
    377  1.165    pooka 	}
    378  1.165    pooka 
    379  1.165    pooka 	doshutdownhooks();
    380  1.165    pooka 
    381  1.165    pooka 	/* your wish is my command */
    382  1.165    pooka 	if (howto & RB_HALT) {
    383  1.172    pooka 		printf("rump kernel halted (with RB_HALT, not exiting)\n");
    384  1.169    pooka 		rump_sysproxy_fini(finiarg);
    385  1.165    pooka 		for (;;) {
    386  1.165    pooka 			rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, 10, 0);
    387  1.165    pooka 		}
    388  1.165    pooka 	}
    389  1.165    pooka 
    390  1.165    pooka 	/* this function is __dead, we must exit */
    391  1.165    pooka  out:
    392  1.169    pooka 	rump_sysproxy_fini(finiarg);
    393  1.165    pooka 	rumpuser_exit(ruhow);
    394  1.165    pooka }
    395  1.173    pooka 
/* Return the fixed model name reported for the rump kernel's CPU. */
const char *
cpu_getmodel(void)
{
	static const char model[] = "rumpcore (virtual)";

	return model;
}
    402