Home | History | Annotate | Line # | Download | only in rumpkern
emul.c revision 1.175
      1  1.175     pooka /*	$NetBSD: emul.c,v 1.175 2016/01/18 15:53:38 pooka Exp $	*/
      2    1.1     pooka 
      3    1.1     pooka /*
      4  1.150     pooka  * Copyright (c) 2007-2011 Antti Kantee.  All Rights Reserved.
      5    1.1     pooka  *
      6    1.1     pooka  * Redistribution and use in source and binary forms, with or without
      7    1.1     pooka  * modification, are permitted provided that the following conditions
      8    1.1     pooka  * are met:
      9    1.1     pooka  * 1. Redistributions of source code must retain the above copyright
     10    1.1     pooka  *    notice, this list of conditions and the following disclaimer.
     11    1.1     pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12    1.1     pooka  *    notice, this list of conditions and the following disclaimer in the
     13    1.1     pooka  *    documentation and/or other materials provided with the distribution.
     14    1.1     pooka  *
     15    1.1     pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16    1.1     pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17    1.1     pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18    1.1     pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19    1.1     pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20    1.1     pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21    1.1     pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22    1.1     pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23    1.1     pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24    1.1     pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25    1.1     pooka  * SUCH DAMAGE.
     26    1.1     pooka  */
     27    1.1     pooka 
     28   1.61     pooka #include <sys/cdefs.h>
     29  1.175     pooka __KERNEL_RCSID(0, "$NetBSD: emul.c,v 1.175 2016/01/18 15:53:38 pooka Exp $");
     30    1.9     pooka 
     31    1.1     pooka #include <sys/param.h>
     32    1.1     pooka #include <sys/null.h>
     33    1.1     pooka #include <sys/vnode.h>
     34    1.1     pooka #include <sys/stat.h>
     35   1.35    martin #include <sys/select.h>
     36    1.1     pooka #include <sys/syslog.h>
     37    1.1     pooka #include <sys/namei.h>
     38    1.1     pooka #include <sys/kauth.h>
     39  1.175     pooka #include <sys/kernel.h>
     40    1.1     pooka #include <sys/conf.h>
     41    1.1     pooka #include <sys/device.h>
     42    1.1     pooka #include <sys/queue.h>
     43   1.20     pooka #include <sys/file.h>
     44  1.162     pooka #include <sys/filedesc.h>
     45   1.15        ad #include <sys/cpu.h>
     46   1.17     pooka #include <sys/kmem.h>
     47   1.20     pooka #include <sys/poll.h>
     48   1.66     pooka #include <sys/timetc.h>
     49   1.53     pooka #include <sys/tprintf.h>
     50   1.66     pooka #include <sys/module.h>
     51   1.67     pooka #include <sys/tty.h>
     52   1.67     pooka #include <sys/reboot.h>
     53  1.154     pooka #include <sys/syscall.h>
     54  1.109     pooka #include <sys/syscallvar.h>
     55  1.109     pooka #include <sys/xcall.h>
     56  1.148     pooka #include <sys/sleepq.h>
     57  1.161     pooka #include <sys/cprng.h>
     58   1.67     pooka 
     59   1.67     pooka #include <dev/cons.h>
     60    1.1     pooka 
     61   1.44     pooka #include <rump/rumpuser.h>
     62   1.44     pooka 
     63    1.8     pooka #include <uvm/uvm_map.h>
     64    1.8     pooka 
     65   1.10     pooka #include "rump_private.h"
     66    1.1     pooka 
/*
 * Hook called by cpu_reboot() on its "try to sync" path.  It defaults
 * to nullop.
 * NOTE(review): presumably replaced when a VFS component is present --
 * confirm against whoever assigns this pointer.
 */
void (*rump_vfs_fini)(void) = (void *)nullop;
     68  1.165     pooka 
/*
 * physmem is largely unused (except for nmbcluster calculations),
 * so pick a default value which suits ZFS.  If an application wants
 * a very small memory footprint, it can still adjust this before
 * calling rump_init().
 *
 * PHYSMEM is a file-local helper; its body is parenthesized so that
 * it expands as a single value no matter which operators surround it.
 */
#define PHYSMEM (512*256)
int physmem = PHYSMEM;
int nkmempages = PHYSMEM/2; /* from le chapeau */
#undef PHYSMEM
     79  1.149     pooka 
/*
 * Statically initialized lwp0: lid 1, attached to proc0 and using
 * filedesc0 as its file descriptor table.
 */
struct lwp lwp0 = {
	.l_lid = 1,
	.l_proc = &proc0,
	.l_fd = &filedesc0,
};
struct vnode *rootvp;
dev_t rootdev = NODEV;		/* starts out as "no device" */

const int schedppq = 1;
bool mp_online = false;
struct timespec boottime;
int cold = 1;			/* starts out set */
int boothowto = AB_SILENT;	/* default boot flags: AB_SILENT only */
struct tty *constty;
     94    1.1     pooka 
/*
 * Device switch tables.  Each static backing array has room for 255
 * entries and is reached through a pointer (bdevsw / cdevsw) that
 * initially refers to that array.
 */
const struct bdevsw *bdevsw0[255];
const struct cdevsw *cdevsw0[255];
const struct bdevsw **bdevsw = bdevsw0;
const struct cdevsw **cdevsw = cdevsw0;

/* table sizes: the sys_* values are constant, the max_* values are not */
const int sys_bdevsws = 255;
const int sys_cdevsws = 255;
int max_bdevsws = 255;
int max_cdevsws = 255;
    104   1.64     pooka 
/* NOTE(review): presumably the major number of the memory device -- confirm */
int mem_no = 2;

/* boot device bookkeeping; none of these are given an initial value here */
device_t booted_device;
device_t booted_wedge;
int booted_partition;

/* XXX: unused */
kmutex_t tty_lock;
krwlock_t exec_lock;

/* list head for all lwps, statically set up with LIST_HEAD_INITIALIZER */
struct lwplist alllwp = LIST_HEAD_INITIALIZER(alllwp);
    116  1.125     pooka 
/*
 * sparc doesn't sport a constant page size, so pretend we have 4k pages.
 * The three values agree with each other: 4096 bytes per page, an
 * offset mask of 4096-1 and a shift of 12.
 */
#ifdef __sparc__
int nbpg = 4096;
int pgofset = 4096-1;
int pgshift = 12;
#endif

/* on sun3 VM_MAX_ADDRESS is a const variable */
/* XXX: should be moved into rump.c and initialize for sun3 and sun3x? */
#ifdef sun3
const vaddr_t kernbase = KERNBASE3;
#endif
    129  1.140     pooka 
/*
 * Static load average record: three values expressed in units of
 * FSCALE (0, 1 and 11), followed by FSCALE itself.
 * NOTE(review): presumably the three entries are the 1/5/15 minute
 * averages and the last member is the scale factor -- confirm against
 * the struct loadavg definition.
 */
struct loadavg averunnable = {
	{ 0 * FSCALE,
	  1 * FSCALE,
	  11 * FSCALE, },
	FSCALE,
};
    136  1.117     pooka 
    137  1.174  pgoyette /*
    138  1.174  pgoyette  * Include the autogenerated list of auto-loadable syscalls
    139  1.174  pgoyette  */
    140  1.174  pgoyette #include <kern/syscalls_autoload.c>
    141  1.174  pgoyette 
/*
 * Emulation descriptor named "netbsd-rump", using rump_sysent as its
 * system call table.  The syscall count is only filled in when
 * __HAVE_MINIMAL_EMUL is not defined, and the syscall_intern hook only
 * when __HAVE_SYSCALL_INTERN is defined.
 */
struct emul emul_netbsd = {
	.e_name = "netbsd-rump",
	.e_sysent = rump_sysent,
#ifndef __HAVE_MINIMAL_EMUL
	.e_nsysent = SYS_NSYSENT,
#endif
	.e_vm_default_addr = uvm_default_mapaddr,
#ifdef __HAVE_SYSCALL_INTERN
	.e_syscall_intern = syscall_intern,
#endif
	/* presumably supplied by the generated syscalls_autoload.c include */
	.e_sc_autoload = netbsd_syscalls_autoload,
};
    154  1.126     pooka 
/* NOTE(review): process count; presumably starts at 1 for proc0 -- confirm */
u_int nprocs = 1;

/* not initialized here; NOTE(review): presumably set up during bootstrap */
cprng_strong_t *kern_cprng;

/* not used, but need the symbols for pointer comparisons */
syncobj_t mutex_syncobj, rw_syncobj;
    161  1.164     pooka 
    162   1.20     pooka int
    163   1.20     pooka kpause(const char *wmesg, bool intr, int timeo, kmutex_t *mtx)
    164   1.20     pooka {
    165   1.20     pooka 	extern int hz;
    166  1.166    justin 	int rv __diagused;
    167   1.78     pooka 	uint64_t sec, nsec;
    168  1.127     pooka 
    169   1.20     pooka 	if (mtx)
    170   1.20     pooka 		mutex_exit(mtx);
    171   1.40     pooka 
    172   1.78     pooka 	sec = timeo / hz;
    173   1.78     pooka 	nsec = (timeo % hz) * (1000000000 / hz);
    174  1.158     pooka 	rv = rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, sec, nsec);
    175  1.156     pooka 	KASSERT(rv == 0);
    176  1.156     pooka 
    177   1.20     pooka 	if (mtx)
    178   1.20     pooka 		mutex_enter(mtx);
    179   1.20     pooka 
    180   1.20     pooka 	return 0;
    181   1.20     pooka }
    182   1.27     pooka 
    183   1.27     pooka void
    184   1.32       bjs lwp_unsleep(lwp_t *l, bool cleanup)
    185   1.32       bjs {
    186   1.32       bjs 
    187   1.32       bjs 	KASSERT(mutex_owned(l->l_mutex));
    188   1.32       bjs 
    189  1.104     rmind 	(*l->l_syncobj->sobj_unsleep)(l, cleanup);
    190   1.32       bjs }
    191   1.34      yamt 
    192  1.145     pooka void
    193  1.145     pooka lwp_update_creds(struct lwp *l)
    194  1.145     pooka {
    195  1.145     pooka 	struct proc *p;
    196  1.145     pooka 	kauth_cred_t oldcred;
    197  1.145     pooka 
    198  1.145     pooka 	p = l->l_proc;
    199  1.145     pooka 	oldcred = l->l_cred;
    200  1.145     pooka 	l->l_prflag &= ~LPR_CRMOD;
    201  1.145     pooka 
    202  1.145     pooka 	mutex_enter(p->p_lock);
    203  1.145     pooka 	kauth_cred_hold(p->p_cred);
    204  1.145     pooka 	l->l_cred = p->p_cred;
    205  1.145     pooka 	mutex_exit(p->p_lock);
    206  1.145     pooka 
    207  1.145     pooka 	if (oldcred != NULL)
    208  1.145     pooka 		kauth_cred_free(oldcred);
    209  1.145     pooka }
    210  1.145     pooka 
    211   1.34      yamt vaddr_t
    212  1.155      para calc_cache_size(vsize_t vasz, int pct, int va_pct)
    213   1.34      yamt {
    214   1.34      yamt 	paddr_t t;
    215   1.34      yamt 
    216   1.34      yamt 	t = (paddr_t)physmem * pct / 100 * PAGE_SIZE;
    217   1.34      yamt 	if ((vaddr_t)t != t) {
    218   1.34      yamt 		panic("%s: needs tweak", __func__);
    219   1.34      yamt 	}
    220   1.34      yamt 	return t;
    221   1.34      yamt }
    222   1.35    martin 
/*
 * Sleepability assertion.  This implementation checks nothing: every
 * caller is treated as sleepable, although we should improve this.
 */
void
assert_sleepable(void)
{
}
    229   1.43     pooka 
/*
 * Machine-dependent module initialization.  Nothing is done for now.
 * However, we should load the librump symbol table here.
 */
void
module_init_md(void)
{
}
    239   1.67     pooka 
    240  1.167     pooka /*
    241  1.167     pooka  * Try to emulate all the MD definitions of DELAY() / delay().
    242  1.167     pooka  * Would be nice to fix the #defines in MD headers, but this quicker.
    243  1.168     pooka  *
    244  1.168     pooka  * XXX: we'd need a rumpuser_clock_sleep_nowrap() here.  Since we
    245  1.168     pooka  * don't have it in the current hypercall revision, busyloop.
    246  1.168     pooka  * Note that rather than calibrate a loop delay and work with that,
    247  1.168     pooka  * get call gettime (which does not block) in a loop to make sure
    248  1.168     pooka  * we didn't get virtual ghosttime.  That might be slightly inaccurate
    249  1.168     pooka  * for very small delays ...
    250  1.168     pooka  *
    251  1.168     pooka  * The other option would be to run a thread in the hypervisor which
    252  1.168     pooka  * sleeps for us and we can wait for it using rumpuser_cv_wait_nowrap()
    253  1.168     pooka  * Probably too fussy.  Better just wait for hypercall rev 18 ;)
    254  1.167     pooka  */
    255   1.69     pooka static void
    256   1.69     pooka rump_delay(unsigned int us)
    257   1.67     pooka {
    258  1.168     pooka 	struct timespec target, tmp;
    259  1.168     pooka 	uint64_t sec, sec_ini, sec_now;
    260  1.168     pooka 	long nsec, nsec_ini, nsec_now;
    261  1.168     pooka 	int loops;
    262  1.168     pooka 
    263  1.168     pooka 	rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO, &sec_ini, &nsec_ini);
    264   1.67     pooka 
    265  1.167     pooka #ifdef __mac68k__
    266  1.167     pooka 	sec = us / 1000;
    267  1.167     pooka 	nsec = (us % 1000) * 1000000;
    268  1.167     pooka #else
    269   1.78     pooka 	sec = us / 1000000;
    270   1.78     pooka 	nsec = (us % 1000000) * 1000;
    271  1.167     pooka #endif
    272   1.67     pooka 
    273  1.168     pooka 	target.tv_sec = sec_ini;
    274  1.168     pooka 	tmp.tv_sec = sec;
    275  1.168     pooka 	target.tv_nsec = nsec_ini;
    276  1.168     pooka 	tmp.tv_nsec = nsec;
    277  1.168     pooka 	timespecadd(&target, &tmp, &target);
    278  1.168     pooka 
    279   1.78     pooka 	if (__predict_false(sec != 0))
    280   1.67     pooka 		printf("WARNING: over 1s delay\n");
    281   1.67     pooka 
    282  1.168     pooka 	for (loops = 0; loops < 1000*1000*100; loops++) {
    283  1.168     pooka 		struct timespec cur;
    284  1.168     pooka 
    285  1.168     pooka 		rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO,
    286  1.168     pooka 		    &sec_now, &nsec_now);
    287  1.168     pooka 		cur.tv_sec = sec_now;
    288  1.168     pooka 		cur.tv_nsec = nsec_now;
    289  1.168     pooka 		if (timespeccmp(&cur, &target, >=)) {
    290  1.168     pooka 			return;
    291  1.168     pooka 		}
    292  1.168     pooka 	}
    293  1.168     pooka 	printf("WARNING: DELAY ESCAPED\n");
    294   1.67     pooka }
    295   1.69     pooka void (*delay_func)(unsigned int) = rump_delay;
    296  1.167     pooka __strong_alias(delay,rump_delay);
    297  1.167     pooka __strong_alias(_delay,rump_delay);
    298   1.67     pooka 
    299  1.142     pooka /*
    300  1.142     pooka  * Provide weak aliases for tty routines used by printf.
    301  1.142     pooka  * They will be used unless the rumpkern_tty component is present.
    302  1.142     pooka  */
    303  1.142     pooka 
    304  1.142     pooka int rump_ttycheckoutq(struct tty *, int);
    305  1.105     pooka int
    306  1.142     pooka rump_ttycheckoutq(struct tty *tp, int wait)
    307   1.67     pooka {
    308   1.67     pooka 
    309   1.67     pooka 	return 1;
    310   1.67     pooka }
    311  1.142     pooka __weak_alias(ttycheckoutq,rump_ttycheckoutq);
    312   1.67     pooka 
    313  1.142     pooka int rump_tputchar(int, int, struct tty *);
    314  1.142     pooka int
    315  1.142     pooka rump_tputchar(int c, int flags, struct tty *tp)
    316  1.142     pooka {
    317  1.142     pooka 
    318  1.142     pooka 	cnputc(c);
    319  1.142     pooka 	return 0;
    320  1.142     pooka }
    321  1.142     pooka __weak_alias(tputchar,rump_tputchar);
    322  1.142     pooka 
/*
 * Console output of a single character: c is passed straight on to
 * rumpuser_putchar().
 */
void
cnputc(int c)
{

	rumpuser_putchar(c);
}
    329   1.67     pooka 
/*
 * Console flush.  There is nothing to do here: done already.
 */
void
cnflush(void)
{
}
    336   1.67     pooka 
/*
 * Deliberately empty: setting clocks is not in the jurisdiction of
 * rump kernels.
 */
void
resettodr(void)
{
}
    343  1.163     pooka 
#ifdef __HAVE_SYSCALL_INTERN
/*
 * Hook installed as e_syscall_intern in emul_netbsd.  It only sets
 * p's p_emuldata pointer to NULL.
 */
void
syscall_intern(struct proc *p)
{

	p->p_emuldata = NULL;
}
#endif /* __HAVE_SYSCALL_INTERN */
    352  1.144     pooka 
#ifdef LOCKDEBUG
/*
 * Stub built only with LOCKDEBUG: prints nothing and ignores both
 * obj and pr.
 */
void
turnstile_print(volatile void *obj, void (*pr)(const char *, ...))
{
}
#endif /* LOCKDEBUG */
    361  1.165     pooka 
    362  1.165     pooka void
    363  1.165     pooka cpu_reboot(int howto, char *bootstr)
    364  1.165     pooka {
    365  1.165     pooka 	int ruhow = 0;
    366  1.165     pooka 	void *finiarg;
    367  1.165     pooka 
    368  1.165     pooka 	printf("rump kernel halting...\n");
    369  1.165     pooka 
    370  1.165     pooka 	if (!RUMP_LOCALPROC_P(curproc))
    371  1.170     pooka 		finiarg = RUMP_SPVM2CTL(curproc->p_vmspace);
    372  1.165     pooka 	else
    373  1.165     pooka 		finiarg = NULL;
    374  1.165     pooka 
    375  1.165     pooka 	/* dump means we really take the dive here */
    376  1.165     pooka 	if ((howto & RB_DUMP) || panicstr) {
    377  1.165     pooka 		ruhow = RUMPUSER_PANIC;
    378  1.165     pooka 		goto out;
    379  1.165     pooka 	}
    380  1.165     pooka 
    381  1.165     pooka 	/* try to sync */
    382  1.165     pooka 	if (!((howto & RB_NOSYNC) || panicstr)) {
    383  1.165     pooka 		rump_vfs_fini();
    384  1.165     pooka 	}
    385  1.165     pooka 
    386  1.165     pooka 	doshutdownhooks();
    387  1.165     pooka 
    388  1.165     pooka 	/* your wish is my command */
    389  1.165     pooka 	if (howto & RB_HALT) {
    390  1.172     pooka 		printf("rump kernel halted (with RB_HALT, not exiting)\n");
    391  1.169     pooka 		rump_sysproxy_fini(finiarg);
    392  1.165     pooka 		for (;;) {
    393  1.165     pooka 			rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, 10, 0);
    394  1.165     pooka 		}
    395  1.165     pooka 	}
    396  1.165     pooka 
    397  1.165     pooka 	/* this function is __dead, we must exit */
    398  1.165     pooka  out:
    399  1.169     pooka 	rump_sysproxy_fini(finiarg);
    400  1.165     pooka 	rumpuser_exit(ruhow);
    401  1.165     pooka }
    402  1.173     pooka 
/*
 * Return the CPU model name, which is always the fixed string
 * "rumpcore (virtual)".
 */
const char *
cpu_getmodel(void)
{
	static const char model[] = "rumpcore (virtual)";

	return model;
}
    409