Home | History | Annotate | Line # | Download | only in rumpkern
      1  1.202       bad /*	$NetBSD: emul.c,v 1.202 2024/07/28 13:01:55 bad Exp $	*/
      2    1.1     pooka 
      3    1.1     pooka /*
      4  1.150     pooka  * Copyright (c) 2007-2011 Antti Kantee.  All Rights Reserved.
      5    1.1     pooka  *
      6    1.1     pooka  * Redistribution and use in source and binary forms, with or without
      7    1.1     pooka  * modification, are permitted provided that the following conditions
      8    1.1     pooka  * are met:
      9    1.1     pooka  * 1. Redistributions of source code must retain the above copyright
     10    1.1     pooka  *    notice, this list of conditions and the following disclaimer.
     11    1.1     pooka  * 2. Redistributions in binary form must reproduce the above copyright
     12    1.1     pooka  *    notice, this list of conditions and the following disclaimer in the
     13    1.1     pooka  *    documentation and/or other materials provided with the distribution.
     14    1.1     pooka  *
     15    1.1     pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     16    1.1     pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     17    1.1     pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     18    1.1     pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     19    1.1     pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     20    1.1     pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     21    1.1     pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     22    1.1     pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     23    1.1     pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     24    1.1     pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     25    1.1     pooka  * SUCH DAMAGE.
     26    1.1     pooka  */
     27    1.1     pooka 
     28   1.61     pooka #include <sys/cdefs.h>
     29  1.202       bad __KERNEL_RCSID(0, "$NetBSD: emul.c,v 1.202 2024/07/28 13:01:55 bad Exp $");
     30    1.9     pooka 
     31    1.1     pooka #include <sys/param.h>
     32  1.176     pooka #include <sys/cprng.h>
     33  1.176     pooka #include <sys/filedesc.h>
     34  1.181   hannken #include <sys/fstrans.h>
     35    1.1     pooka #include <sys/kauth.h>
     36   1.66     pooka #include <sys/module.h>
     37   1.67     pooka #include <sys/reboot.h>
     38  1.154     pooka #include <sys/syscall.h>
     39  1.185     ozaki #include <sys/pserialize.h>
     40  1.178     ozaki #ifdef LOCKDEBUG
     41  1.178     ozaki #include <sys/sleepq.h>
     42  1.178     ozaki #endif
     43  1.201  riastrad #include <sys/syncobj.h>
     44   1.67     pooka 
     45   1.67     pooka #include <dev/cons.h>
     46    1.1     pooka 
     47  1.179     pooka #include <rump-sys/kern.h>
     48  1.179     pooka 
     49   1.44     pooka #include <rump/rumpuser.h>
     50   1.44     pooka 
     51  1.165     pooka void (*rump_vfs_fini)(void) = (void *)nullop;
     52  1.165     pooka 
     53  1.149     pooka /*
     54  1.149     pooka  * physmem is largely unused (except for nmbcluster calculations),
     55  1.149     pooka  * so pick a default value which suits ZFS.  if an application wants
     56  1.149     pooka  * a very small memory footprint, it can still adjust this before
     57  1.149     pooka  * calling rump_init()
     58  1.149     pooka  */
     59  1.149     pooka #define PHYSMEM 512*256
     60  1.180    cherry psize_t physmem = PHYSMEM;
     61  1.197     skrll size_t nkmempages = PHYSMEM/2; /* from le chapeau */
     62  1.149     pooka #undef PHYSMEM
     63  1.149     pooka 
     64    1.1     pooka struct vnode *rootvp;
     65  1.124     pooka dev_t rootdev = NODEV;
     66  1.149     pooka 
     67   1.19     pooka const int schedppq = 1;
     68   1.66     pooka int cold = 1;
     69  1.195   thorpej int shutting_down;
     70   1.95     pooka int boothowto = AB_SILENT;
     71   1.67     pooka struct tty *constty;
     72    1.1     pooka 
     73  1.135     pooka const struct bdevsw *bdevsw0[255];
     74   1.64     pooka const struct bdevsw **bdevsw = bdevsw0;
     75  1.202       bad const int sys_bdevsws = 255;
     76  1.202       bad int max_bdevsws = 255;
     77   1.64     pooka 
     78  1.135     pooka const struct cdevsw *cdevsw0[255];
     79   1.64     pooka const struct cdevsw **cdevsw = cdevsw0;
     80  1.202       bad const int sys_cdevsws = 255;
     81  1.202       bad int max_cdevsws = 255;
     82   1.64     pooka 
     83   1.76     pooka int mem_no = 2;
     84   1.76     pooka 
     85  1.151       chs device_t booted_device;
     86  1.151       chs device_t booted_wedge;
     87  1.200      manu daddr_t booted_startblk;
     88  1.200      manu uint64_t booted_nblks;
     89   1.92     pooka int booted_partition;
     90  1.183  christos const char *booted_method;
     91   1.92     pooka 
     92  1.120     pooka /* XXX: unused */
     93   1.76     pooka kmutex_t tty_lock;
     94  1.120     pooka krwlock_t exec_lock;
     95   1.64     pooka 
     96  1.139     pooka /* sparc doesn't sport constant page size, pretend we have 4k pages */
     97  1.109     pooka #ifdef __sparc__
     98  1.109     pooka int nbpg = 4096;
     99  1.139     pooka int pgofset = 4096-1;
    100  1.139     pooka int pgshift = 12;
    101  1.109     pooka #endif
    102  1.109     pooka 
    103  1.146   tsutsui /* on sun3 VM_MAX_ADDRESS is a const variable */
    104  1.146   tsutsui /* XXX: should be moved into rump.c and initialize for sun3 and sun3x? */
    105  1.141     pooka #ifdef sun3
    106  1.146   tsutsui const vaddr_t kernbase = KERNBASE3;
    107  1.140     pooka #endif
    108  1.140     pooka 
    109  1.117     pooka struct loadavg averunnable = {
    110  1.117     pooka 	{ 0 * FSCALE,
    111  1.117     pooka 	  1 * FSCALE,
    112  1.117     pooka 	  11 * FSCALE, },
    113  1.117     pooka 	FSCALE,
    114  1.117     pooka };
    115  1.117     pooka 
    116  1.174  pgoyette /*
    117  1.174  pgoyette  * Include the autogenerated list of auto-loadable syscalls
    118  1.174  pgoyette  */
    119  1.174  pgoyette #include <kern/syscalls_autoload.c>
    120  1.174  pgoyette 
    121  1.126     pooka struct emul emul_netbsd = {
    122  1.126     pooka 	.e_name = "netbsd-rump",
    123  1.126     pooka 	.e_sysent = rump_sysent,
    124  1.186  pgoyette 	.e_nomodbits = rump_sysent_nomodbits,
    125  1.154     pooka #ifndef __HAVE_MINIMAL_EMUL
    126  1.154     pooka 	.e_nsysent = SYS_NSYSENT,
    127  1.154     pooka #endif
    128  1.128     pooka 	.e_vm_default_addr = uvm_default_mapaddr,
    129  1.138     pooka #ifdef __HAVE_SYSCALL_INTERN
    130  1.138     pooka 	.e_syscall_intern = syscall_intern,
    131  1.138     pooka #endif
    132  1.174  pgoyette 	.e_sc_autoload = netbsd_syscalls_autoload,
    133  1.126     pooka };
    134  1.126     pooka 
    135  1.164     pooka /* not used, but need the symbols for pointer comparisons */
    136  1.164     pooka syncobj_t mutex_syncobj, rw_syncobj;
    137  1.164     pooka 
    138   1.20     pooka int
    139   1.20     pooka kpause(const char *wmesg, bool intr, int timeo, kmutex_t *mtx)
    140   1.20     pooka {
    141   1.20     pooka 	extern int hz;
    142  1.166    justin 	int rv __diagused;
    143   1.78     pooka 	uint64_t sec, nsec;
    144  1.127     pooka 
    145   1.20     pooka 	if (mtx)
    146   1.20     pooka 		mutex_exit(mtx);
    147   1.40     pooka 
    148   1.78     pooka 	sec = timeo / hz;
    149   1.78     pooka 	nsec = (timeo % hz) * (1000000000 / hz);
    150  1.158     pooka 	rv = rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, sec, nsec);
    151  1.156     pooka 	KASSERT(rv == 0);
    152  1.156     pooka 
    153   1.20     pooka 	if (mtx)
    154   1.20     pooka 		mutex_enter(mtx);
    155   1.20     pooka 
    156   1.20     pooka 	return 0;
    157   1.20     pooka }
    158   1.27     pooka 
    159   1.34      yamt vaddr_t
    160  1.155      para calc_cache_size(vsize_t vasz, int pct, int va_pct)
    161   1.34      yamt {
    162   1.34      yamt 	paddr_t t;
    163   1.34      yamt 
    164   1.34      yamt 	t = (paddr_t)physmem * pct / 100 * PAGE_SIZE;
    165   1.34      yamt 	if ((vaddr_t)t != t) {
    166   1.34      yamt 		panic("%s: needs tweak", __func__);
    167   1.34      yamt 	}
    168   1.34      yamt 	return t;
    169   1.34      yamt }
    170   1.35    martin 
#define	RETURN_ADDRESS	((uintptr_t)__builtin_return_address(0))

/*
 * assert_sleepable: panic if the caller is not allowed to sleep.
 *
 * The only condition checked is pserialize_not_in_read_section();
 * otherwise we are always considered sleepable, although we should
 * improve this.  The panic message includes the caller's return address.
 */
void
assert_sleepable(void)
{
	const char *why;

	why = pserialize_not_in_read_section() ? NULL : "pserialize";

	if (why != NULL)
		panic("%s: %s caller=%p", __func__, why,
		    (void *)RETURN_ADDRESS);
}
    189   1.43     pooka 
/*
 * module_init_md: machine-dependent module initialization hook.
 *
 * Intentionally empty for now.  However, we should load the librump
 * symbol table here.
 */
void
module_init_md(void)
{
}
    199   1.67     pooka 
    200  1.167     pooka /*
    201  1.167     pooka  * Try to emulate all the MD definitions of DELAY() / delay().
    202  1.167     pooka  * Would be nice to fix the #defines in MD headers, but this quicker.
    203  1.168     pooka  *
    204  1.168     pooka  * XXX: we'd need a rumpuser_clock_sleep_nowrap() here.  Since we
    205  1.168     pooka  * don't have it in the current hypercall revision, busyloop.
    206  1.168     pooka  * Note that rather than calibrate a loop delay and work with that,
    207  1.168     pooka  * get call gettime (which does not block) in a loop to make sure
    208  1.168     pooka  * we didn't get virtual ghosttime.  That might be slightly inaccurate
    209  1.168     pooka  * for very small delays ...
    210  1.168     pooka  *
    211  1.168     pooka  * The other option would be to run a thread in the hypervisor which
    212  1.168     pooka  * sleeps for us and we can wait for it using rumpuser_cv_wait_nowrap()
    213  1.168     pooka  * Probably too fussy.  Better just wait for hypercall rev 18 ;)
    214  1.167     pooka  */
    215   1.69     pooka static void
    216   1.69     pooka rump_delay(unsigned int us)
    217   1.67     pooka {
    218  1.168     pooka 	struct timespec target, tmp;
    219  1.168     pooka 	uint64_t sec, sec_ini, sec_now;
    220  1.168     pooka 	long nsec, nsec_ini, nsec_now;
    221  1.168     pooka 	int loops;
    222  1.168     pooka 
    223  1.168     pooka 	rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO, &sec_ini, &nsec_ini);
    224   1.67     pooka 
    225  1.167     pooka #ifdef __mac68k__
    226  1.167     pooka 	sec = us / 1000;
    227  1.167     pooka 	nsec = (us % 1000) * 1000000;
    228  1.167     pooka #else
    229   1.78     pooka 	sec = us / 1000000;
    230   1.78     pooka 	nsec = (us % 1000000) * 1000;
    231  1.167     pooka #endif
    232   1.67     pooka 
    233  1.168     pooka 	target.tv_sec = sec_ini;
    234  1.168     pooka 	tmp.tv_sec = sec;
    235  1.168     pooka 	target.tv_nsec = nsec_ini;
    236  1.168     pooka 	tmp.tv_nsec = nsec;
    237  1.168     pooka 	timespecadd(&target, &tmp, &target);
    238  1.168     pooka 
    239   1.78     pooka 	if (__predict_false(sec != 0))
    240   1.67     pooka 		printf("WARNING: over 1s delay\n");
    241   1.67     pooka 
    242  1.168     pooka 	for (loops = 0; loops < 1000*1000*100; loops++) {
    243  1.168     pooka 		struct timespec cur;
    244  1.168     pooka 
    245  1.168     pooka 		rumpuser_clock_gettime(RUMPUSER_CLOCK_ABSMONO,
    246  1.168     pooka 		    &sec_now, &nsec_now);
    247  1.168     pooka 		cur.tv_sec = sec_now;
    248  1.168     pooka 		cur.tv_nsec = nsec_now;
    249  1.168     pooka 		if (timespeccmp(&cur, &target, >=)) {
    250  1.168     pooka 			return;
    251  1.168     pooka 		}
    252  1.168     pooka 	}
    253  1.168     pooka 	printf("WARNING: DELAY ESCAPED\n");
    254   1.67     pooka }
    255   1.69     pooka void (*delay_func)(unsigned int) = rump_delay;
    256  1.167     pooka __strong_alias(delay,rump_delay);
    257  1.167     pooka __strong_alias(_delay,rump_delay);
    258   1.67     pooka 
    259  1.191       kre /* Weak alias for getcwd_common to be used unless librumpvfs is present. */
    260  1.191       kre 
    261  1.191       kre int rump_getcwd_common(struct vnode *, struct vnode *, char **, char *,
    262  1.191       kre     int, int, struct lwp *);
    263  1.191       kre int
    264  1.191       kre rump_getcwd_common(struct vnode *lvp, struct vnode *rvp, char **bpp, char *bufp,
    265  1.191       kre     int limit, int flags, struct lwp *l)
    266  1.191       kre {
    267  1.191       kre 
    268  1.191       kre 	return ENOENT;
    269  1.191       kre }
    270  1.191       kre __weak_alias(getcwd_common,rump_getcwd_common);
    271  1.191       kre 
    272  1.192       bad /* Weak alias for vnode_to_path to be used unless librumpvfs is present. */
    273  1.192       bad 
    274  1.192       bad int rump_vnode_to_path(char *, size_t, struct vnode *, struct lwp *,
    275  1.192       bad     struct proc *);
    276  1.192       bad int
    277  1.192       bad rump_vnode_to_path(char *path, size_t len, struct vnode *vp, struct lwp *curl,
    278  1.192       bad     struct proc *p)
    279  1.192       bad {
    280  1.192       bad 
    281  1.192       bad 	return ENOENT; /* pretend getcwd_common() failed. */
    282  1.192       bad }
    283  1.192       bad __weak_alias(vnode_to_path,rump_vnode_to_path);
    284  1.192       bad 
    285  1.192       bad 
    286  1.181   hannken /* Weak aliases for fstrans to be used unless librumpvfs is present. */
    287  1.181   hannken 
    288  1.182   hannken void rump_fstrans_start(struct mount *);
    289  1.182   hannken void
    290  1.182   hannken rump_fstrans_start(struct mount *mp)
    291  1.182   hannken {
    292  1.182   hannken 
    293  1.182   hannken }
    294  1.182   hannken __weak_alias(fstrans_start,rump_fstrans_start);
    295  1.182   hannken 
    296  1.182   hannken int rump_fstrans_start_nowait(struct mount *);
    297  1.181   hannken int
    298  1.182   hannken rump_fstrans_start_nowait(struct mount *mp)
    299  1.181   hannken {
    300  1.181   hannken 
    301  1.181   hannken 	return 0;
    302  1.181   hannken }
    303  1.182   hannken __weak_alias(fstrans_start_nowait,rump_fstrans_start_nowait);
    304  1.181   hannken 
    305  1.187   hannken void rump_fstrans_start_lazy(struct mount *);
    306  1.187   hannken void
    307  1.187   hannken rump_fstrans_start_lazy(struct mount *mp)
    308  1.187   hannken {
    309  1.187   hannken 
    310  1.187   hannken }
    311  1.187   hannken __weak_alias(fstrans_start_lazy,rump_fstrans_start_lazy);
    312  1.187   hannken 
    313  1.187   hannken 
    314  1.181   hannken void rump_fstrans_done(struct mount *);
    315  1.181   hannken void
    316  1.181   hannken rump_fstrans_done(struct mount *mp)
    317  1.181   hannken {
    318  1.181   hannken 
    319  1.181   hannken }
    320  1.181   hannken __weak_alias(fstrans_done,rump_fstrans_done);
    321  1.181   hannken 
    322  1.190   hannken 
    323  1.190   hannken void rump_fstrans_lwp_dtor(struct lwp *);
    324  1.190   hannken void
    325  1.190   hannken rump_fstrans_lwp_dtor(struct lwp *l)
    326  1.190   hannken {
    327  1.190   hannken 
    328  1.190   hannken }
    329  1.190   hannken __weak_alias(fstrans_lwp_dtor,rump_fstrans_lwp_dtor);
    330  1.190   hannken 
    331  1.198  riastrad static int
    332  1.198  riastrad rump_filt_fsattach(struct knote *kn)
    333  1.198  riastrad {
    334  1.198  riastrad 
    335  1.198  riastrad 	return EOPNOTSUPP;
    336  1.198  riastrad }
    337  1.198  riastrad 
    338  1.198  riastrad struct filterops rump_fs_filtops = {
    339  1.198  riastrad 	.f_attach = rump_filt_fsattach,
    340  1.198  riastrad };
    341  1.198  riastrad __weak_alias(fs_filtops,rump_fs_filtops);
    342  1.198  riastrad 
    343  1.199  riastrad struct pool_cache *rump_pnbuf_cache;
    344  1.199  riastrad __weak_alias(pnbuf_cache,rump_pnbuf_cache);
    345  1.199  riastrad 
    346  1.142     pooka /*
    347  1.142     pooka  * Provide weak aliases for tty routines used by printf.
    348  1.142     pooka  * They will be used unless the rumpkern_tty component is present.
    349  1.142     pooka  */
    350  1.142     pooka 
    351  1.142     pooka int rump_ttycheckoutq(struct tty *, int);
    352  1.105     pooka int
    353  1.142     pooka rump_ttycheckoutq(struct tty *tp, int wait)
    354   1.67     pooka {
    355   1.67     pooka 
    356   1.67     pooka 	return 1;
    357   1.67     pooka }
    358  1.142     pooka __weak_alias(ttycheckoutq,rump_ttycheckoutq);
    359   1.67     pooka 
    360  1.142     pooka int rump_tputchar(int, int, struct tty *);
    361  1.142     pooka int
    362  1.142     pooka rump_tputchar(int c, int flags, struct tty *tp)
    363  1.142     pooka {
    364  1.142     pooka 
    365  1.142     pooka 	cnputc(c);
    366  1.142     pooka 	return 0;
    367  1.142     pooka }
    368  1.142     pooka __weak_alias(tputchar,rump_tputchar);
    369  1.142     pooka 
/* cnputc: console output of one character via the rumpuser_putchar() hypercall. */
void
cnputc(int c)
{
	rumpuser_putchar(c);
}
    376   1.67     pooka 
/* cnflush: console flush; there is nothing to do here. */
void
cnflush(void)
{
	/* done */
}
    383   1.67     pooka 
/*
 * resettodr: intentionally a no-op, since setting clocks is not in the
 * jurisdiction of rump kernels.
 */
void
resettodr(void)
{
}
    390  1.163     pooka 
#ifdef __HAVE_SYSCALL_INTERN
/*
 * syscall_intern: only compiled when __HAVE_SYSCALL_INTERN is defined.
 * Clears the process's p_emuldata pointer and does nothing else.
 */
void
syscall_intern(struct proc *p)
{
	p->p_emuldata = NULL;
}
#endif
    399  1.144     pooka 
#ifdef LOCKDEBUG
/*
 * turnstile_print: only compiled under LOCKDEBUG.  Prints nothing;
 * both arguments are ignored.
 */
void
turnstile_print(volatile void *obj, void (*pr)(const char *, ...))
{
	/* nada */
}
#endif
    408  1.165     pooka 
    409  1.165     pooka void
    410  1.165     pooka cpu_reboot(int howto, char *bootstr)
    411  1.165     pooka {
    412  1.165     pooka 	int ruhow = 0;
    413  1.165     pooka 	void *finiarg;
    414  1.165     pooka 
    415  1.165     pooka 	printf("rump kernel halting...\n");
    416  1.165     pooka 
    417  1.165     pooka 	if (!RUMP_LOCALPROC_P(curproc))
    418  1.170     pooka 		finiarg = RUMP_SPVM2CTL(curproc->p_vmspace);
    419  1.165     pooka 	else
    420  1.165     pooka 		finiarg = NULL;
    421  1.165     pooka 
    422  1.165     pooka 	/* dump means we really take the dive here */
    423  1.165     pooka 	if ((howto & RB_DUMP) || panicstr) {
    424  1.165     pooka 		ruhow = RUMPUSER_PANIC;
    425  1.165     pooka 		goto out;
    426  1.165     pooka 	}
    427  1.165     pooka 
    428  1.165     pooka 	/* try to sync */
    429  1.165     pooka 	if (!((howto & RB_NOSYNC) || panicstr)) {
    430  1.165     pooka 		rump_vfs_fini();
    431  1.165     pooka 	}
    432  1.165     pooka 
    433  1.165     pooka 	doshutdownhooks();
    434  1.165     pooka 
    435  1.165     pooka 	/* your wish is my command */
    436  1.165     pooka 	if (howto & RB_HALT) {
    437  1.172     pooka 		printf("rump kernel halted (with RB_HALT, not exiting)\n");
    438  1.169     pooka 		rump_sysproxy_fini(finiarg);
    439  1.165     pooka 		for (;;) {
    440  1.165     pooka 			rumpuser_clock_sleep(RUMPUSER_CLOCK_RELWALL, 10, 0);
    441  1.165     pooka 		}
    442  1.165     pooka 	}
    443  1.165     pooka 
    444  1.165     pooka 	/* this function is __dead, we must exit */
    445  1.165     pooka  out:
    446  1.169     pooka 	rump_sysproxy_fini(finiarg);
    447  1.165     pooka 	rumpuser_exit(ruhow);
    448  1.165     pooka }
    449