Home | History | Annotate | Line # | Download | only in rumpkern
rump.c revision 1.53
      1  1.53   pooka /*	$NetBSD: rump.c,v 1.53 2008/08/08 14:40:07 pooka Exp $	*/
      2   1.1   pooka 
      3   1.1   pooka /*
      4   1.1   pooka  * Copyright (c) 2007 Antti Kantee.  All Rights Reserved.
      5   1.1   pooka  *
      6   1.1   pooka  * Development of this software was supported by Google Summer of Code.
      7   1.1   pooka  *
      8   1.1   pooka  * Redistribution and use in source and binary forms, with or without
      9   1.1   pooka  * modification, are permitted provided that the following conditions
     10   1.1   pooka  * are met:
     11   1.1   pooka  * 1. Redistributions of source code must retain the above copyright
     12   1.1   pooka  *    notice, this list of conditions and the following disclaimer.
     13   1.1   pooka  * 2. Redistributions in binary form must reproduce the above copyright
     14   1.1   pooka  *    notice, this list of conditions and the following disclaimer in the
     15   1.1   pooka  *    documentation and/or other materials provided with the distribution.
     16   1.1   pooka  *
     17   1.1   pooka  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     18   1.1   pooka  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     19   1.1   pooka  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     20   1.1   pooka  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     21   1.1   pooka  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     22   1.1   pooka  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     23   1.1   pooka  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     24   1.1   pooka  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     25   1.1   pooka  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     26   1.1   pooka  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     27   1.1   pooka  * SUCH DAMAGE.
     28   1.1   pooka  */
     29   1.1   pooka 
     30   1.1   pooka #include <sys/param.h>
     31  1.27   pooka #include <sys/cpu.h>
     32   1.1   pooka #include <sys/filedesc.h>
     33   1.1   pooka #include <sys/kauth.h>
     34  1.14   pooka #include <sys/kmem.h>
     35  1.49  simonb #include <sys/module.h>
     36   1.1   pooka #include <sys/mount.h>
     37   1.1   pooka #include <sys/namei.h>
     38   1.1   pooka #include <sys/queue.h>
     39   1.1   pooka #include <sys/resourcevar.h>
     40  1.27   pooka #include <sys/select.h>
     41   1.1   pooka #include <sys/vnode.h>
     42  1.36   pooka #include <sys/vfs_syscalls.h>
     43  1.49  simonb #include <sys/wapbl.h>
     44  1.51   pooka #include <sys/sysctl.h>
     45   1.1   pooka 
     46   1.4   pooka #include <miscfs/specfs/specdev.h>
     47   1.4   pooka 
     48  1.48   pooka #include <rump/rumpuser.h>
     49  1.48   pooka 
     50   1.8   pooka #include "rump_private.h"
     51   1.1   pooka 
     52  1.40      ad struct proc proc0;
     53   1.1   pooka struct cwdinfo rump_cwdi;
     54   1.1   pooka struct pstats rump_stats;
     55   1.1   pooka struct plimit rump_limits;
     56  1.31   pooka kauth_cred_t rump_cred = RUMPCRED_SUSER;
     57   1.1   pooka struct cpu_info rump_cpu;
     58  1.40      ad struct filedesc rump_filedesc0;
     59  1.36   pooka struct proclist allproc;
     60  1.46      ad char machine[] = "rump";
     61   1.1   pooka 
     62  1.19   pooka kmutex_t rump_giantlock;
     63  1.19   pooka 
     64  1.24   pooka sigset_t sigcantmask;
     65  1.24   pooka 
     66   1.2   pooka struct fakeblk {
     67   1.2   pooka 	char path[MAXPATHLEN];
     68   1.2   pooka 	LIST_ENTRY(fakeblk) entries;
     69   1.2   pooka };
     70   1.2   pooka 
     71   1.2   pooka static LIST_HEAD(, fakeblk) fakeblks = LIST_HEAD_INITIALIZER(fakeblks);
     72   1.2   pooka 
     73  1.29   pooka #ifndef RUMP_WITHOUT_THREADS
     74  1.14   pooka static void
     75  1.14   pooka rump_aiodone_worker(struct work *wk, void *dummy)
     76  1.14   pooka {
     77  1.14   pooka 	struct buf *bp = (struct buf *)wk;
     78  1.14   pooka 
     79  1.14   pooka 	KASSERT(&bp->b_work == wk);
     80  1.14   pooka 	bp->b_iodone(bp);
     81  1.14   pooka }
     82  1.29   pooka #endif /* RUMP_WITHOUT_THREADS */
     83  1.14   pooka 
     84  1.51   pooka static int rump_inited;
     85  1.51   pooka static struct emul emul_rump;
     86  1.27   pooka 
     87   1.1   pooka void
     88   1.1   pooka rump_init()
     89   1.1   pooka {
     90   1.1   pooka 	extern char hostname[];
     91   1.1   pooka 	extern size_t hostnamelen;
     92  1.25   pooka 	extern kmutex_t rump_atomic_lock;
     93  1.36   pooka 	char buf[256];
     94  1.14   pooka 	struct proc *p;
     95  1.14   pooka 	struct lwp *l;
     96   1.1   pooka 	int error;
     97   1.1   pooka 
     98  1.27   pooka 	/* XXX */
     99  1.27   pooka 	if (rump_inited)
    100  1.27   pooka 		return;
    101  1.27   pooka 	rump_inited = 1;
    102  1.27   pooka 
    103  1.36   pooka 	if (rumpuser_getenv("RUMP_NVNODES", buf, sizeof(buf), &error) == 0) {
    104  1.36   pooka 		desiredvnodes = strtoul(buf, NULL, 10);
    105  1.36   pooka 	} else {
    106  1.36   pooka 		desiredvnodes = 1<<16;
    107  1.36   pooka 	}
    108  1.36   pooka 
    109  1.52   pooka 	rumpvm_init();
    110  1.52   pooka 	rump_sleepers_init();
    111  1.52   pooka #ifdef RUMP_USE_REAL_KMEM
    112  1.52   pooka 	kmem_init();
    113  1.52   pooka #endif
    114  1.52   pooka 
    115  1.47      ad 	cache_cpu_init(&rump_cpu);
    116  1.39   pooka 	rw_init(&rump_cwdi.cwdi_lock);
    117  1.14   pooka 	l = &lwp0;
    118  1.40      ad 	p = &proc0;
    119  1.14   pooka 	p->p_stats = &rump_stats;
    120  1.14   pooka 	p->p_cwdi = &rump_cwdi;
    121  1.14   pooka 	p->p_limit = &rump_limits;
    122  1.14   pooka 	p->p_pid = 0;
    123  1.40      ad 	p->p_fd = &rump_filedesc0;
    124  1.27   pooka 	p->p_vmspace = &rump_vmspace;
    125  1.51   pooka 	p->p_emul = &emul_rump;
    126  1.14   pooka 	l->l_cred = rump_cred;
    127  1.14   pooka 	l->l_proc = p;
    128  1.14   pooka 	l->l_lid = 1;
    129  1.36   pooka 
    130  1.36   pooka 	LIST_INSERT_HEAD(&allproc, p, p_list);
    131  1.36   pooka 
    132  1.25   pooka 	mutex_init(&rump_atomic_lock, MUTEX_DEFAULT, IPL_NONE);
    133   1.1   pooka 
    134   1.1   pooka 	rump_limits.pl_rlimit[RLIMIT_FSIZE].rlim_cur = RLIM_INFINITY;
    135  1.27   pooka 	rump_limits.pl_rlimit[RLIMIT_NOFILE].rlim_cur = RLIM_INFINITY;
    136   1.1   pooka 
    137  1.12   pooka 	syncdelay = 0;
    138  1.36   pooka 	dovfsusermount = 1;
    139  1.12   pooka 
    140  1.43   pooka 	rumpuser_thrinit();
    141  1.43   pooka 
    142  1.43   pooka 	fd_sys_init();
    143  1.44      ad 	module_init();
    144  1.51   pooka 	sysctl_init();
    145   1.1   pooka 	vfsinit();
    146   1.5   pooka 	bufinit();
    147  1.49  simonb 	wapbl_init();
    148   1.1   pooka 
    149  1.31   pooka 	rumpvfs_init();
    150  1.31   pooka 
    151  1.21   pooka 	rumpuser_mutex_recursive_init(&rump_giantlock.kmtx_mtx);
    152  1.19   pooka 
    153  1.29   pooka #ifndef RUMP_WITHOUT_THREADS
    154  1.14   pooka 	/* aieeeedondest */
    155  1.14   pooka 	if (workqueue_create(&uvm.aiodone_queue, "aiodoned",
    156  1.14   pooka 	    rump_aiodone_worker, NULL, 0, 0, 0))
    157  1.14   pooka 		panic("aiodoned");
    158  1.29   pooka #endif /* RUMP_WITHOUT_THREADS */
    159  1.14   pooka 
    160   1.1   pooka 	rumpuser_gethostname(hostname, MAXHOSTNAMELEN, &error);
    161   1.1   pooka 	hostnamelen = strlen(hostname);
    162  1.24   pooka 
    163  1.24   pooka 	sigemptyset(&sigcantmask);
    164  1.27   pooka 
    165  1.40      ad 	fd_init(&rump_filedesc0);
    166  1.37   pooka 	rump_cwdi.cwdi_cdir = rootvnode;
    167   1.1   pooka }
    168   1.1   pooka 
    169   1.8   pooka struct mount *
    170   1.8   pooka rump_mnt_init(struct vfsops *vfsops, int mntflags)
    171   1.1   pooka {
    172   1.1   pooka 	struct mount *mp;
    173   1.1   pooka 
    174  1.28   pooka 	mp = kmem_zalloc(sizeof(struct mount), KM_SLEEP);
    175   1.1   pooka 
    176   1.1   pooka 	mp->mnt_op = vfsops;
    177   1.8   pooka 	mp->mnt_flag = mntflags;
    178   1.1   pooka 	TAILQ_INIT(&mp->mnt_vnodelist);
    179  1.45      ad 	rw_init(&mp->mnt_unmounting);
    180  1.45      ad 	mutex_init(&mp->mnt_updating, MUTEX_DEFAULT, IPL_NONE);
    181  1.36   pooka 	mutex_init(&mp->mnt_renamelock, MUTEX_DEFAULT, IPL_NONE);
    182  1.35      ad 	mp->mnt_refcnt = 1;
    183   1.8   pooka 
    184  1.20   pooka 	mount_initspecific(mp);
    185  1.20   pooka 
    186   1.8   pooka 	return mp;
    187   1.8   pooka }
    188   1.8   pooka 
    189   1.8   pooka int
    190  1.22   pooka rump_mnt_mount(struct mount *mp, const char *path, void *data, size_t *dlen)
    191   1.8   pooka {
    192   1.8   pooka 	int rv;
    193   1.8   pooka 
    194  1.22   pooka 	rv = VFS_MOUNT(mp, path, data, dlen);
    195   1.8   pooka 	if (rv)
    196   1.8   pooka 		return rv;
    197   1.8   pooka 
    198  1.27   pooka 	(void) VFS_STATVFS(mp, &mp->mnt_stat);
    199  1.27   pooka 	rv = VFS_START(mp, 0);
    200   1.8   pooka 	if (rv)
    201  1.22   pooka 		VFS_UNMOUNT(mp, MNT_FORCE);
    202   1.8   pooka 
    203   1.8   pooka 	return rv;
    204   1.1   pooka }
    205   1.1   pooka 
    206   1.1   pooka void
    207   1.8   pooka rump_mnt_destroy(struct mount *mp)
    208   1.1   pooka {
    209   1.1   pooka 
    210  1.20   pooka 	mount_finispecific(mp);
    211  1.28   pooka 	kmem_free(mp, sizeof(*mp));
    212   1.1   pooka }
    213   1.1   pooka 
    214   1.1   pooka struct componentname *
    215   1.1   pooka rump_makecn(u_long nameiop, u_long flags, const char *name, size_t namelen,
    216  1.10   pooka 	kauth_cred_t creds, struct lwp *l)
    217   1.1   pooka {
    218   1.1   pooka 	struct componentname *cnp;
    219  1.31   pooka 	const char *cp = NULL;
    220   1.1   pooka 
    221  1.28   pooka 	cnp = kmem_zalloc(sizeof(struct componentname), KM_SLEEP);
    222   1.1   pooka 
    223   1.1   pooka 	cnp->cn_nameiop = nameiop;
    224   1.1   pooka 	cnp->cn_flags = flags;
    225   1.1   pooka 
    226   1.1   pooka 	cnp->cn_pnbuf = PNBUF_GET();
    227   1.1   pooka 	strcpy(cnp->cn_pnbuf, name);
    228   1.1   pooka 	cnp->cn_nameptr = cnp->cn_pnbuf;
    229   1.1   pooka 	cnp->cn_namelen = namelen;
    230  1.31   pooka 	cnp->cn_hash = namei_hash(name, &cp);
    231   1.1   pooka 
    232  1.10   pooka 	cnp->cn_cred = creds;
    233   1.1   pooka 
    234   1.1   pooka 	return cnp;
    235   1.1   pooka }
    236   1.1   pooka 
    237   1.1   pooka void
    238   1.9   pooka rump_freecn(struct componentname *cnp, int flags)
    239   1.1   pooka {
    240   1.1   pooka 
    241   1.9   pooka 	if (flags & RUMPCN_FREECRED)
    242  1.10   pooka 		rump_cred_destroy(cnp->cn_cred);
    243   1.9   pooka 
    244  1.36   pooka 	if ((flags & RUMPCN_HASNTBUF) == 0) {
    245  1.36   pooka 		if (cnp->cn_flags & SAVENAME) {
    246  1.36   pooka 			if (flags & RUMPCN_ISLOOKUP ||cnp->cn_flags & SAVESTART)
    247  1.36   pooka 				PNBUF_PUT(cnp->cn_pnbuf);
    248  1.36   pooka 		} else {
    249   1.1   pooka 			PNBUF_PUT(cnp->cn_pnbuf);
    250  1.36   pooka 		}
    251  1.36   pooka 	}
    252  1.36   pooka 	kmem_free(cnp, sizeof(*cnp));
    253  1.36   pooka }
    254  1.36   pooka 
    255  1.36   pooka /* hey baby, what's your namei? */
    256  1.36   pooka int
    257  1.36   pooka rump_namei(uint32_t op, uint32_t flags, const char *namep,
    258  1.36   pooka 	struct vnode **dvpp, struct vnode **vpp, struct componentname **cnpp)
    259  1.36   pooka {
    260  1.36   pooka 	struct nameidata nd;
    261  1.36   pooka 	int rv;
    262  1.36   pooka 
    263  1.36   pooka 	NDINIT(&nd, op, flags, UIO_SYSSPACE, namep);
    264  1.36   pooka 	rv = namei(&nd);
    265  1.36   pooka 	if (rv)
    266  1.36   pooka 		return rv;
    267  1.36   pooka 
    268  1.36   pooka 	if (dvpp) {
    269  1.36   pooka 		KASSERT(flags & LOCKPARENT);
    270  1.36   pooka 		*dvpp = nd.ni_dvp;
    271  1.36   pooka 	} else {
    272  1.36   pooka 		KASSERT((flags & LOCKPARENT) == 0);
    273  1.36   pooka 	}
    274  1.36   pooka 
    275  1.36   pooka 	if (vpp) {
    276  1.36   pooka 		*vpp = nd.ni_vp;
    277   1.1   pooka 	} else {
    278  1.36   pooka 		if (nd.ni_vp) {
    279  1.36   pooka 			if (flags & LOCKLEAF)
    280  1.36   pooka 				vput(nd.ni_vp);
    281  1.36   pooka 			else
    282  1.36   pooka 				vrele(nd.ni_vp);
    283  1.36   pooka 		}
    284   1.1   pooka 	}
    285  1.36   pooka 
    286  1.36   pooka 	if (cnpp) {
    287  1.36   pooka 		struct componentname *cnp;
    288  1.36   pooka 
    289  1.36   pooka 		cnp = kmem_alloc(sizeof(*cnp), KM_SLEEP);
    290  1.36   pooka 		memcpy(cnp, &nd.ni_cnd, sizeof(*cnp));
    291  1.36   pooka 		*cnpp = cnp;
    292  1.36   pooka 	} else if (nd.ni_cnd.cn_flags & HASBUF) {
    293  1.36   pooka 		panic("%s: pathbuf mismatch", __func__);
    294  1.36   pooka 	}
    295  1.36   pooka 
    296  1.36   pooka 	return rv;
    297   1.1   pooka }
    298   1.1   pooka 
    299   1.2   pooka static struct fakeblk *
    300   1.2   pooka _rump_fakeblk_find(const char *path)
    301   1.2   pooka {
    302   1.2   pooka 	char buf[MAXPATHLEN];
    303   1.2   pooka 	struct fakeblk *fblk;
    304   1.3   pooka 	int error;
    305   1.2   pooka 
    306   1.3   pooka 	if (rumpuser_realpath(path, buf, &error) == NULL)
    307   1.3   pooka 		return NULL;
    308   1.2   pooka 
    309   1.2   pooka 	LIST_FOREACH(fblk, &fakeblks, entries)
    310   1.2   pooka 		if (strcmp(fblk->path, buf) == 0)
    311   1.2   pooka 			return fblk;
    312   1.2   pooka 
    313   1.2   pooka 	return NULL;
    314   1.2   pooka }
    315   1.2   pooka 
    316   1.2   pooka int
    317   1.2   pooka rump_fakeblk_register(const char *path)
    318   1.2   pooka {
    319   1.2   pooka 	char buf[MAXPATHLEN];
    320   1.2   pooka 	struct fakeblk *fblk;
    321   1.3   pooka 	int error;
    322   1.2   pooka 
    323   1.2   pooka 	if (_rump_fakeblk_find(path))
    324   1.2   pooka 		return EEXIST;
    325   1.2   pooka 
    326   1.3   pooka 	if (rumpuser_realpath(path, buf, &error) == NULL)
    327   1.3   pooka 		return error;
    328   1.3   pooka 
    329  1.28   pooka 	fblk = kmem_alloc(sizeof(struct fakeblk), KM_NOSLEEP);
    330   1.2   pooka 	if (fblk == NULL)
    331   1.2   pooka 		return ENOMEM;
    332   1.2   pooka 
    333   1.3   pooka 	strlcpy(fblk->path, buf, MAXPATHLEN);
    334   1.2   pooka 	LIST_INSERT_HEAD(&fakeblks, fblk, entries);
    335   1.2   pooka 
    336   1.2   pooka 	return 0;
    337   1.2   pooka }
    338   1.2   pooka 
    339   1.2   pooka int
    340   1.2   pooka rump_fakeblk_find(const char *path)
    341   1.2   pooka {
    342   1.2   pooka 
    343   1.2   pooka 	return _rump_fakeblk_find(path) != NULL;
    344   1.2   pooka }
    345   1.2   pooka 
    346   1.2   pooka void
    347   1.2   pooka rump_fakeblk_deregister(const char *path)
    348   1.2   pooka {
    349   1.2   pooka 	struct fakeblk *fblk;
    350   1.2   pooka 
    351   1.2   pooka 	fblk = _rump_fakeblk_find(path);
    352   1.2   pooka 	if (fblk == NULL)
    353   1.3   pooka 		return;
    354   1.2   pooka 
    355   1.2   pooka 	LIST_REMOVE(fblk, entries);
    356  1.28   pooka 	kmem_free(fblk, sizeof(*fblk));
    357   1.2   pooka }
    358   1.4   pooka 
    359   1.4   pooka void
    360   1.4   pooka rump_getvninfo(struct vnode *vp, enum vtype *vtype, voff_t *vsize, dev_t *vdev)
    361   1.4   pooka {
    362   1.4   pooka 
    363   1.4   pooka 	*vtype = vp->v_type;
    364   1.4   pooka 	*vsize = vp->v_size;
    365  1.30      ad 	if (vp->v_specnode)
    366   1.4   pooka 		*vdev = vp->v_rdev;
    367   1.4   pooka 	else
    368   1.4   pooka 		*vdev = 0;
    369   1.4   pooka }
    370   1.6   pooka 
    371   1.6   pooka struct vfsops *
    372   1.6   pooka rump_vfslist_iterate(struct vfsops *ops)
    373   1.6   pooka {
    374   1.6   pooka 
    375   1.6   pooka 	if (ops == NULL)
    376   1.6   pooka 		return LIST_FIRST(&vfs_list);
    377   1.6   pooka 	else
    378   1.6   pooka 		return LIST_NEXT(ops, vfs_list);
    379   1.6   pooka }
    380   1.6   pooka 
    381   1.6   pooka struct vfsops *
    382   1.6   pooka rump_vfs_getopsbyname(const char *name)
    383   1.6   pooka {
    384   1.6   pooka 
    385   1.6   pooka 	return vfs_getopsbyname(name);
    386   1.6   pooka }
    387   1.7   pooka 
    388   1.8   pooka struct vattr*
    389   1.8   pooka rump_vattr_init()
    390   1.8   pooka {
    391   1.8   pooka 	struct vattr *vap;
    392   1.8   pooka 
    393  1.28   pooka 	vap = kmem_alloc(sizeof(struct vattr), KM_SLEEP);
    394   1.8   pooka 	vattr_null(vap);
    395   1.8   pooka 
    396   1.8   pooka 	return vap;
    397   1.8   pooka }
    398   1.8   pooka 
    399   1.8   pooka void
    400   1.8   pooka rump_vattr_settype(struct vattr *vap, enum vtype vt)
    401   1.8   pooka {
    402   1.8   pooka 
    403   1.8   pooka 	vap->va_type = vt;
    404   1.8   pooka }
    405   1.8   pooka 
    406   1.7   pooka void
    407   1.8   pooka rump_vattr_setmode(struct vattr *vap, mode_t mode)
    408   1.7   pooka {
    409   1.7   pooka 
    410   1.8   pooka 	vap->va_mode = mode;
    411   1.8   pooka }
    412   1.8   pooka 
    413   1.8   pooka void
    414   1.8   pooka rump_vattr_setrdev(struct vattr *vap, dev_t dev)
    415   1.8   pooka {
    416   1.8   pooka 
    417   1.8   pooka 	vap->va_rdev = dev;
    418   1.8   pooka }
    419   1.8   pooka 
    420   1.8   pooka void
    421   1.8   pooka rump_vattr_free(struct vattr *vap)
    422   1.8   pooka {
    423   1.8   pooka 
    424  1.28   pooka 	kmem_free(vap, sizeof(*vap));
    425   1.8   pooka }
    426   1.8   pooka 
    427   1.8   pooka void
    428   1.8   pooka rump_vp_incref(struct vnode *vp)
    429   1.8   pooka {
    430   1.8   pooka 
    431  1.32   pooka 	mutex_enter(&vp->v_interlock);
    432   1.8   pooka 	++vp->v_usecount;
    433  1.32   pooka 	mutex_exit(&vp->v_interlock);
    434   1.8   pooka }
    435   1.8   pooka 
    436   1.8   pooka int
    437   1.8   pooka rump_vp_getref(struct vnode *vp)
    438   1.8   pooka {
    439   1.8   pooka 
    440   1.8   pooka 	return vp->v_usecount;
    441   1.8   pooka }
    442   1.8   pooka 
    443   1.8   pooka void
    444   1.8   pooka rump_vp_decref(struct vnode *vp)
    445   1.8   pooka {
    446   1.8   pooka 
    447  1.32   pooka 	mutex_enter(&vp->v_interlock);
    448   1.8   pooka 	--vp->v_usecount;
    449  1.32   pooka 	mutex_exit(&vp->v_interlock);
    450  1.32   pooka }
    451  1.32   pooka 
    452  1.33   pooka /*
    453  1.33   pooka  * Really really recycle with a cherry on top.  We should be
    454  1.33   pooka  * extra-sure we can do this.  For example with p2k there is
    455  1.33   pooka  * no problem, since puffs in the kernel takes care of refcounting
    456  1.33   pooka  * for us.
    457  1.33   pooka  */
    458  1.32   pooka void
    459  1.33   pooka rump_vp_recycle_nokidding(struct vnode *vp)
    460  1.32   pooka {
    461  1.32   pooka 
    462  1.32   pooka 	mutex_enter(&vp->v_interlock);
    463  1.33   pooka 	vp->v_usecount = 1;
    464  1.32   pooka 	vclean(vp, DOCLOSE);
    465  1.34   pooka 	vrelel(vp, 0);
    466  1.32   pooka }
    467  1.32   pooka 
    468  1.32   pooka void
    469  1.32   pooka rump_vp_rele(struct vnode *vp)
    470  1.32   pooka {
    471  1.32   pooka 
    472  1.32   pooka 	vrele(vp);
    473   1.8   pooka }
    474   1.8   pooka 
    475   1.8   pooka struct uio *
    476   1.8   pooka rump_uio_setup(void *buf, size_t bufsize, off_t offset, enum rump_uiorw rw)
    477   1.8   pooka {
    478   1.8   pooka 	struct uio *uio;
    479   1.8   pooka 	enum uio_rw uiorw;
    480   1.8   pooka 
    481   1.8   pooka 	switch (rw) {
    482   1.8   pooka 	case RUMPUIO_READ:
    483   1.8   pooka 		uiorw = UIO_READ;
    484   1.8   pooka 		break;
    485   1.8   pooka 	case RUMPUIO_WRITE:
    486   1.8   pooka 		uiorw = UIO_WRITE;
    487   1.8   pooka 		break;
    488  1.11   pooka 	default:
    489  1.11   pooka 		panic("%s: invalid rw %d", __func__, rw);
    490   1.8   pooka 	}
    491   1.8   pooka 
    492  1.28   pooka 	uio = kmem_alloc(sizeof(struct uio), KM_SLEEP);
    493  1.28   pooka 	uio->uio_iov = kmem_alloc(sizeof(struct iovec), KM_SLEEP);
    494   1.8   pooka 
    495   1.8   pooka 	uio->uio_iov->iov_base = buf;
    496   1.8   pooka 	uio->uio_iov->iov_len = bufsize;
    497   1.8   pooka 
    498   1.8   pooka 	uio->uio_iovcnt = 1;
    499   1.8   pooka 	uio->uio_offset = offset;
    500   1.8   pooka 	uio->uio_resid = bufsize;
    501   1.8   pooka 	uio->uio_rw = uiorw;
    502   1.8   pooka 	uio->uio_vmspace = UIO_VMSPACE_SYS;
    503   1.8   pooka 
    504   1.8   pooka 	return uio;
    505   1.8   pooka }
    506   1.8   pooka 
    507   1.8   pooka size_t
    508   1.8   pooka rump_uio_getresid(struct uio *uio)
    509   1.8   pooka {
    510   1.8   pooka 
    511   1.8   pooka 	return uio->uio_resid;
    512   1.8   pooka }
    513   1.8   pooka 
    514   1.8   pooka off_t
    515   1.8   pooka rump_uio_getoff(struct uio *uio)
    516   1.8   pooka {
    517   1.8   pooka 
    518   1.8   pooka 	return uio->uio_offset;
    519   1.8   pooka }
    520   1.8   pooka 
    521   1.8   pooka size_t
    522   1.8   pooka rump_uio_free(struct uio *uio)
    523   1.8   pooka {
    524   1.8   pooka 	size_t resid;
    525   1.8   pooka 
    526   1.8   pooka 	resid = uio->uio_resid;
    527  1.28   pooka 	kmem_free(uio->uio_iov, sizeof(*uio->uio_iov));
    528  1.28   pooka 	kmem_free(uio, sizeof(*uio));
    529   1.8   pooka 
    530   1.8   pooka 	return resid;
    531   1.8   pooka }
    532   1.8   pooka 
    533   1.8   pooka void
    534   1.8   pooka rump_vp_lock_exclusive(struct vnode *vp)
    535   1.8   pooka {
    536   1.8   pooka 
    537   1.8   pooka 	/* we can skip vn_lock() */
    538   1.8   pooka 	VOP_LOCK(vp, LK_EXCLUSIVE);
    539   1.8   pooka }
    540   1.8   pooka 
    541   1.8   pooka void
    542   1.8   pooka rump_vp_lock_shared(struct vnode *vp)
    543   1.8   pooka {
    544   1.8   pooka 
    545   1.8   pooka 	VOP_LOCK(vp, LK_SHARED);
    546   1.8   pooka }
    547   1.8   pooka 
    548   1.8   pooka void
    549   1.8   pooka rump_vp_unlock(struct vnode *vp)
    550   1.8   pooka {
    551   1.8   pooka 
    552   1.8   pooka 	VOP_UNLOCK(vp, 0);
    553   1.8   pooka }
    554   1.8   pooka 
    555   1.8   pooka int
    556   1.8   pooka rump_vp_islocked(struct vnode *vp)
    557   1.8   pooka {
    558   1.8   pooka 
    559   1.8   pooka 	return VOP_ISLOCKED(vp);
    560   1.8   pooka }
    561   1.8   pooka 
    562  1.26   pooka void
    563  1.26   pooka rump_vp_interlock(struct vnode *vp)
    564  1.26   pooka {
    565  1.26   pooka 
    566  1.26   pooka 	mutex_enter(&vp->v_interlock);
    567  1.26   pooka }
    568  1.26   pooka 
    569   1.8   pooka int
    570  1.22   pooka rump_vfs_unmount(struct mount *mp, int mntflags)
    571   1.8   pooka {
    572   1.8   pooka 
    573  1.22   pooka 	return VFS_UNMOUNT(mp, mntflags);
    574   1.8   pooka }
    575   1.8   pooka 
    576   1.8   pooka int
    577  1.12   pooka rump_vfs_root(struct mount *mp, struct vnode **vpp, int lock)
    578   1.8   pooka {
    579  1.12   pooka 	int rv;
    580  1.12   pooka 
    581  1.12   pooka 	rv = VFS_ROOT(mp, vpp);
    582  1.12   pooka 	if (rv)
    583  1.12   pooka 		return rv;
    584  1.12   pooka 
    585  1.12   pooka 	if (!lock)
    586  1.12   pooka 		VOP_UNLOCK(*vpp, 0);
    587   1.8   pooka 
    588  1.12   pooka 	return 0;
    589   1.8   pooka }
    590   1.8   pooka 
    591   1.8   pooka int
    592  1.22   pooka rump_vfs_statvfs(struct mount *mp, struct statvfs *sbp)
    593   1.8   pooka {
    594   1.8   pooka 
    595  1.22   pooka 	return VFS_STATVFS(mp, sbp);
    596   1.8   pooka }
    597   1.8   pooka 
    598   1.8   pooka int
    599  1.22   pooka rump_vfs_sync(struct mount *mp, int wait, kauth_cred_t cred)
    600   1.8   pooka {
    601   1.8   pooka 
    602  1.22   pooka 	return VFS_SYNC(mp, wait ? MNT_WAIT : MNT_NOWAIT, cred);
    603   1.8   pooka }
    604   1.8   pooka 
    605   1.8   pooka int
    606   1.8   pooka rump_vfs_fhtovp(struct mount *mp, struct fid *fid, struct vnode **vpp)
    607   1.8   pooka {
    608   1.8   pooka 
    609   1.8   pooka 	return VFS_FHTOVP(mp, fid, vpp);
    610   1.8   pooka }
    611   1.8   pooka 
    612   1.8   pooka int
    613   1.8   pooka rump_vfs_vptofh(struct vnode *vp, struct fid *fid, size_t *fidsize)
    614   1.8   pooka {
    615   1.8   pooka 
    616   1.8   pooka 	return VFS_VPTOFH(vp, fid, fidsize);
    617   1.7   pooka }
    618  1.12   pooka 
    619  1.16   pooka /*ARGSUSED*/
    620  1.16   pooka void
    621  1.16   pooka rump_vfs_syncwait(struct mount *mp)
    622  1.16   pooka {
    623  1.16   pooka 	int n;
    624  1.16   pooka 
    625  1.16   pooka 	n = buf_syncwait();
    626  1.16   pooka 	if (n)
    627  1.16   pooka 		printf("syncwait: unsynced buffers: %d\n", n);
    628  1.16   pooka }
    629  1.16   pooka 
    630  1.50   pooka int
    631  1.50   pooka rump_vfs_load(struct modinfo **mi)
    632  1.50   pooka {
    633  1.50   pooka 
    634  1.50   pooka 	if (!module_compatible((*mi)->mi_version, __NetBSD_Version__))
    635  1.50   pooka 		return EPROGMISMATCH;
    636  1.50   pooka 
    637  1.50   pooka 	return (*mi)->mi_modcmd(MODULE_CMD_INIT, NULL);
    638  1.50   pooka }
    639  1.50   pooka 
    640  1.12   pooka void
    641  1.12   pooka rump_bioops_sync()
    642  1.12   pooka {
    643  1.12   pooka 
    644  1.12   pooka 	if (bioopsp)
    645  1.12   pooka 		bioopsp->io_sync(NULL);
    646  1.12   pooka }
    647  1.14   pooka 
    648  1.14   pooka struct lwp *
    649  1.14   pooka rump_setup_curlwp(pid_t pid, lwpid_t lid, int set)
    650  1.14   pooka {
    651  1.14   pooka 	struct lwp *l;
    652  1.14   pooka 	struct proc *p;
    653  1.14   pooka 
    654  1.37   pooka 	l = kmem_zalloc(sizeof(struct lwp), KM_SLEEP);
    655  1.53   pooka 	if (pid != 0) {
    656  1.53   pooka 		p = kmem_zalloc(sizeof(struct proc), KM_SLEEP);
    657  1.53   pooka 		p->p_cwdi = cwdinit();
    658  1.53   pooka 
    659  1.53   pooka 		p->p_stats = &rump_stats;
    660  1.53   pooka 		p->p_limit = &rump_limits;
    661  1.53   pooka 		p->p_pid = pid;
    662  1.53   pooka 		p->p_vmspace = &rump_vmspace;
    663  1.53   pooka 		p->p_fd = fd_init(NULL);
    664  1.53   pooka 	} else {
    665  1.53   pooka 		p = &proc0;
    666  1.53   pooka 	}
    667  1.37   pooka 
    668  1.14   pooka 	l->l_cred = rump_cred;
    669  1.14   pooka 	l->l_proc = p;
    670  1.53   pooka 	l->l_lid = lid;
    671  1.53   pooka 	l->l_fd = p->p_fd;
    672  1.38   pooka 
    673  1.14   pooka 	if (set)
    674  1.14   pooka 		rumpuser_set_curlwp(l);
    675  1.14   pooka 
    676  1.14   pooka 	return l;
    677  1.14   pooka }
    678  1.14   pooka 
    679  1.14   pooka void
    680  1.14   pooka rump_clear_curlwp()
    681  1.14   pooka {
    682  1.14   pooka 	struct lwp *l;
    683  1.14   pooka 
    684  1.14   pooka 	l = rumpuser_get_curlwp();
    685  1.53   pooka 	if (l->l_proc->p_pid != 0) {
    686  1.53   pooka 		fd_free();
    687  1.53   pooka 		cwdfree(l->l_proc->p_cwdi);
    688  1.53   pooka 		kmem_free(l->l_proc, sizeof(*l->l_proc));
    689  1.53   pooka 	}
    690  1.37   pooka 	kmem_free(l, sizeof(*l));
    691  1.14   pooka 	rumpuser_set_curlwp(NULL);
    692  1.14   pooka }
    693  1.14   pooka 
    694  1.14   pooka struct lwp *
    695  1.14   pooka rump_get_curlwp()
    696  1.14   pooka {
    697  1.14   pooka 	struct lwp *l;
    698  1.14   pooka 
    699  1.14   pooka 	l = rumpuser_get_curlwp();
    700  1.14   pooka 	if (l == NULL)
    701  1.14   pooka 		l = &lwp0;
    702  1.14   pooka 
    703  1.14   pooka 	return l;
    704  1.14   pooka }
    705  1.15   pooka 
    706  1.18   pooka int
    707  1.18   pooka rump_splfoo()
    708  1.18   pooka {
    709  1.18   pooka 
    710  1.21   pooka 	if (rumpuser_whatis_ipl() != RUMPUSER_IPL_INTR) {
    711  1.18   pooka 		rumpuser_rw_enter(&rumpspl, 0);
    712  1.21   pooka 		rumpuser_set_ipl(RUMPUSER_IPL_SPLFOO);
    713  1.21   pooka 	}
    714  1.18   pooka 
    715  1.18   pooka 	return 0;
    716  1.18   pooka }
    717  1.18   pooka 
    718  1.18   pooka static void
    719  1.18   pooka rump_intr_enter(void)
    720  1.18   pooka {
    721  1.18   pooka 
    722  1.21   pooka 	rumpuser_set_ipl(RUMPUSER_IPL_INTR);
    723  1.18   pooka 	rumpuser_rw_enter(&rumpspl, 1);
    724  1.18   pooka }
    725  1.18   pooka 
    726  1.18   pooka static void
    727  1.18   pooka rump_intr_exit(void)
    728  1.18   pooka {
    729  1.18   pooka 
    730  1.18   pooka 	rumpuser_rw_exit(&rumpspl);
    731  1.21   pooka 	rumpuser_clear_ipl(RUMPUSER_IPL_INTR);
    732  1.18   pooka }
    733  1.18   pooka 
    734  1.18   pooka void
    735  1.18   pooka rump_splx(int dummy)
    736  1.18   pooka {
    737  1.18   pooka 
    738  1.21   pooka 	if (rumpuser_whatis_ipl() != RUMPUSER_IPL_INTR) {
    739  1.21   pooka 		rumpuser_clear_ipl(RUMPUSER_IPL_SPLFOO);
    740  1.18   pooka 		rumpuser_rw_exit(&rumpspl);
    741  1.21   pooka 	}
    742  1.18   pooka }
    743  1.18   pooka 
    744  1.15   pooka void
    745  1.15   pooka rump_biodone(void *arg, size_t count, int error)
    746  1.15   pooka {
    747  1.15   pooka 	struct buf *bp = arg;
    748  1.15   pooka 
    749  1.15   pooka 	bp->b_resid = bp->b_bcount - count;
    750  1.15   pooka 	KASSERT(bp->b_resid >= 0);
    751  1.15   pooka 	bp->b_error = error;
    752  1.18   pooka 
    753  1.18   pooka 	rump_intr_enter();
    754  1.15   pooka 	biodone(bp);
    755  1.18   pooka 	rump_intr_exit();
    756  1.15   pooka }
    757