Home | History | Annotate | Line # | Download | only in puffs
puffs_node.c revision 1.9
      1 /*	$NetBSD: puffs_node.c,v 1.9 2008/01/02 11:48:43 ad Exp $	*/
      2 
      3 /*
      4  * Copyright (c) 2005, 2006, 2007  Antti Kantee.  All Rights Reserved.
      5  *
      6  * Development of this software was supported by the
      7  * Google Summer of Code program, the Ulla Tuominen Foundation
      8  * and the Finnish Cultural Foundation.
      9  *
     10  * Redistribution and use in source and binary forms, with or without
     11  * modification, are permitted provided that the following conditions
     12  * are met:
     13  * 1. Redistributions of source code must retain the above copyright
     14  *    notice, this list of conditions and the following disclaimer.
     15  * 2. Redistributions in binary form must reproduce the above copyright
     16  *    notice, this list of conditions and the following disclaimer in the
     17  *    documentation and/or other materials provided with the distribution.
     18  *
     19  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
     20  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     21  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     22  * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     23  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     24  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
     25  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     26  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     27  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     28  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     29  * SUCH DAMAGE.
     30  */
     31 
     32 #include <sys/cdefs.h>
     33 __KERNEL_RCSID(0, "$NetBSD: puffs_node.c,v 1.9 2008/01/02 11:48:43 ad Exp $");
     34 
     35 #include <sys/param.h>
     36 #include <sys/hash.h>
     37 #include <sys/kmem.h>
     38 #include <sys/malloc.h>
     39 #include <sys/mount.h>
     40 #include <sys/namei.h>
     41 #include <sys/vnode.h>
     42 
     43 #include <fs/puffs/puffs_msgif.h>
     44 #include <fs/puffs/puffs_sys.h>
     45 
     46 #include <miscfs/genfs/genfs_node.h>
     47 #include <miscfs/specfs/specdev.h>
     48 
     49 static const struct genfs_ops puffs_genfsops = {
     50 	.gop_size = puffs_gop_size,
     51 	.gop_write = genfs_gop_write,
     52 	.gop_markupdate = puffs_gop_markupdate,
     53 #if 0
     54 	.gop_alloc, should ask userspace
     55 #endif
     56 };
     57 
     58 static __inline struct puffs_node_hashlist
     59 	*puffs_cookie2hashlist(struct puffs_mount *, void *);
     60 static struct puffs_node *puffs_cookie2pnode(struct puffs_mount *, void *);
     61 
     62 struct pool puffs_pnpool;
     63 
     64 /*
     65  * Grab a vnode, intialize all the puffs-dependant stuff.
     66  */
     67 int
     68 puffs_getvnode(struct mount *mp, void *cookie, enum vtype type,
     69 	voff_t vsize, dev_t rdev, struct vnode **vpp)
     70 {
     71 	struct puffs_mount *pmp;
     72 	struct puffs_newcookie *pnc;
     73 	struct vnode *vp, *nvp;
     74 	struct puffs_node *pnode;
     75 	struct puffs_node_hashlist *plist;
     76 	int error;
     77 
     78 	pmp = MPTOPUFFSMP(mp);
     79 
     80 	error = EPROTO;
     81 	if (type <= VNON || type >= VBAD) {
     82 		puffs_senderr(pmp, PUFFS_ERR_MAKENODE, EINVAL,
     83 		    "bad node type", cookie);
     84 		goto bad;
     85 	}
     86 	if (vsize == VSIZENOTSET) {
     87 		puffs_senderr(pmp, PUFFS_ERR_MAKENODE, EINVAL,
     88 		    "VSIZENOTSET is not a valid size", cookie);
     89 		goto bad;
     90 	}
     91 
     92 	/*
     93 	 * XXX: there is a deadlock condition between vfs_busy() and
     94 	 * vnode locks.  For an unmounting file system the mountpoint
     95 	 * is frozen, but in unmount(FORCE) vflush() wants to access all
     96 	 * of the vnodes.  If we are here waiting for the mountpoint
     97 	 * lock while holding on to a vnode lock, well, we ain't
     98 	 * just pining for the fjords anymore.  If we release the
     99 	 * vnode lock, we will be in the situation "mount point
    100 	 * is dying" and panic() will ensue in insmntque.  So as a
    101 	 * temporary workaround, get a vnode without putting it on
    102 	 * the mount point list, check if mount point is still alive
    103 	 * and kicking and only then add the vnode to the list.
    104 	 */
    105 	error = getnewvnode(VT_PUFFS, NULL, puffs_vnodeop_p, &vp);
    106 	if (error)
    107 		goto bad;
    108 	vp->v_vnlock = NULL;
    109 	vp->v_type = type;
    110 
    111 	/*
    112 	 * Check what mount point isn't going away.  This will work
    113 	 * until we decide to remove biglock or make the kernel
    114 	 * preemptive.  But hopefully the real problem will be fixed
    115 	 * by then.
    116 	 *
    117 	 * XXX: yes, should call vfs_busy(), but thar be rabbits with
    118 	 * vicious streaks a mile wide ...
    119 	 *
    120 	 * XXX: there is a transient failure here: if someone is unmounting
    121 	 * the file system but doesn't succeed (due to it being busy),
    122 	 * we incorrectly fail new vnode allocation.  This is *very*
    123 	 * hard to fix with the current structure of file system unmounting.
    124 	 */
    125 	if (mp->mnt_iflag & IMNT_UNMOUNT) {
    126 		DPRINTF(("puffs_getvnode: mp %p unmount, unable to create "
    127 		    "vnode for cookie %p\n", mp, cookie));
    128 		ungetnewvnode(vp);
    129 		error = ENXIO;
    130 		goto bad;
    131 	}
    132 
    133 	/*
    134 	 * Creation should not fail after this point.  Or if it does,
    135 	 * care must be taken so that VOP_INACTIVE() isn't called.
    136 	 */
    137 
    138 	/* So mp is not dead yet.. good.. inform new vnode of its master */
    139 	mutex_enter(&mntvnode_lock);
    140 	TAILQ_INSERT_TAIL(&mp->mnt_vnodelist, vp, v_mntvnodes);
    141 	vp->v_mount = mp;
    142 	mutex_exit(&mntvnode_lock);
    143 
    144 	/*
    145 	 * clerical tasks & footwork
    146 	 */
    147 
    148 	/* default size */
    149 	uvm_vnp_setsize(vp, 0);
    150 
    151 	/* dances based on vnode type. almost ufs_vinit(), but not quite */
    152 	switch (type) {
    153 	case VCHR:
    154 	case VBLK:
    155 		/*
    156 		 * replace vnode operation vector with the specops vector.
    157 		 * our user server has very little control over the node
    158 		 * if it decides its a character or block special file
    159 		 */
    160 		vp->v_op = puffs_specop_p;
    161 
    162 		/* do the standard checkalias-dance */
    163 		if ((nvp = checkalias(vp, rdev, mp)) != NULL) {
    164 			/*
    165 			 * found: release & unallocate aliased
    166 			 * old (well, actually, new) node
    167 			 */
    168 			vp->v_op = spec_vnodeop_p;
    169 			vp->v_vflag &= ~VV_LOCKSWORK;
    170 			vgone(vp); /* cya */
    171 
    172 			/* init "new" vnode */
    173 			vp = nvp;
    174 			vp->v_vnlock = NULL;
    175 			vp->v_mount = mp;
    176 		}
    177 		break;
    178 
    179 	case VFIFO:
    180 		vp->v_op = puffs_fifoop_p;
    181 		break;
    182 
    183 	case VREG:
    184 		uvm_vnp_setsize(vp, vsize);
    185 		break;
    186 
    187 	case VDIR:
    188 	case VLNK:
    189 	case VSOCK:
    190 		break;
    191 	default:
    192 		panic("puffs_getvnode: invalid vtype %d", type);
    193 	}
    194 
    195 	pnode = pool_get(&puffs_pnpool, PR_WAITOK);
    196 	memset(pnode, 0, sizeof(struct puffs_node));
    197 
    198 	pnode->pn_cookie = cookie;
    199 	pnode->pn_refcount = 1;
    200 
    201 	/* insert cookie on list, take off of interlock list */
    202 	mutex_init(&pnode->pn_mtx, MUTEX_DEFAULT, IPL_NONE);
    203 	SLIST_INIT(&pnode->pn_sel.sel_klist);
    204 	plist = puffs_cookie2hashlist(pmp, cookie);
    205 	mutex_enter(&pmp->pmp_lock);
    206 	LIST_INSERT_HEAD(plist, pnode, pn_hashent);
    207 	if (cookie != pmp->pmp_root_cookie) {
    208 		LIST_FOREACH(pnc, &pmp->pmp_newcookie, pnc_entries) {
    209 			if (pnc->pnc_cookie == cookie) {
    210 				LIST_REMOVE(pnc, pnc_entries);
    211 				kmem_free(pnc, sizeof(struct puffs_newcookie));
    212 				break;
    213 			}
    214 		}
    215 		KASSERT(pnc != NULL);
    216 	}
    217 	mutex_exit(&pmp->pmp_lock);
    218 
    219 	vp->v_data = pnode;
    220 	vp->v_type = type;
    221 	pnode->pn_vp = vp;
    222 	pnode->pn_serversize = vsize;
    223 
    224 	genfs_node_init(vp, &puffs_genfsops);
    225 	*vpp = vp;
    226 
    227 	DPRINTF(("new vnode at %p, pnode %p, cookie %p\n", vp,
    228 	    pnode, pnode->pn_cookie));
    229 
    230 	return 0;
    231 
    232  bad:
    233 	/* remove staging cookie from list */
    234 	if (cookie != pmp->pmp_root_cookie) {
    235 		mutex_enter(&pmp->pmp_lock);
    236 		LIST_FOREACH(pnc, &pmp->pmp_newcookie, pnc_entries) {
    237 			if (pnc->pnc_cookie == cookie) {
    238 				LIST_REMOVE(pnc, pnc_entries);
    239 				kmem_free(pnc, sizeof(struct puffs_newcookie));
    240 				break;
    241 			}
    242 		}
    243 		KASSERT(pnc != NULL);
    244 		mutex_exit(&pmp->pmp_lock);
    245 	}
    246 
    247 	return error;
    248 }
    249 
    250 /* new node creating for creative vop ops (create, symlink, mkdir, mknod) */
    251 int
    252 puffs_newnode(struct mount *mp, struct vnode *dvp, struct vnode **vpp,
    253 	void *cookie, struct componentname *cnp, enum vtype type, dev_t rdev)
    254 {
    255 	struct puffs_mount *pmp = MPTOPUFFSMP(mp);
    256 	struct puffs_newcookie *pnc;
    257 	struct vnode *vp;
    258 	int error;
    259 
    260 	/* userspace probably has this as a NULL op */
    261 	if (cookie == NULL) {
    262 		error = EOPNOTSUPP;
    263 		return error;
    264 	}
    265 
    266 	/*
    267 	 * Check for previous node with the same designation.
    268 	 * Explicitly check the root node cookie, since it might be
    269 	 * reclaimed from the kernel when this check is made.
    270 	 */
    271 	mutex_enter(&pmp->pmp_lock);
    272 	if (cookie == pmp->pmp_root_cookie
    273 	    || puffs_cookie2pnode(pmp, cookie) != NULL) {
    274 		mutex_exit(&pmp->pmp_lock);
    275 		puffs_senderr(pmp, PUFFS_ERR_MAKENODE, EEXIST,
    276 		    "cookie exists", cookie);
    277 		return EPROTO;
    278 	}
    279 
    280 	LIST_FOREACH(pnc, &pmp->pmp_newcookie, pnc_entries) {
    281 		if (pnc->pnc_cookie == cookie) {
    282 			mutex_exit(&pmp->pmp_lock);
    283 			puffs_senderr(pmp, PUFFS_ERR_MAKENODE, EEXIST,
    284 			    "cookie exists", cookie);
    285 			return EPROTO;
    286 		}
    287 	}
    288 	pnc = kmem_alloc(sizeof(struct puffs_newcookie), KM_SLEEP);
    289 	pnc->pnc_cookie = cookie;
    290 	LIST_INSERT_HEAD(&pmp->pmp_newcookie, pnc, pnc_entries);
    291 	mutex_exit(&pmp->pmp_lock);
    292 
    293 	error = puffs_getvnode(dvp->v_mount, cookie, type, 0, rdev, &vp);
    294 	if (error)
    295 		return error;
    296 
    297 	vp->v_type = type;
    298 	vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
    299 	*vpp = vp;
    300 
    301 	if ((cnp->cn_flags & MAKEENTRY) && PUFFS_USE_NAMECACHE(pmp))
    302 		cache_enter(dvp, vp, cnp);
    303 
    304 	return 0;
    305 }
    306 
    307 void
    308 puffs_putvnode(struct vnode *vp)
    309 {
    310 	struct puffs_mount *pmp;
    311 	struct puffs_node *pnode;
    312 
    313 	pmp = VPTOPUFFSMP(vp);
    314 	pnode = VPTOPP(vp);
    315 
    316 #ifdef DIAGNOSTIC
    317 	if (vp->v_tag != VT_PUFFS)
    318 		panic("puffs_putvnode: %p not a puffs vnode", vp);
    319 #endif
    320 
    321 	LIST_REMOVE(pnode, pn_hashent);
    322 	genfs_node_destroy(vp);
    323 	puffs_releasenode(pnode);
    324 	vp->v_data = NULL;
    325 
    326 	return;
    327 }
    328 
    329 static __inline struct puffs_node_hashlist *
    330 puffs_cookie2hashlist(struct puffs_mount *pmp, void *cookie)
    331 {
    332 	uint32_t hash;
    333 
    334 	hash = hash32_buf(&cookie, sizeof(void *), HASH32_BUF_INIT);
    335 	return &pmp->pmp_pnodehash[hash % pmp->pmp_npnodehash];
    336 }
    337 
    338 /*
    339  * Translate cookie to puffs_node.  Caller must hold pmp_lock
    340  * and it will be held upon return.
    341  */
    342 static struct puffs_node *
    343 puffs_cookie2pnode(struct puffs_mount *pmp, void *cookie)
    344 {
    345 	struct puffs_node_hashlist *plist;
    346 	struct puffs_node *pnode;
    347 
    348 	plist = puffs_cookie2hashlist(pmp, cookie);
    349 	LIST_FOREACH(pnode, plist, pn_hashent) {
    350 		if (pnode->pn_cookie == cookie)
    351 			break;
    352 	}
    353 
    354 	return pnode;
    355 }
    356 
    357 /*
    358  * Make sure root vnode exists and reference it.  Does NOT lock.
    359  */
    360 static int
    361 puffs_makeroot(struct puffs_mount *pmp)
    362 {
    363 	struct vnode *vp;
    364 	int rv;
    365 
    366 	/*
    367 	 * pmp_lock must be held if vref()'ing or vrele()'ing the
    368 	 * root vnode.  the latter is controlled by puffs_inactive().
    369 	 *
    370 	 * pmp_root is set here and cleared in puffs_reclaim().
    371 	 */
    372  retry:
    373 	mutex_enter(&pmp->pmp_lock);
    374 	vp = pmp->pmp_root;
    375 	if (vp) {
    376 		mutex_enter(&vp->v_interlock);
    377 		mutex_exit(&pmp->pmp_lock);
    378 		if (vget(vp, LK_INTERLOCK) == 0)
    379 			return 0;
    380 	} else
    381 		mutex_exit(&pmp->pmp_lock);
    382 
    383 	/*
    384 	 * So, didn't have the magic root vnode available.
    385 	 * No matter, grab another and stuff it with the cookie.
    386 	 */
    387 	if ((rv = puffs_getvnode(pmp->pmp_mp, pmp->pmp_root_cookie,
    388 	    pmp->pmp_root_vtype, pmp->pmp_root_vsize, pmp->pmp_root_rdev, &vp)))
    389 		return rv;
    390 
    391 	/*
    392 	 * Someone magically managed to race us into puffs_getvnode?
    393 	 * Put our previous new vnode back and retry.
    394 	 */
    395 	mutex_enter(&pmp->pmp_lock);
    396 	if (pmp->pmp_root) {
    397 		mutex_exit(&pmp->pmp_lock);
    398 		puffs_putvnode(vp);
    399 		goto retry;
    400 	}
    401 
    402 	/* store cache */
    403 	vp->v_vflag |= VV_ROOT;
    404 	pmp->pmp_root = vp;
    405 	mutex_exit(&pmp->pmp_lock);
    406 
    407 	return 0;
    408 }
    409 
    410 /*
    411  * Locate the in-kernel vnode based on the cookie received given
    412  * from userspace.  Returns a vnode, if found, NULL otherwise.
    413  * The parameter "lock" control whether to lock the possible or
    414  * not.  Locking always might cause us to lock against ourselves
    415  * in situations where we want the vnode but don't care for the
    416  * vnode lock, e.g. file server issued putpages.
    417  */
    418 int
    419 puffs_cookie2vnode(struct puffs_mount *pmp, void *cookie, int lock,
    420 	int willcreate, struct vnode **vpp)
    421 {
    422 	struct puffs_node *pnode;
    423 	struct puffs_newcookie *pnc;
    424 	struct vnode *vp;
    425 	int vgetflags, rv;
    426 
    427 	/*
    428 	 * Handle root in a special manner, since we want to make sure
    429 	 * pmp_root is properly set.
    430 	 */
    431 	if (cookie == pmp->pmp_root_cookie) {
    432 		if ((rv = puffs_makeroot(pmp)))
    433 			return rv;
    434 		if (lock)
    435 			vn_lock(pmp->pmp_root, LK_EXCLUSIVE | LK_RETRY);
    436 
    437 		*vpp = pmp->pmp_root;
    438 		return 0;
    439 	}
    440 
    441 	mutex_enter(&pmp->pmp_lock);
    442 	pnode = puffs_cookie2pnode(pmp, cookie);
    443 	if (pnode == NULL) {
    444 		if (willcreate) {
    445 			pnc = kmem_alloc(sizeof(struct puffs_newcookie),
    446 			    KM_SLEEP);
    447 			pnc->pnc_cookie = cookie;
    448 			LIST_INSERT_HEAD(&pmp->pmp_newcookie, pnc, pnc_entries);
    449 		}
    450 		mutex_exit(&pmp->pmp_lock);
    451 		return PUFFS_NOSUCHCOOKIE;
    452 	}
    453 	vp = pnode->pn_vp;
    454 	mutex_enter(&vp->v_interlock);
    455 	mutex_exit(&pmp->pmp_lock);
    456 
    457 	vgetflags = LK_INTERLOCK;
    458 	if (lock)
    459 		vgetflags |= LK_EXCLUSIVE | LK_RETRY;
    460 	if ((rv = vget(vp, vgetflags)))
    461 		return rv;
    462 
    463 	*vpp = vp;
    464 	return 0;
    465 }
    466 
    467 void
    468 puffs_updatenode(struct puffs_node *pn, int flags, voff_t size)
    469 {
    470 	struct timespec ts;
    471 
    472 	if (flags == 0)
    473 		return;
    474 
    475 	nanotime(&ts);
    476 
    477 	if (flags & PUFFS_UPDATEATIME) {
    478 		pn->pn_mc_atime = ts;
    479 		pn->pn_stat |= PNODE_METACACHE_ATIME;
    480 	}
    481 	if (flags & PUFFS_UPDATECTIME) {
    482 		pn->pn_mc_ctime = ts;
    483 		pn->pn_stat |= PNODE_METACACHE_CTIME;
    484 	}
    485 	if (flags & PUFFS_UPDATEMTIME) {
    486 		pn->pn_mc_mtime = ts;
    487 		pn->pn_stat |= PNODE_METACACHE_MTIME;
    488 	}
    489 	if (flags & PUFFS_UPDATESIZE) {
    490 		pn->pn_mc_size = size;
    491 		pn->pn_stat |= PNODE_METACACHE_SIZE;
    492 	}
    493 }
    494 
    495 /*
    496  * Add reference to node.
    497  *  mutex held on entry and return
    498  */
    499 void
    500 puffs_referencenode(struct puffs_node *pn)
    501 {
    502 
    503 	KASSERT(mutex_owned(&pn->pn_mtx));
    504 	pn->pn_refcount++;
    505 }
    506 
    507 /*
    508  * Release pnode structure which dealing with references to the
    509  * puffs_node instead of the vnode.  Can't use vref()/vrele() on
    510  * the vnode there, since that causes the lovely VOP_INACTIVE(),
    511  * which in turn causes the lovely deadlock when called by the one
    512  * who is supposed to handle it.
    513  */
    514 void
    515 puffs_releasenode(struct puffs_node *pn)
    516 {
    517 
    518 	mutex_enter(&pn->pn_mtx);
    519 	if (--pn->pn_refcount == 0) {
    520 		mutex_exit(&pn->pn_mtx);
    521 		mutex_destroy(&pn->pn_mtx);
    522 		pool_put(&puffs_pnpool, pn);
    523 	} else {
    524 		mutex_exit(&pn->pn_mtx);
    525 	}
    526 }
    527