Home | History | Annotate | Line # | Download | only in nfs
nfs_node.c revision 1.116
      1  1.116     rmind /*	$NetBSD: nfs_node.c,v 1.116 2011/06/12 03:35:59 rmind Exp $	*/
      2   1.12       cgd 
      3    1.1       cgd /*
      4    1.9   mycroft  * Copyright (c) 1989, 1993
      5    1.9   mycroft  *	The Regents of the University of California.  All rights reserved.
      6    1.1       cgd  *
      7    1.1       cgd  * This code is derived from software contributed to Berkeley by
      8    1.1       cgd  * Rick Macklem at The University of Guelph.
      9    1.1       cgd  *
     10    1.1       cgd  * Redistribution and use in source and binary forms, with or without
     11    1.1       cgd  * modification, are permitted provided that the following conditions
     12    1.1       cgd  * are met:
     13    1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     14    1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     15    1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     16    1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     17    1.1       cgd  *    documentation and/or other materials provided with the distribution.
     18   1.70       agc  * 3. Neither the name of the University nor the names of its contributors
     19    1.1       cgd  *    may be used to endorse or promote products derived from this software
     20    1.1       cgd  *    without specific prior written permission.
     21    1.1       cgd  *
     22    1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     23    1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     24    1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     25    1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     26    1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     27    1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     28    1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     29    1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     30    1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     31    1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     32    1.1       cgd  * SUCH DAMAGE.
     33    1.1       cgd  *
     34   1.16      fvdl  *	@(#)nfs_node.c	8.6 (Berkeley) 5/22/95
     35    1.1       cgd  */
     36   1.47     lukem 
     37   1.47     lukem #include <sys/cdefs.h>
     38  1.116     rmind __KERNEL_RCSID(0, "$NetBSD: nfs_node.c,v 1.116 2011/06/12 03:35:59 rmind Exp $");
     39    1.1       cgd 
     40  1.107        ad #ifdef _KERNEL_OPT
     41   1.35     bjh21 #include "opt_nfs.h"
     42  1.107        ad #endif
     43   1.16      fvdl 
     44    1.4   mycroft #include <sys/param.h>
     45    1.4   mycroft #include <sys/systm.h>
     46    1.4   mycroft #include <sys/proc.h>
     47    1.4   mycroft #include <sys/mount.h>
     48    1.4   mycroft #include <sys/namei.h>
     49    1.4   mycroft #include <sys/vnode.h>
     50    1.4   mycroft #include <sys/kernel.h>
     51   1.28   thorpej #include <sys/pool.h>
     52   1.22      fvdl #include <sys/lock.h>
     53   1.48     lukem #include <sys/hash.h>
     54   1.84      elad #include <sys/kauth.h>
     55    1.1       cgd 
     56    1.9   mycroft #include <nfs/rpcv2.h>
     57   1.16      fvdl #include <nfs/nfsproto.h>
     58    1.4   mycroft #include <nfs/nfs.h>
     59    1.4   mycroft #include <nfs/nfsnode.h>
     60    1.4   mycroft #include <nfs/nfsmount.h>
     61   1.15  christos #include <nfs/nfs_var.h>
     62    1.1       cgd 
     63  1.104     pooka struct pool nfs_node_pool;
     64  1.104     pooka struct pool nfs_vattr_pool;
     65  1.108        ad static struct workqueue *nfs_sillyworkq;
     66   1.28   thorpej 
     67   1.41   tsutsui extern int prtactive;
     68    1.1       cgd 
     69  1.108        ad static void nfs_gop_size(struct vnode *, off_t, off_t *, int);
     70  1.108        ad static int nfs_gop_alloc(struct vnode *, off_t, off_t, int, kauth_cred_t);
     71  1.108        ad static int nfs_gop_write(struct vnode *, struct vm_page **, int, int);
     72  1.108        ad static void nfs_sillyworker(struct work *, void *);
     73   1.46       chs 
     74   1.80      yamt static const struct genfs_ops nfs_genfsops = {
     75   1.80      yamt 	.gop_size = nfs_gop_size,
     76   1.80      yamt 	.gop_alloc = nfs_gop_alloc,
     77   1.80      yamt 	.gop_write = nfs_gop_write,
     78   1.46       chs };
     79   1.46       chs 
     80    1.1       cgd /*
     81  1.105      matt  * Reinitialize inode hash table.
     82    1.1       cgd  */
     83   1.15  christos void
     84  1.110    cegger nfs_node_init(void)
     85    1.1       cgd {
     86  1.108        ad 
     87  1.104     pooka 	pool_init(&nfs_node_pool, sizeof(struct nfsnode), 0, 0, 0, "nfsnodepl",
     88  1.104     pooka 	    &pool_allocator_nointr, IPL_NONE);
     89  1.104     pooka 	pool_init(&nfs_vattr_pool, sizeof(struct vattr), 0, 0, 0, "nfsvapl",
     90  1.104     pooka 	    &pool_allocator_nointr, IPL_NONE);
     91  1.108        ad 	if (workqueue_create(&nfs_sillyworkq, "nfssilly", nfs_sillyworker,
     92  1.108        ad 	    NULL, PRI_NONE, IPL_NONE, 0) != 0) {
     93  1.108        ad 	    	panic("nfs_node_init");
     94  1.108        ad 	}
     95   1.31  jdolecek }
     96   1.31  jdolecek 
     97   1.31  jdolecek /*
     98  1.105      matt  * Free resources previously allocated in nfs_node_reinit().
     99   1.45       chs  */
    100  1.105      matt void
    101  1.110    cegger nfs_node_done(void)
    102  1.105      matt {
    103  1.108        ad 
    104  1.105      matt 	pool_destroy(&nfs_node_pool);
    105  1.105      matt 	pool_destroy(&nfs_vattr_pool);
    106  1.108        ad 	workqueue_destroy(nfs_sillyworkq);
    107  1.105      matt }
    108  1.105      matt 
    109  1.105      matt struct fh_match {
    110  1.105      matt 	nfsfh_t *fhm_fhp;
    111  1.105      matt 	size_t fhm_fhsize;
    112  1.105      matt 	size_t fhm_fhoffset;
    113  1.105      matt };
    114  1.105      matt 
    115  1.105      matt static int
    116  1.114     rmind nfs_compare_nodes(void *ctx, const void *parent, const void *node)
    117  1.105      matt {
    118  1.114     rmind 	const struct nfsnode * const pnp = parent;
    119  1.114     rmind 	const struct nfsnode * const np = node;
    120  1.105      matt 
    121  1.105      matt 	if (pnp->n_fhsize != np->n_fhsize)
    122  1.105      matt 		return np->n_fhsize - pnp->n_fhsize;
    123   1.45       chs 
    124  1.105      matt 	return memcmp(np->n_fhp, pnp->n_fhp, np->n_fhsize);
    125  1.105      matt }
    126  1.105      matt 
    127  1.105      matt static int
    128  1.114     rmind nfs_compare_node_fh(void *ctx, const void *b, const void *key)
    129   1.45       chs {
    130  1.114     rmind 	const struct nfsnode * const pnp = b;
    131  1.105      matt 	const struct fh_match * const fhm = key;
    132   1.45       chs 
    133  1.105      matt 	if (pnp->n_fhsize != fhm->fhm_fhsize)
    134  1.105      matt 		return fhm->fhm_fhsize - pnp->n_fhsize;
    135   1.79     perry 
    136  1.105      matt 	return memcmp(fhm->fhm_fhp, pnp->n_fhp, pnp->n_fhsize);
    137   1.45       chs }
    138   1.45       chs 
    139  1.114     rmind static const rb_tree_ops_t nfs_node_rbtree_ops = {
    140  1.105      matt 	.rbto_compare_nodes = nfs_compare_nodes,
    141  1.105      matt 	.rbto_compare_key = nfs_compare_node_fh,
    142  1.114     rmind 	.rbto_node_offset = offsetof(struct nfsnode, n_rbnode),
    143  1.114     rmind 	.rbto_context = NULL
    144  1.105      matt };
    145  1.105      matt 
    146   1.31  jdolecek void
    147  1.105      matt nfs_rbtinit(struct nfsmount *nmp)
    148   1.31  jdolecek {
    149  1.114     rmind 
    150  1.105      matt 	rb_tree_init(&nmp->nm_rbtree, &nfs_node_rbtree_ops);
    151  1.105      matt }
    152  1.104     pooka 
    153    1.1       cgd /*
    154    1.1       cgd  * Look up a vnode/nfsnode by file handle.
    155    1.1       cgd  * Callers must check for mount points!!
    156    1.1       cgd  * In all cases, a pointer to a
    157    1.1       cgd  * nfsnode structure is returned.
    158    1.1       cgd  */
    159   1.15  christos int
    160  1.114     rmind nfs_nget1(struct mount *mntp, nfsfh_t *fhp, int fhsize, struct nfsnode **npp,
    161  1.114     rmind     int lkflags)
    162    1.1       cgd {
    163  1.105      matt 	struct nfsnode *np;
    164   1.33  augustss 	struct vnode *vp;
    165  1.105      matt 	struct nfsmount *nmp = VFSTONFS(mntp);
    166    1.1       cgd 	int error;
    167  1.105      matt 	struct fh_match fhm;
    168  1.105      matt 
    169  1.105      matt 	fhm.fhm_fhp = fhp;
    170  1.105      matt 	fhm.fhm_fhsize = fhsize;
    171    1.1       cgd 
    172    1.1       cgd loop:
    173  1.105      matt 	rw_enter(&nmp->nm_rbtlock, RW_READER);
    174  1.114     rmind 	np = rb_tree_find_node(&nmp->nm_rbtree, &fhm);
    175  1.114     rmind 	if (np != NULL) {
    176    1.1       cgd 		vp = NFSTOV(np);
    177  1.116     rmind 		mutex_enter(vp->v_interlock);
    178  1.105      matt 		rw_exit(&nmp->nm_rbtlock);
    179  1.113   hannken 		error = vget(vp, LK_EXCLUSIVE | lkflags);
    180   1.75      yamt 		if (error == EBUSY)
    181   1.75      yamt 			return error;
    182   1.75      yamt 		if (error)
    183    1.1       cgd 			goto loop;
    184    1.1       cgd 		*npp = np;
    185    1.1       cgd 		return(0);
    186    1.1       cgd 	}
    187  1.105      matt 	rw_exit(&nmp->nm_rbtlock);
    188  1.100        ad 
    189  1.116     rmind 	error = getnewvnode(VT_NFS, mntp, nfsv2_vnodeop_p, NULL, &vp);
    190   1.15  christos 	if (error) {
    191    1.1       cgd 		*npp = 0;
    192    1.1       cgd 		return (error);
    193    1.1       cgd 	}
    194   1.28   thorpej 	np = pool_get(&nfs_node_pool, PR_WAITOK);
    195   1.38       chs 	memset(np, 0, sizeof *np);
    196    1.1       cgd 	np->n_vnode = vp;
    197   1.38       chs 
    198    1.1       cgd 	/*
    199    1.1       cgd 	 * Insert the nfsnode in the hash queue for its new file handle
    200    1.1       cgd 	 */
    201   1.46       chs 
    202   1.16      fvdl 	if (fhsize > NFS_SMALLFH) {
    203   1.98      yamt 		np->n_fhp = kmem_alloc(fhsize, KM_SLEEP);
    204   1.16      fvdl 	} else
    205   1.16      fvdl 		np->n_fhp = &np->n_fh;
    206   1.38       chs 	memcpy(np->n_fhp, fhp, fhsize);
    207   1.16      fvdl 	np->n_fhsize = fhsize;
    208   1.30      fvdl 	np->n_accstamp = -1;
    209   1.28   thorpej 	np->n_vattr = pool_get(&nfs_vattr_pool, PR_WAITOK);
    210   1.71      fvdl 
    211  1.105      matt 	rw_enter(&nmp->nm_rbtlock, RW_WRITER);
    212  1.105      matt 	if (NULL != rb_tree_find_node(&nmp->nm_rbtree, &fhm)) {
    213  1.105      matt 		rw_exit(&nmp->nm_rbtlock);
    214  1.100        ad 		if (fhsize > NFS_SMALLFH) {
    215  1.100        ad 			kmem_free(np->n_fhp, fhsize);
    216  1.100        ad 		}
    217  1.100        ad 		pool_put(&nfs_vattr_pool, np->n_vattr);
    218  1.100        ad 		pool_put(&nfs_node_pool, np);
    219  1.100        ad 		ungetnewvnode(vp);
    220  1.100        ad 		goto loop;
    221  1.100        ad 	}
    222  1.100        ad 	vp->v_data = np;
    223  1.100        ad 	genfs_node_init(vp, &nfs_genfsops);
    224   1.71      fvdl 	/*
    225   1.71      fvdl 	 * Initalize read/write creds to useful values. VOP_OPEN will
    226   1.71      fvdl 	 * overwrite these.
    227   1.71      fvdl 	 */
    228   1.85        ad 	np->n_rcred = curlwp->l_cred;
    229   1.84      elad 	kauth_cred_hold(np->n_rcred);
    230   1.85        ad 	np->n_wcred = curlwp->l_cred;
    231   1.84      elad 	kauth_cred_hold(np->n_wcred);
    232  1.112   hannken 	VOP_LOCK(vp, LK_EXCLUSIVE);
    233   1.74      yamt 	NFS_INVALIDATE_ATTRCACHE(np);
    234   1.74      yamt 	uvm_vnp_setsize(vp, 0);
    235  1.114     rmind 	(void)rb_tree_insert_node(&nmp->nm_rbtree, np);
    236  1.105      matt 	rw_exit(&nmp->nm_rbtlock);
    237  1.100        ad 
    238    1.1       cgd 	*npp = np;
    239    1.1       cgd 	return (0);
    240    1.1       cgd }
    241    1.1       cgd 
    242   1.15  christos int
    243  1.109       dsl nfs_inactive(void *v)
    244   1.15  christos {
    245    1.9   mycroft 	struct vop_inactive_args /* {
    246    1.9   mycroft 		struct vnode *a_vp;
    247   1.97        ad 		bool *a_recycle;
    248   1.15  christos 	} */ *ap = v;
    249   1.33  augustss 	struct nfsnode *np;
    250   1.33  augustss 	struct sillyrename *sp;
    251   1.40      fvdl 	struct vnode *vp = ap->a_vp;
    252    1.1       cgd 
    253   1.40      fvdl 	np = VTONFS(vp);
    254   1.40      fvdl 	if (vp->v_type != VDIR) {
    255   1.16      fvdl 		sp = np->n_sillyrename;
    256   1.18      fvdl 		np->n_sillyrename = (struct sillyrename *)0;
    257   1.18      fvdl 	} else
    258   1.44      fvdl 		sp = NULL;
    259   1.44      fvdl 	if (sp != NULL)
    260   1.97        ad 		nfs_vinvalbuf(vp, 0, sp->s_cred, curlwp, 1);
    261   1.97        ad 	*ap->a_recycle = (np->n_flag & NREMOVED) != 0;
    262   1.94      yamt 	np->n_flag &=
    263   1.94      yamt 	    (NMODIFIED | NFLUSHINPROG | NFLUSHWANT | NEOFVALID | NTRUNCDELAYED);
    264   1.76      yamt 
    265   1.76      yamt 	if (vp->v_type == VDIR && np->n_dircache)
    266   1.78      yamt 		nfs_invaldircache(vp,
    267   1.78      yamt 		    NFS_INVALDIRCACHE_FORCE | NFS_INVALDIRCACHE_KEEPEOF);
    268   1.76      yamt 
    269  1.111   hannken 	VOP_UNLOCK(vp);
    270   1.76      yamt 
    271   1.44      fvdl 	if (sp != NULL) {
    272  1.108        ad 		workqueue_enqueue(nfs_sillyworkq, &sp->s_work, NULL);
    273    1.1       cgd 	}
    274   1.59      fvdl 
    275    1.1       cgd 	return (0);
    276    1.1       cgd }
    277    1.1       cgd 
    278    1.1       cgd /*
    279    1.1       cgd  * Reclaim an nfsnode so that it can be used for other purposes.
    280    1.1       cgd  */
    281   1.15  christos int
    282  1.109       dsl nfs_reclaim(void *v)
    283   1.15  christos {
    284    1.9   mycroft 	struct vop_reclaim_args /* {
    285    1.9   mycroft 		struct vnode *a_vp;
    286   1.15  christos 	} */ *ap = v;
    287   1.33  augustss 	struct vnode *vp = ap->a_vp;
    288   1.33  augustss 	struct nfsnode *np = VTONFS(vp);
    289  1.105      matt 	struct nfsmount *nmp = VFSTONFS(vp->v_mount);
    290    1.1       cgd 
    291   1.99        ad 	if (prtactive && vp->v_usecount > 1)
    292    1.1       cgd 		vprint("nfs_reclaim: pushing active", vp);
    293   1.60  drochner 
    294  1.105      matt 	rw_enter(&nmp->nm_rbtlock, RW_WRITER);
    295  1.114     rmind 	rb_tree_remove_node(&nmp->nm_rbtree, np);
    296  1.105      matt 	rw_exit(&nmp->nm_rbtlock);
    297   1.16      fvdl 
    298   1.16      fvdl 	/*
    299   1.16      fvdl 	 * Free up any directory cookie structures and
    300   1.16      fvdl 	 * large file handle structures that might be associated with
    301   1.16      fvdl 	 * this nfs node.
    302   1.16      fvdl 	 */
    303  1.103      tron 	if (vp->v_type == VDIR && np->n_dircache != NULL) {
    304  1.103      tron 		nfs_invaldircache(vp, NFS_INVALDIRCACHE_FORCE);
    305  1.102        ad 		hashdone(np->n_dircache, HASH_LIST, nfsdirhashmask);
    306  1.103      tron 	}
    307   1.65      yamt 	KASSERT(np->n_dirgens == NULL);
    308   1.59      fvdl 
    309   1.59      fvdl 	if (np->n_fhsize > NFS_SMALLFH)
    310   1.98      yamt 		kmem_free(np->n_fhp, np->n_fhsize);
    311   1.16      fvdl 
    312   1.28   thorpej 	pool_put(&nfs_vattr_pool, np->n_vattr);
    313   1.59      fvdl 	if (np->n_rcred)
    314   1.84      elad 		kauth_cred_free(np->n_rcred);
    315   1.59      fvdl 
    316   1.59      fvdl 	if (np->n_wcred)
    317   1.84      elad 		kauth_cred_free(np->n_wcred);
    318   1.59      fvdl 
    319   1.90      yamt 	if (vp->v_type == VREG) {
    320   1.90      yamt 		mutex_destroy(&np->n_commitlock);
    321   1.90      yamt 	}
    322   1.91        ad 	genfs_node_destroy(vp);
    323   1.90      yamt 	pool_put(&nfs_node_pool, np);
    324   1.38       chs 	vp->v_data = NULL;
    325    1.1       cgd 	return (0);
    326   1.46       chs }
    327   1.46       chs 
    328   1.46       chs void
    329   1.87      yamt nfs_gop_size(struct vnode *vp, off_t size, off_t *eobp, int flags)
    330   1.46       chs {
    331   1.83      yamt 
    332   1.46       chs 	*eobp = MAX(size, vp->v_size);
    333   1.46       chs }
    334   1.46       chs 
    335   1.46       chs int
    336   1.87      yamt nfs_gop_alloc(struct vnode *vp, off_t off, off_t len, int flags,
    337   1.87      yamt     kauth_cred_t cred)
    338   1.46       chs {
    339   1.87      yamt 
    340   1.46       chs 	return 0;
    341   1.53       chs }
    342   1.53       chs 
    343   1.53       chs int
    344   1.53       chs nfs_gop_write(struct vnode *vp, struct vm_page **pgs, int npages, int flags)
    345   1.53       chs {
    346   1.53       chs 	int i;
    347   1.53       chs 
    348  1.116     rmind 	mutex_enter(vp->v_interlock);
    349   1.53       chs 	for (i = 0; i < npages; i++) {
    350   1.53       chs 		pmap_page_protect(pgs[i], VM_PROT_READ);
    351   1.53       chs 	}
    352  1.116     rmind 	mutex_exit(vp->v_interlock);
    353  1.116     rmind 
    354   1.53       chs 	return genfs_gop_write(vp, pgs, npages, flags);
    355    1.1       cgd }
    356  1.108        ad 
    357  1.108        ad /*
    358  1.108        ad  * Remove a silly file that was rename'd earlier
    359  1.108        ad  */
    360  1.108        ad static void
    361  1.108        ad nfs_sillyworker(struct work *work, void *arg)
    362  1.108        ad {
    363  1.108        ad 	struct sillyrename *sp;
    364  1.108        ad 	int error;
    365  1.108        ad 
    366  1.108        ad 	sp = (struct sillyrename *)work;
    367  1.108        ad 	error = vn_lock(sp->s_dvp, LK_EXCLUSIVE);
    368  1.108        ad 	if (error || sp->s_dvp->v_data == NULL) {
    369  1.108        ad 		/* XXX should recover */
    370  1.108        ad 		printf("%s: vp=%p error=%d\n", __func__, sp->s_dvp, error);
    371  1.108        ad 		if (error == 0) {
    372  1.108        ad 			vput(sp->s_dvp);
    373  1.108        ad 		} else {
    374  1.108        ad 			vrele(sp->s_dvp);
    375  1.108        ad 		}
    376  1.108        ad 	} else {
    377  1.108        ad 		nfs_removeit(sp);
    378  1.108        ad 		vput(sp->s_dvp);
    379  1.108        ad 	}
    380  1.108        ad 	kauth_cred_free(sp->s_cred);
    381  1.108        ad 	kmem_free(sp, sizeof(*sp));
    382  1.108        ad }
    383