Home | History | Annotate | Line # | Download | only in ffs
ffs_vnops.c revision 1.107
      1 /*	$NetBSD: ffs_vnops.c,v 1.107 2008/12/22 12:18:48 ad Exp $	*/
      2 
      3 /*-
      4  * Copyright (c) 2008 The NetBSD Foundation, Inc.
      5  * All rights reserved.
      6  *
      7  * This code is derived from software contributed to The NetBSD Foundation
      8  * by Wasabi Systems, Inc.
      9  *
     10  * Redistribution and use in source and binary forms, with or without
     11  * modification, are permitted provided that the following conditions
     12  * are met:
     13  * 1. Redistributions of source code must retain the above copyright
     14  *    notice, this list of conditions and the following disclaimer.
     15  * 2. Redistributions in binary form must reproduce the above copyright
     16  *    notice, this list of conditions and the following disclaimer in the
     17  *    documentation and/or other materials provided with the distribution.
     18  *
     19  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29  * POSSIBILITY OF SUCH DAMAGE.
     30  */
     31 
     32 /*
     33  * Copyright (c) 1982, 1986, 1989, 1993
     34  *	The Regents of the University of California.  All rights reserved.
     35  *
     36  * Redistribution and use in source and binary forms, with or without
     37  * modification, are permitted provided that the following conditions
     38  * are met:
     39  * 1. Redistributions of source code must retain the above copyright
     40  *    notice, this list of conditions and the following disclaimer.
     41  * 2. Redistributions in binary form must reproduce the above copyright
     42  *    notice, this list of conditions and the following disclaimer in the
     43  *    documentation and/or other materials provided with the distribution.
     44  * 3. Neither the name of the University nor the names of its contributors
     45  *    may be used to endorse or promote products derived from this software
     46  *    without specific prior written permission.
     47  *
     48  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     49  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     50  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     51  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     52  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     53  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     54  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     55  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     56  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     57  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     58  * SUCH DAMAGE.
     59  *
     60  *	@(#)ffs_vnops.c	8.15 (Berkeley) 5/14/95
     61  */
     62 
     63 #include <sys/cdefs.h>
     64 __KERNEL_RCSID(0, "$NetBSD: ffs_vnops.c,v 1.107 2008/12/22 12:18:48 ad Exp $");
     65 
     66 #if defined(_KERNEL_OPT)
     67 #include "opt_ffs.h"
     68 #include "opt_wapbl.h"
     69 #endif
     70 
     71 #include <sys/param.h>
     72 #include <sys/systm.h>
     73 #include <sys/resourcevar.h>
     74 #include <sys/kernel.h>
     75 #include <sys/file.h>
     76 #include <sys/stat.h>
     77 #include <sys/buf.h>
     78 #include <sys/event.h>
     79 #include <sys/proc.h>
     80 #include <sys/mount.h>
     81 #include <sys/vnode.h>
     82 #include <sys/pool.h>
     83 #include <sys/signalvar.h>
     84 #include <sys/kauth.h>
     85 #include <sys/wapbl.h>
     86 #include <sys/fstrans.h>
     87 
     88 #include <miscfs/fifofs/fifo.h>
     89 #include <miscfs/genfs/genfs.h>
     90 #include <miscfs/specfs/specdev.h>
     91 
     92 #include <ufs/ufs/inode.h>
     93 #include <ufs/ufs/dir.h>
     94 #include <ufs/ufs/ufs_extern.h>
     95 #include <ufs/ufs/ufsmount.h>
     96 #include <ufs/ufs/ufs_wapbl.h>
     97 
     98 #include <ufs/ffs/fs.h>
     99 #include <ufs/ffs/ffs_extern.h>
    100 
    101 #include <uvm/uvm.h>
    102 
    103 /*
         * Global vfs data structures for ufs.
         *
         * ffs_vnodeop_entries pairs each vnode operation descriptor with the
         * function that implements it in this vector.  Most slots use the
         * shared ufs_* routines; read, write, fsync, reclaim, lock, unlock,
         * islocked and the six extended-attribute operations use ffs_*
         * routines, kqfilter/getpages/putpages use genfs_*, and bwrite uses
         * vn_bwrite.  The vop_default_desc slot is vn_default_error.  The
         * table is terminated by a { NULL, NULL } entry.
         *
         * ffs_vnodeop_opv_desc ties the table to ffs_vnodeop_p.
         * NOTE(review): presumably the VFS layer builds the vector that
         * ffs_vnodeop_p points to from this descriptor -- confirm.
         */
    104 int (**ffs_vnodeop_p)(void *);
    105 const struct vnodeopv_entry_desc ffs_vnodeop_entries[] = {
    106 	{ &vop_default_desc, vn_default_error },
    107 	{ &vop_lookup_desc, ufs_lookup },		/* lookup */
    108 	{ &vop_create_desc, ufs_create },		/* create */
    109 	{ &vop_whiteout_desc, ufs_whiteout },		/* whiteout */
    110 	{ &vop_mknod_desc, ufs_mknod },			/* mknod */
    111 	{ &vop_open_desc, ufs_open },			/* open */
    112 	{ &vop_close_desc, ufs_close },			/* close */
    113 	{ &vop_access_desc, ufs_access },		/* access */
    114 	{ &vop_getattr_desc, ufs_getattr },		/* getattr */
    115 	{ &vop_setattr_desc, ufs_setattr },		/* setattr */
    116 	{ &vop_read_desc, ffs_read },			/* read */
    117 	{ &vop_write_desc, ffs_write },			/* write */
    118 	{ &vop_ioctl_desc, ufs_ioctl },			/* ioctl */
    119 	{ &vop_fcntl_desc, ufs_fcntl },			/* fcntl */
    120 	{ &vop_poll_desc, ufs_poll },			/* poll */
    121 	{ &vop_kqfilter_desc, genfs_kqfilter },		/* kqfilter */
    122 	{ &vop_revoke_desc, ufs_revoke },		/* revoke */
    123 	{ &vop_mmap_desc, ufs_mmap },			/* mmap */
    124 	{ &vop_fsync_desc, ffs_fsync },			/* fsync */
    125 	{ &vop_seek_desc, ufs_seek },			/* seek */
    126 	{ &vop_remove_desc, ufs_remove },		/* remove */
    127 	{ &vop_link_desc, ufs_link },			/* link */
    128 	{ &vop_rename_desc, ufs_rename },		/* rename */
    129 	{ &vop_mkdir_desc, ufs_mkdir },			/* mkdir */
    130 	{ &vop_rmdir_desc, ufs_rmdir },			/* rmdir */
    131 	{ &vop_symlink_desc, ufs_symlink },		/* symlink */
    132 	{ &vop_readdir_desc, ufs_readdir },		/* readdir */
    133 	{ &vop_readlink_desc, ufs_readlink },		/* readlink */
    134 	{ &vop_abortop_desc, ufs_abortop },		/* abortop */
    135 	{ &vop_inactive_desc, ufs_inactive },		/* inactive */
    136 	{ &vop_reclaim_desc, ffs_reclaim },		/* reclaim */
    137 	{ &vop_lock_desc, ffs_lock },			/* lock */
    138 	{ &vop_unlock_desc, ffs_unlock },		/* unlock */
    139 	{ &vop_bmap_desc, ufs_bmap },			/* bmap */
    140 	{ &vop_strategy_desc, ufs_strategy },		/* strategy */
    141 	{ &vop_print_desc, ufs_print },			/* print */
    142 	{ &vop_islocked_desc, ffs_islocked },		/* islocked */
    143 	{ &vop_pathconf_desc, ufs_pathconf },		/* pathconf */
    144 	{ &vop_advlock_desc, ufs_advlock },		/* advlock */
    145 	{ &vop_bwrite_desc, vn_bwrite },		/* bwrite */
    146 	{ &vop_getpages_desc, genfs_getpages },		/* getpages */
    147 	{ &vop_putpages_desc, genfs_putpages },		/* putpages */
    148 	{ &vop_openextattr_desc, ffs_openextattr },	/* openextattr */
    149 	{ &vop_closeextattr_desc, ffs_closeextattr },	/* closeextattr */
    150 	{ &vop_getextattr_desc, ffs_getextattr },	/* getextattr */
    151 	{ &vop_setextattr_desc, ffs_setextattr },	/* setextattr */
    152 	{ &vop_listextattr_desc, ffs_listextattr },	/* listextattr */
    153 	{ &vop_deleteextattr_desc, ffs_deleteextattr },	/* deleteextattr */
    154 	{ NULL, NULL }
    155 };
    156 const struct vnodeopv_desc ffs_vnodeop_opv_desc =
    157 	{ &ffs_vnodeop_p, ffs_vnodeop_entries };
    158 
    159 int (**ffs_specop_p)(void *);
        /*
         * Operation table for the ffs_specop_p vector.  Most slots use the
         * spec_* routines; close/read/write use the ufsspec_* versions,
         * access/getattr/setattr/fcntl/inactive/print use ufs_*, and
         * fsync/reclaim/lock/unlock/islocked plus the six extended-attribute
         * operations use ffs_*.  bwrite uses vn_bwrite.  This table has no
         * whiteout entry.  The vop_default_desc slot is vn_default_error and
         * the table is terminated by a { NULL, NULL } entry.
         *
         * ffs_specop_opv_desc ties the table to ffs_specop_p.
         */
    160 const struct vnodeopv_entry_desc ffs_specop_entries[] = {
    161 	{ &vop_default_desc, vn_default_error },
    162 	{ &vop_lookup_desc, spec_lookup },		/* lookup */
    163 	{ &vop_create_desc, spec_create },		/* create */
    164 	{ &vop_mknod_desc, spec_mknod },		/* mknod */
    165 	{ &vop_open_desc, spec_open },			/* open */
    166 	{ &vop_close_desc, ufsspec_close },		/* close */
    167 	{ &vop_access_desc, ufs_access },		/* access */
    168 	{ &vop_getattr_desc, ufs_getattr },		/* getattr */
    169 	{ &vop_setattr_desc, ufs_setattr },		/* setattr */
    170 	{ &vop_read_desc, ufsspec_read },		/* read */
    171 	{ &vop_write_desc, ufsspec_write },		/* write */
    172 	{ &vop_ioctl_desc, spec_ioctl },		/* ioctl */
    173 	{ &vop_fcntl_desc, ufs_fcntl },			/* fcntl */
    174 	{ &vop_poll_desc, spec_poll },			/* poll */
    175 	{ &vop_kqfilter_desc, spec_kqfilter },		/* kqfilter */
    176 	{ &vop_revoke_desc, spec_revoke },		/* revoke */
    177 	{ &vop_mmap_desc, spec_mmap },			/* mmap */
    178 	{ &vop_fsync_desc, ffs_fsync },			/* fsync */
    179 	{ &vop_seek_desc, spec_seek },			/* seek */
    180 	{ &vop_remove_desc, spec_remove },		/* remove */
    181 	{ &vop_link_desc, spec_link },			/* link */
    182 	{ &vop_rename_desc, spec_rename },		/* rename */
    183 	{ &vop_mkdir_desc, spec_mkdir },		/* mkdir */
    184 	{ &vop_rmdir_desc, spec_rmdir },		/* rmdir */
    185 	{ &vop_symlink_desc, spec_symlink },		/* symlink */
    186 	{ &vop_readdir_desc, spec_readdir },		/* readdir */
    187 	{ &vop_readlink_desc, spec_readlink },		/* readlink */
    188 	{ &vop_abortop_desc, spec_abortop },		/* abortop */
    189 	{ &vop_inactive_desc, ufs_inactive },		/* inactive */
    190 	{ &vop_reclaim_desc, ffs_reclaim },		/* reclaim */
    191 	{ &vop_lock_desc, ffs_lock },			/* lock */
    192 	{ &vop_unlock_desc, ffs_unlock },		/* unlock */
    193 	{ &vop_bmap_desc, spec_bmap },			/* bmap */
    194 	{ &vop_strategy_desc, spec_strategy },		/* strategy */
    195 	{ &vop_print_desc, ufs_print },			/* print */
    196 	{ &vop_islocked_desc, ffs_islocked },		/* islocked */
    197 	{ &vop_pathconf_desc, spec_pathconf },		/* pathconf */
    198 	{ &vop_advlock_desc, spec_advlock },		/* advlock */
    199 	{ &vop_bwrite_desc, vn_bwrite },		/* bwrite */
    200 	{ &vop_getpages_desc, spec_getpages },		/* getpages */
    201 	{ &vop_putpages_desc, spec_putpages },		/* putpages */
    202 	{ &vop_openextattr_desc, ffs_openextattr },	/* openextattr */
    203 	{ &vop_closeextattr_desc, ffs_closeextattr },	/* closeextattr */
    204 	{ &vop_getextattr_desc, ffs_getextattr },	/* getextattr */
    205 	{ &vop_setextattr_desc, ffs_setextattr },	/* setextattr */
    206 	{ &vop_listextattr_desc, ffs_listextattr },	/* listextattr */
    207 	{ &vop_deleteextattr_desc, ffs_deleteextattr },	/* deleteextattr */
    208 	{ NULL, NULL }
    209 };
    210 const struct vnodeopv_desc ffs_specop_opv_desc =
    211 	{ &ffs_specop_p, ffs_specop_entries };
    212 
    213 int (**ffs_fifoop_p)(void *);
        /*
         * Operation table for the ffs_fifoop_p vector.  Most slots use the
         * fifo_* routines; close/read/write use the ufsfifo_* versions,
         * access/getattr/setattr/fcntl/inactive/print use ufs_*, and
         * fsync/reclaim/lock/unlock/islocked plus the six extended-attribute
         * operations use ffs_*.  bwrite uses vn_bwrite.  This table has
         * neither a whiteout nor a getpages entry.  The vop_default_desc slot
         * is vn_default_error and the table is terminated by a { NULL, NULL }
         * entry.
         *
         * ffs_fifoop_opv_desc ties the table to ffs_fifoop_p.
         */
    214 const struct vnodeopv_entry_desc ffs_fifoop_entries[] = {
    215 	{ &vop_default_desc, vn_default_error },
    216 	{ &vop_lookup_desc, fifo_lookup },		/* lookup */
    217 	{ &vop_create_desc, fifo_create },		/* create */
    218 	{ &vop_mknod_desc, fifo_mknod },		/* mknod */
    219 	{ &vop_open_desc, fifo_open },			/* open */
    220 	{ &vop_close_desc, ufsfifo_close },		/* close */
    221 	{ &vop_access_desc, ufs_access },		/* access */
    222 	{ &vop_getattr_desc, ufs_getattr },		/* getattr */
    223 	{ &vop_setattr_desc, ufs_setattr },		/* setattr */
    224 	{ &vop_read_desc, ufsfifo_read },		/* read */
    225 	{ &vop_write_desc, ufsfifo_write },		/* write */
    226 	{ &vop_ioctl_desc, fifo_ioctl },		/* ioctl */
    227 	{ &vop_fcntl_desc, ufs_fcntl },			/* fcntl */
    228 	{ &vop_poll_desc, fifo_poll },			/* poll */
    229 	{ &vop_kqfilter_desc, fifo_kqfilter },		/* kqfilter */
    230 	{ &vop_revoke_desc, fifo_revoke },		/* revoke */
    231 	{ &vop_mmap_desc, fifo_mmap },			/* mmap */
    232 	{ &vop_fsync_desc, ffs_fsync },			/* fsync */
    233 	{ &vop_seek_desc, fifo_seek },			/* seek */
    234 	{ &vop_remove_desc, fifo_remove },		/* remove */
    235 	{ &vop_link_desc, fifo_link },			/* link */
    236 	{ &vop_rename_desc, fifo_rename },		/* rename */
    237 	{ &vop_mkdir_desc, fifo_mkdir },		/* mkdir */
    238 	{ &vop_rmdir_desc, fifo_rmdir },		/* rmdir */
    239 	{ &vop_symlink_desc, fifo_symlink },		/* symlink */
    240 	{ &vop_readdir_desc, fifo_readdir },		/* readdir */
    241 	{ &vop_readlink_desc, fifo_readlink },		/* readlink */
    242 	{ &vop_abortop_desc, fifo_abortop },		/* abortop */
    243 	{ &vop_inactive_desc, ufs_inactive },		/* inactive */
    244 	{ &vop_reclaim_desc, ffs_reclaim },		/* reclaim */
    245 	{ &vop_lock_desc, ffs_lock },			/* lock */
    246 	{ &vop_unlock_desc, ffs_unlock },		/* unlock */
    247 	{ &vop_bmap_desc, fifo_bmap },			/* bmap */
    248 	{ &vop_strategy_desc, fifo_strategy },		/* strategy */
    249 	{ &vop_print_desc, ufs_print },			/* print */
    250 	{ &vop_islocked_desc, ffs_islocked },		/* islocked */
    251 	{ &vop_pathconf_desc, fifo_pathconf },		/* pathconf */
    252 	{ &vop_advlock_desc, fifo_advlock },		/* advlock */
    253 	{ &vop_bwrite_desc, vn_bwrite },		/* bwrite */
    254 	{ &vop_putpages_desc, fifo_putpages }, 		/* putpages */
    255 	{ &vop_openextattr_desc, ffs_openextattr },	/* openextattr */
    256 	{ &vop_closeextattr_desc, ffs_closeextattr },	/* closeextattr */
    257 	{ &vop_getextattr_desc, ffs_getextattr },	/* getextattr */
    258 	{ &vop_setextattr_desc, ffs_setextattr },	/* setextattr */
    259 	{ &vop_listextattr_desc, ffs_listextattr },	/* listextattr */
    260 	{ &vop_deleteextattr_desc, ffs_deleteextattr },	/* deleteextattr */
    261 	{ NULL, NULL }
    262 };
    263 const struct vnodeopv_desc ffs_fifoop_opv_desc =
    264 	{ &ffs_fifoop_p, ffs_fifoop_entries };
    265 
    266 #include <ufs/ufs/ufs_readwrite.c>
    267 
    268 int
    269 ffs_fsync(void *v)
    270 {
    271 	struct vop_fsync_args /* {
    272 		struct vnode *a_vp;
    273 		kauth_cred_t a_cred;
    274 		int a_flags;
    275 		off_t a_offlo;
    276 		off_t a_offhi;
    277 		struct lwp *a_l;
    278 	} */ *ap = v;
    279 	struct buf *bp;
    280 	int num, error, i;
    281 	struct indir ia[NIADDR + 1];
    282 	int bsize;
    283 	daddr_t blk_high;
    284 	struct vnode *vp;
    285 #ifdef WAPBL
    286 	struct mount *mp;
    287 #endif
    288 
    289 	vp = ap->a_vp;
    290 
    291 	fstrans_start(vp->v_mount, FSTRANS_LAZY);
    292 	/*
    293 	 * XXX no easy way to sync a range in a file with softdep.
    294 	 */
    295 	if ((ap->a_offlo == 0 && ap->a_offhi == 0) || DOINGSOFTDEP(vp) ||
    296 	    (vp->v_type != VREG)) {
    297 		int flags = ap->a_flags;
    298 		error = ffs_full_fsync(vp, flags);
    299 		goto out;
    300 	}
    301 
    302 	bsize = vp->v_mount->mnt_stat.f_iosize;
    303 	blk_high = ap->a_offhi / bsize;
    304 	if (ap->a_offhi % bsize != 0)
    305 		blk_high++;
    306 
    307 	/*
    308 	 * First, flush all pages in range.
    309 	 */
    310 
    311 	mutex_enter(&vp->v_interlock);
    312 	error = VOP_PUTPAGES(vp, trunc_page(ap->a_offlo),
    313 	    round_page(ap->a_offhi), PGO_CLEANIT |
    314 	    ((ap->a_flags & FSYNC_WAIT) ? PGO_SYNCIO : 0));
    315 	if (error) {
    316 		goto out;
    317 	}
    318 
    319 #ifdef WAPBL
    320 	mp = wapbl_vptomp(vp);
    321 	if (mp->mnt_wapbl) {
    322 		if (ap->a_flags & FSYNC_DATAONLY) {
    323 			fstrans_done(vp->v_mount);
    324 			return 0;
    325 		}
    326 		error = 0;
    327 		if (vp->v_tag == VT_UFS && VTOI(vp)->i_flag &
    328 		    (IN_ACCESS | IN_CHANGE | IN_UPDATE | IN_MODIFY |
    329 				 IN_MODIFIED | IN_ACCESSED)) {
    330 			error = UFS_WAPBL_BEGIN(mp);
    331 			if (error) {
    332 				fstrans_done(vp->v_mount);
    333 				return error;
    334 			}
    335 			error = ffs_update(vp, NULL, NULL,
    336 				(ap->a_flags & FSYNC_WAIT) ? UPDATE_WAIT : 0);
    337 			UFS_WAPBL_END(mp);
    338 		}
    339 		if (error || (ap->a_flags & FSYNC_NOLOG)) {
    340 			fstrans_done(vp->v_mount);
    341 			return error;
    342 		}
    343 		error = wapbl_flush(mp->mnt_wapbl, 0);
    344 		fstrans_done(vp->v_mount);
    345 		return error;
    346 	}
    347 #endif /* WAPBL */
    348 
    349 	/*
    350 	 * Then, flush indirect blocks.
    351 	 */
    352 
    353 	if (blk_high >= NDADDR) {
    354 		error = ufs_getlbns(vp, blk_high, ia, &num);
    355 		if (error)
    356 			goto out;
    357 
    358 		mutex_enter(&bufcache_lock);
    359 		for (i = 0; i < num; i++) {
    360 			if ((bp = incore(vp, ia[i].in_lbn)) == NULL)
    361 				continue;
    362 			if ((bp->b_cflags & BC_BUSY) != 0 ||
    363 			    (bp->b_oflags & BO_DELWRI) == 0)
    364 				continue;
    365 			bp->b_cflags |= BC_BUSY | BC_VFLUSH;
    366 			mutex_exit(&bufcache_lock);
    367 			bawrite(bp);
    368 			mutex_enter(&bufcache_lock);
    369 		}
    370 		mutex_exit(&bufcache_lock);
    371 	}
    372 
    373 	if (ap->a_flags & FSYNC_WAIT) {
    374 		mutex_enter(&vp->v_interlock);
    375 		while (vp->v_numoutput > 0)
    376 			cv_wait(&vp->v_cv, &vp->v_interlock);
    377 		mutex_exit(&vp->v_interlock);
    378 	}
    379 
    380 	error = ffs_update(vp, NULL, NULL,
    381 	    ((ap->a_flags & (FSYNC_WAIT | FSYNC_DATAONLY)) == FSYNC_WAIT)
    382 	    ? UPDATE_WAIT : 0);
    383 
    384 	if (error == 0 && ap->a_flags & FSYNC_CACHE) {
    385 		int l = 0;
    386 		VOP_IOCTL(VTOI(vp)->i_devvp, DIOCCACHESYNC, &l, FWRITE,
    387 			curlwp->l_cred);
    388 	}
    389 
    390 out:
    391 	fstrans_done(vp->v_mount);
    392 	return error;
    393 }
    394 
    395 /*
    396  * Synch an open file.  Called for VOP_FSYNC() and VFS_FSYNC().
    397  *
    398  * BEWARE: THIS ROUTINE ACCEPTS BOTH FFS AND NON-FFS VNODES.
         *
         * vp:    vnode to flush.  With FSYNC_VFS set in flags it is asserted
         *        to be a block device (VBLK) with v_specmountpoint set, and
         *        the mount is taken from v_specmountpoint; otherwise it is
         *        asserted to be a VT_UFS vnode and vp->v_mount is used.
         * flags: FSYNC_* bits.  This routine tests FSYNC_VFS, FSYNC_WAIT,
         *        FSYNC_RECLAIM, FSYNC_DATAONLY, FSYNC_NOLOG and FSYNC_CACHE.
         *
         * Returns 0 on success, otherwise the first error returned by
         * VOP_PUTPAGES(), UFS_WAPBL_BEGIN(), ffs_update(), wapbl_flush(),
         * bwrite() or softdep_sync_metadata().  The result of the final
         * DIOCCACHESYNC ioctl is not checked.
    399  */
    400 /* ARGSUSED */
    401 int
    402 ffs_full_fsync(struct vnode *vp, int flags)
    403 {
    404 	extern struct vfsops ffs_vfsops;
    405 	struct buf *bp, *nbp;
    406 	int error, passes, skipmeta, inodedeps_only, waitfor;
    407 	struct mount *mp;
    408 	bool ffsino;
    409 
    410 	error = 0;
    411 
        	/*
        	 * ffsino gates every ffs_update() call below.  It is always
        	 * true for a plain vnode; for FSYNC_VFS it is true only when
        	 * the file system mounted on the device uses ffs_vfsops.
        	 */
    412 	if ((flags & FSYNC_VFS) != 0) {
    413 		KASSERT(vp->v_specmountpoint != NULL);
    414 		mp = vp->v_specmountpoint;
    415 		ffsino = (mp->mnt_op == &ffs_vfsops);
    416 		KASSERT(vp->v_type == VBLK);
    417 	} else {
    418 		mp = vp->v_mount;
    419 		ffsino = true;
    420 		KASSERT(vp->v_tag == VT_UFS);
    421 	}
    422 
    423 	if (vp->v_type == VBLK &&
    424 	    vp->v_specmountpoint != NULL &&
    425 	    (vp->v_specmountpoint->mnt_flag & MNT_SOFTDEP))
    426 		softdep_fsync_mountdev(vp);
    427 
        	/*
        	 * The interlock taken here is released explicitly in the else
        	 * branch below when VOP_PUTPAGES() is not called.
        	 * NOTE(review): VOP_PUTPAGES() is presumably entered with the
        	 * interlock held and releases it itself -- confirm.
        	 */
    428 	mutex_enter(&vp->v_interlock);
    429 
        	/*
        	 * inodedeps_only is consulted at the end of the function: when
        	 * set, the final ffs_update() is issued without UPDATE_WAIT.
        	 */
    430 	inodedeps_only = DOINGSOFTDEP(vp) && (flags & FSYNC_RECLAIM)
    431 	    && UVM_OBJ_IS_CLEAN(&vp->v_uobj) && LIST_EMPTY(&vp->v_dirtyblkhd);
    432 
    433 	/*
    434 	 * Flush all dirty data associated with a vnode.
    435 	 */
    436 
    437 	if (vp->v_type == VREG || vp->v_type == VBLK) {
    438 		int pflags = PGO_ALLPAGES | PGO_CLEANIT;
    439 
    440 		if ((flags & FSYNC_WAIT))
    441 			pflags |= PGO_SYNCIO;
        		/* Regular files also have their pages freed while suspending. */
    442 		if (vp->v_type == VREG &&
    443 		    fstrans_getstate(mp) == FSTRANS_SUSPENDING)
    444 			pflags |= PGO_FREE;
    445 		error = VOP_PUTPAGES(vp, 0, 0, pflags);
    446 		if (error)
    447 			return error;
    448 	} else {
    449 		mutex_exit(&vp->v_interlock);
    450 	}
    451 
    452 #ifdef WAPBL
        	/*
        	 * When the mount has a WAPBL log, this branch always returns and
        	 * the buffer-flushing loop further down is never reached: the
        	 * inode is updated inside a log transaction if any of the listed
        	 * i_flag bits is set, and then the log is flushed.
        	 */
    453 	if (mp && mp->mnt_wapbl) {
    454 		error = 0;
    455 		if (flags & FSYNC_DATAONLY)
    456 			return error;
    457 
    458 		if (ffsino && VTOI(vp) && (VTOI(vp)->i_flag &
    459 		    (IN_ACCESS | IN_CHANGE | IN_UPDATE | IN_MODIFY |
    460 				 IN_MODIFIED | IN_ACCESSED))) {
    461 			error = UFS_WAPBL_BEGIN(mp);
    462 			if (error)
    463 				return error;
    464 			error = ffs_update(vp, NULL, NULL,
    465 				(flags & FSYNC_WAIT) ? UPDATE_WAIT : 0);
    466 			UFS_WAPBL_END(mp);
    467 		}
    468 		if (error || (flags & FSYNC_NOLOG))
    469 			return error;
    470 
    471 		/*
    472 		 * Don't flush the log if the vnode being flushed
    473 		 * contains no dirty buffers that could be in the log.
    474 		 */
    475 		if (!((flags & FSYNC_RECLAIM) &&
    476 		    LIST_EMPTY(&vp->v_dirtyblkhd))) {
    477 			error = wapbl_flush(mp->mnt_wapbl, 0);
    478 			if (error)
    479 				return error;
    480 		}
    481 
    482 		/*
    483 		 * XXX temporary workaround for "dirty bufs" panic in
    484 		 * vinvalbuf.  need a full fix for the v_numoutput
    485 		 * waiters issues.
    486 		 */
    487 		if (flags & FSYNC_WAIT) {
    488 			mutex_enter(&vp->v_interlock);
    489 			while (vp->v_numoutput)
    490 				cv_wait(&vp->v_cv, &vp->v_interlock);
    491 			mutex_exit(&vp->v_interlock);
    492 		}
    493 
    494 		return error;
    495 	}
    496 #endif /* WAPBL */
    497 
        	/*
        	 * passes bounds how many times the sweep below is retried when
        	 * dirty buffers remain after waiting.  With FSYNC_WAIT the first
        	 * sweep skips buffers whose b_lblkno is negative; skipmeta is
        	 * then cleared and a second sweep writes them as well.
        	 * NOTE(review): negative b_lblkno presumably marks indirect
        	 * (metadata) blocks -- confirm.
        	 */
    498 	passes = NIADDR + 1;
    499 	skipmeta = 0;
    500 	if (flags & FSYNC_WAIT)
    501 		skipmeta = 1;
    502 
    503 loop:
    504 	mutex_enter(&bufcache_lock);
        	/*
        	 * BC_SCANNED marks buffers already handled in this sweep.  It is
        	 * cleared on every dirty buffer first, so that restarting from
        	 * the head of the list after bufcache_lock was dropped does not
        	 * pick the same buffer twice.
        	 */
    505 	LIST_FOREACH(bp, &vp->v_dirtyblkhd, b_vnbufs) {
    506 		bp->b_cflags &= ~BC_SCANNED;
    507 	}
    508 	for (bp = LIST_FIRST(&vp->v_dirtyblkhd); bp; bp = nbp) {
    509 		nbp = LIST_NEXT(bp, b_vnbufs);
    510 		if (bp->b_cflags & (BC_BUSY | BC_SCANNED))
    511 			continue;
    512 		if ((bp->b_oflags & BO_DELWRI) == 0)
    513 			panic("ffs_fsync: not dirty");
    514 		if (skipmeta && bp->b_lblkno < 0)
    515 			continue;
    516 		bp->b_cflags |= BC_BUSY | BC_VFLUSH | BC_SCANNED;
    517 		mutex_exit(&bufcache_lock);
    518 		/*
    519 		 * On our final pass through, do all I/O synchronously
    520 		 * so that we can find out if our flush is failing
    521 		 * because of write errors.
    522 		 */
    523 		if (passes > 0 || !(flags & FSYNC_WAIT))
    524 			(void) bawrite(bp);
    525 		else if ((error = bwrite(bp)) != 0)
    526 			return (error);
    527 		/*
    528 		 * Since we unlocked during the I/O, we need
    529 		 * to start from a known point.
    530 		 */
    531 		mutex_enter(&bufcache_lock);
    532 		nbp = LIST_FIRST(&vp->v_dirtyblkhd);
    533 	}
    534 	mutex_exit(&bufcache_lock);
    535 	if (skipmeta) {
    536 		skipmeta = 0;
    537 		goto loop;
    538 	}
    539 
    540 	if (flags & FSYNC_WAIT) {
        		/* Wait until all output started on this vnode has completed. */
    541 		mutex_enter(&vp->v_interlock);
    542 		while (vp->v_numoutput) {
    543 			cv_wait(&vp->v_cv, &vp->v_interlock);
    544 		}
    545 		mutex_exit(&vp->v_interlock);
    546 
    547 		/*
    548 		 * Ensure that any filesystem metadata associated
    549 		 * with the vnode has been written.
    550 		 */
    551 		if ((error = softdep_sync_metadata(vp)) != 0)
    552 			return (error);
    553 
    554 		if (!LIST_EMPTY(&vp->v_dirtyblkhd)) {
    555 			/*
    556 			* Block devices associated with filesystems may
    557 			* have new I/O requests posted for them even if
    558 			* the vnode is locked, so no amount of trying will
    559 			* get them clean. Thus we give block devices a
    560 			* good effort, then just give up. For all other file
    561 			* types, go around and try again until it is clean.
    562 			*/
    563 			if (passes > 0) {
    564 				passes--;
    565 				goto loop;
    566 			}
    567 #ifdef DIAGNOSTIC
    568 			if (vp->v_type != VBLK)
    569 				vprint("ffs_fsync: dirty", vp);
    570 #endif
    571 		}
    572 	}
    573 
        	/* Choose whether the inode update below is waited for. */
    574 	if (inodedeps_only)
    575 		waitfor = 0;
    576 	else
    577 		waitfor = (flags & FSYNC_WAIT) ? UPDATE_WAIT : 0;
    578 
    579 	if (ffsino)
    580 		error = ffs_update(vp, NULL, NULL, waitfor);
    581 
        	/*
        	 * On request, issue DIOCCACHESYNC: directly on vp for FSYNC_VFS,
        	 * otherwise on the inode's i_devvp.  The ioctl result is ignored.
        	 */
    582 	if (error == 0 && flags & FSYNC_CACHE) {
    583 		int i = 0;
    584 		if ((flags & FSYNC_VFS) == 0) {
    585 			KASSERT(VTOI(vp) != NULL);
    586 			vp = VTOI(vp)->i_devvp;
    587 		}
    588 		VOP_IOCTL(vp, DIOCCACHESYNC, &i, FWRITE, curlwp->l_cred);
    589 	}
    590 
    591 	return error;
    592 }
    593 
    594 /*
    595  * Reclaim an inode so that it can be used for other purposes.
    596  */
    597 int
    598 ffs_reclaim(void *v)
    599 {
    600 	struct vop_reclaim_args /* {
    601 		struct vnode *a_vp;
    602 		struct lwp *a_l;
    603 	} */ *ap = v;
    604 	struct vnode *vp = ap->a_vp;
    605 	struct inode *ip = VTOI(vp);
    606 	struct mount *mp = vp->v_mount;
    607 	struct ufsmount *ump = ip->i_ump;
    608 	void *data;
    609 	int error;
    610 
    611 	fstrans_start(mp, FSTRANS_LAZY);
    612 	if ((error = ufs_reclaim(vp)) != 0) {
    613 		fstrans_done(mp);
    614 		return (error);
    615 	}
    616 	if (ip->i_din.ffs1_din != NULL) {
    617 		if (ump->um_fstype == UFS1)
    618 			pool_cache_put(ffs_dinode1_cache, ip->i_din.ffs1_din);
    619 		else
    620 			pool_cache_put(ffs_dinode2_cache, ip->i_din.ffs2_din);
    621 	}
    622 	/*
    623 	 * To interlock with ffs_sync().
    624 	 */
    625 	genfs_node_destroy(vp);
    626 	mutex_enter(&vp->v_interlock);
    627 	data = vp->v_data;
    628 	vp->v_data = NULL;
    629 	mutex_exit(&vp->v_interlock);
    630 
    631 	/*
    632 	 * XXX MFS ends up here, too, to free an inode.  Should we create
    633 	 * XXX a separate pool for MFS inodes?
    634 	 */
    635 	pool_cache_put(ffs_inode_cache, data);
    636 	fstrans_done(mp);
    637 	return (0);
    638 }
    639 
#if 0
/*
 * getpages wrapper, currently compiled out.
 *
 * Rejects with EINVAL a PGO_OVERWRITE request on a soft-dependency vnode
 * whose offset or length is not block aligned; every other request is
 * passed straight to genfs_getpages().  When rejecting, v_interlock is
 * released unless PGO_LOCKED is set.
 */
int
ffs_getpages(void *v)
{
	struct vop_getpages_args /* {
		struct vnode *a_vp;
		voff_t a_offset;
		struct vm_page **a_m;
		int *a_count;
		int a_centeridx;
		vm_prot_t a_access_type;
		int a_advice;
		int a_flags;
	} */ *ap = v;
	struct vnode *vp = ap->a_vp;
	struct inode *ip = VTOI(vp);
	struct fs *fs = ip->i_fs;

	/*
	 * don't allow a softdep write to create pages for only part of a block.
	 * the dependency tracking requires that all pages be in memory for
	 * a block involved in a dependency.
	 */

	/* Not an overwrite: nothing to police. */
	if ((ap->a_flags & PGO_OVERWRITE) == 0)
		return genfs_getpages(v);

	/* Both the start and the length are block aligned. */
	if (blkoff(fs, ap->a_offset) == 0 &&
	    blkoff(fs, *ap->a_count << PAGE_SHIFT) == 0)
		return genfs_getpages(v);

	/* Partial blocks only matter with soft dependencies. */
	if (!DOINGSOFTDEP(ap->a_vp))
		return genfs_getpages(v);

	if ((ap->a_flags & PGO_LOCKED) == 0) {
		mutex_exit(&vp->v_interlock);
	}
	return EINVAL;
}
#endif
    676 
    677 /*
    678  * Return the last logical file offset that should be written for this file
    679  * if we're doing a write that ends at "size".
    680  */
    681 
    682 void
    683 ffs_gop_size(struct vnode *vp, off_t size, off_t *eobp, int flags)
    684 {
    685 	struct inode *ip = VTOI(vp);
    686 	struct fs *fs = ip->i_fs;
    687 	daddr_t olbn, nlbn;
    688 
    689 	olbn = lblkno(fs, ip->i_size);
    690 	nlbn = lblkno(fs, size);
    691 	if (nlbn < NDADDR && olbn <= nlbn) {
    692 		*eobp = fragroundup(fs, size);
    693 	} else {
    694 		*eobp = blkroundup(fs, size);
    695 	}
    696 }
    697 
    698 int
    699 ffs_openextattr(void *v)
    700 {
    701 	struct vop_openextattr_args /* {
    702 		struct vnode *a_vp;
    703 		kauth_cred_t a_cred;
    704 		struct proc *a_p;
    705 	} */ *ap = v;
    706 	struct inode *ip = VTOI(ap->a_vp);
    707 	struct fs *fs = ip->i_fs;
    708 
    709 	/* Not supported for UFS1 file systems. */
    710 	if (fs->fs_magic == FS_UFS1_MAGIC)
    711 		return (EOPNOTSUPP);
    712 
    713 	/* XXX Not implemented for UFS2 file systems. */
    714 	return (EOPNOTSUPP);
    715 }
    716 
    717 int
    718 ffs_closeextattr(void *v)
    719 {
    720 	struct vop_closeextattr_args /* {
    721 		struct vnode *a_vp;
    722 		int a_commit;
    723 		kauth_cred_t a_cred;
    724 		struct proc *a_p;
    725 	} */ *ap = v;
    726 	struct inode *ip = VTOI(ap->a_vp);
    727 	struct fs *fs = ip->i_fs;
    728 
    729 	/* Not supported for UFS1 file systems. */
    730 	if (fs->fs_magic == FS_UFS1_MAGIC)
    731 		return (EOPNOTSUPP);
    732 
    733 	/* XXX Not implemented for UFS2 file systems. */
    734 	return (EOPNOTSUPP);
    735 }
    736 
    737 int
    738 ffs_getextattr(void *v)
    739 {
    740 	struct vop_getextattr_args /* {
    741 		struct vnode *a_vp;
    742 		int a_attrnamespace;
    743 		const char *a_name;
    744 		struct uio *a_uio;
    745 		size_t *a_size;
    746 		kauth_cred_t a_cred;
    747 		struct proc *a_p;
    748 	} */ *ap = v;
    749 	struct vnode *vp = ap->a_vp;
    750 	struct inode *ip = VTOI(vp);
    751 	struct fs *fs = ip->i_fs;
    752 
    753 	if (fs->fs_magic == FS_UFS1_MAGIC) {
    754 #ifdef UFS_EXTATTR
    755 		int error;
    756 
    757 		fstrans_start(vp->v_mount, FSTRANS_SHARED);
    758 		error = ufs_getextattr(ap);
    759 		fstrans_done(vp->v_mount);
    760 		return error;
    761 #else
    762 		return (EOPNOTSUPP);
    763 #endif
    764 	}
    765 
    766 	/* XXX Not implemented for UFS2 file systems. */
    767 	return (EOPNOTSUPP);
    768 }
    769 
    770 int
    771 ffs_setextattr(void *v)
    772 {
    773 	struct vop_setextattr_args /* {
    774 		struct vnode *a_vp;
    775 		int a_attrnamespace;
    776 		const char *a_name;
    777 		struct uio *a_uio;
    778 		kauth_cred_t a_cred;
    779 		struct proc *a_p;
    780 	} */ *ap = v;
    781 	struct vnode *vp = ap->a_vp;
    782 	struct inode *ip = VTOI(vp);
    783 	struct fs *fs = ip->i_fs;
    784 
    785 	if (fs->fs_magic == FS_UFS1_MAGIC) {
    786 #ifdef UFS_EXTATTR
    787 		int error;
    788 
    789 		fstrans_start(vp->v_mount, FSTRANS_SHARED);
    790 		error = ufs_setextattr(ap);
    791 		fstrans_done(vp->v_mount);
    792 		return error;
    793 #else
    794 		return (EOPNOTSUPP);
    795 #endif
    796 	}
    797 
    798 	/* XXX Not implemented for UFS2 file systems. */
    799 	return (EOPNOTSUPP);
    800 }
    801 
    802 int
    803 ffs_listextattr(void *v)
    804 {
    805 	struct vop_listextattr_args /* {
    806 		struct vnode *a_vp;
    807 		int a_attrnamespace;
    808 		struct uio *a_uio;
    809 		size_t *a_size;
    810 		kauth_cred_t a_cred;
    811 		struct proc *a_p;
    812 	} */ *ap = v;
    813 	struct inode *ip = VTOI(ap->a_vp);
    814 	struct fs *fs = ip->i_fs;
    815 
    816 	/* Not supported for UFS1 file systems. */
    817 	if (fs->fs_magic == FS_UFS1_MAGIC)
    818 		return (EOPNOTSUPP);
    819 
    820 	/* XXX Not implemented for UFS2 file systems. */
    821 	return (EOPNOTSUPP);
    822 }
    823 
    824 int
    825 ffs_deleteextattr(void *v)
    826 {
    827 	struct vop_deleteextattr_args /* {
    828 		struct vnode *a_vp;
    829 		int a_attrnamespace;
    830 		kauth_cred_t a_cred;
    831 		struct proc *a_p;
    832 	} */ *ap = v;
    833 	struct vnode *vp = ap->a_vp;
    834 	struct inode *ip = VTOI(vp);
    835 	struct fs *fs = ip->i_fs;
    836 
    837 	if (fs->fs_magic == FS_UFS1_MAGIC) {
    838 #ifdef UFS_EXTATTR
    839 		int error;
    840 
    841 		fstrans_start(vp->v_mount, FSTRANS_SHARED);
    842 		error = ufs_deleteextattr(ap);
    843 		fstrans_done(vp->v_mount);
    844 		return error;
    845 #else
    846 		return (EOPNOTSUPP);
    847 #endif
    848 	}
    849 
    850 	/* XXX Not implemented for UFS2 file systems. */
    851 	return (EOPNOTSUPP);
    852 }
    853 
    854 /*
    855  * Lock the node.
    856  */
    857 int
    858 ffs_lock(void *v)
    859 {
    860 	struct vop_lock_args /* {
    861 		struct vnode *a_vp;
    862 		int a_flags;
    863 	} */ *ap = v;
    864 	struct vnode *vp = ap->a_vp;
    865 	struct mount *mp = vp->v_mount;
    866 	int flags = ap->a_flags;
    867 
    868 	if ((flags & LK_INTERLOCK) != 0) {
    869 		mutex_exit(&vp->v_interlock);
    870 		flags &= ~LK_INTERLOCK;
    871 	}
    872 
    873 	/*
    874 	 * Fake lock during file system suspension.
    875 	 */
    876 	if ((vp->v_type == VREG || vp->v_type == VDIR) &&
    877 	    fstrans_is_owner(mp) &&
    878 	    fstrans_getstate(mp) == FSTRANS_SUSPENDING) {
    879 		return 0;
    880 	}
    881 
    882 	return (vlockmgr(vp->v_vnlock, flags));
    883 }
    884 
    885 /*
    886  * Unlock the node.
    887  */
    888 int
    889 ffs_unlock(void *v)
    890 {
    891 	struct vop_unlock_args /* {
    892 		struct vnode *a_vp;
    893 		int a_flags;
    894 	} */ *ap = v;
    895 	struct vnode *vp = ap->a_vp;
    896 	struct mount *mp = vp->v_mount;
    897 
    898 	KASSERT(ap->a_flags == 0);
    899 
    900 	/*
    901 	 * Fake unlock during file system suspension.
    902 	 */
    903 	if ((vp->v_type == VREG || vp->v_type == VDIR) &&
    904 	    fstrans_is_owner(mp) &&
    905 	    fstrans_getstate(mp) == FSTRANS_SUSPENDING) {
    906 		return 0;
    907 	}
    908 	return (vlockmgr(vp->v_vnlock, LK_RELEASE));
    909 }
    910 
    911 /*
    912  * Return whether or not the node is locked.
    913  */
    914 int
    915 ffs_islocked(void *v)
    916 {
    917 	struct vop_islocked_args /* {
    918 		struct vnode *a_vp;
    919 	} */ *ap = v;
    920 	struct vnode *vp = ap->a_vp;
    921 
    922 	return (vlockstatus(vp->v_vnlock));
    923 }
    924