Home | History | Annotate | Line # | Download | only in ffs
ffs_vnops.c revision 1.31.2.1
      1 /*	$NetBSD: ffs_vnops.c,v 1.31.2.1 2000/12/14 23:36:48 he Exp $	*/
      2 
      3 /*
      4  * Copyright (c) 1982, 1986, 1989, 1993
      5  *	The Regents of the University of California.  All rights reserved.
      6  *
      7  * Redistribution and use in source and binary forms, with or without
      8  * modification, are permitted provided that the following conditions
      9  * are met:
     10  * 1. Redistributions of source code must retain the above copyright
     11  *    notice, this list of conditions and the following disclaimer.
     12  * 2. Redistributions in binary form must reproduce the above copyright
     13  *    notice, this list of conditions and the following disclaimer in the
     14  *    documentation and/or other materials provided with the distribution.
     15  * 3. All advertising materials mentioning features or use of this software
     16  *    must display the following acknowledgement:
     17  *	This product includes software developed by the University of
     18  *	California, Berkeley and its contributors.
     19  * 4. Neither the name of the University nor the names of its contributors
     20  *    may be used to endorse or promote products derived from this software
     21  *    without specific prior written permission.
     22  *
     23  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     26  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     27  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     28  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     29  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     30  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     31  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     32  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     33  * SUCH DAMAGE.
     34  *
     35  *	@(#)ffs_vnops.c	8.15 (Berkeley) 5/14/95
     36  */
     37 
     38 #include <sys/param.h>
     39 #include <sys/systm.h>
     40 #include <sys/resourcevar.h>
     41 #include <sys/kernel.h>
     42 #include <sys/file.h>
     43 #include <sys/stat.h>
     44 #include <sys/buf.h>
     45 #include <sys/proc.h>
     46 #include <sys/mount.h>
     47 #include <sys/vnode.h>
     48 #include <sys/pool.h>
     49 #include <sys/signalvar.h>
     50 
     51 #include <vm/vm.h>
     52 
     53 #include <uvm/uvm_extern.h>
     54 
     55 #include <miscfs/fifofs/fifo.h>
     56 #include <miscfs/genfs/genfs.h>
     57 #include <miscfs/specfs/specdev.h>
     58 
     59 #include <ufs/ufs/quota.h>
     60 #include <ufs/ufs/inode.h>
     61 #include <ufs/ufs/dir.h>
     62 #include <ufs/ufs/ufs_extern.h>
     63 #include <ufs/ufs/ufsmount.h>
     64 
     65 #include <ufs/ffs/fs.h>
     66 #include <ufs/ffs/ffs_extern.h>
     67 
/*
 * Whole-file sync.  File-local: defined further down in this file and
 * called from ffs_fsync().
 */
static int ffs_full_fsync __P((void *));
     69 
/*
 * Global vfs data structures for ufs.
 *
 * ffs_vnodeop_entries is the general FFS vnode operations table; the
 * special-device and FIFO variants are declared separately in this file.
 * Each entry pairs an operation descriptor with the routine that
 * implements it, and the list is terminated by a NULL/NULL pair.
 * The first entry binds vop_default_desc to vn_default_error; presumably
 * that is what any operation not listed here resolves to -- confirm
 * against the vnode-operations setup code.
 *
 * Routines named ufs_* are shared UFS code, ffs_* are FFS specific.
 *
 * ffs_vnodeop_opv_desc ties the table to ffs_vnodeop_p.  Nothing in this
 * file assigns ffs_vnodeop_p, so it is presumably filled in elsewhere
 * from this descriptor.
 */
int (**ffs_vnodeop_p) __P((void *));
struct vnodeopv_entry_desc ffs_vnodeop_entries[] = {
	{ &vop_default_desc, vn_default_error },
	{ &vop_lookup_desc, ufs_lookup },		/* lookup */
	{ &vop_create_desc, ufs_create },		/* create */
	{ &vop_whiteout_desc, ufs_whiteout },		/* whiteout */
	{ &vop_mknod_desc, ufs_mknod },			/* mknod */
	{ &vop_open_desc, ufs_open },			/* open */
	{ &vop_close_desc, ufs_close },			/* close */
	{ &vop_access_desc, ufs_access },		/* access */
	{ &vop_getattr_desc, ufs_getattr },		/* getattr */
	{ &vop_setattr_desc, ufs_setattr },		/* setattr */
	{ &vop_read_desc, ffs_read },			/* read */
	{ &vop_write_desc, ffs_write },			/* write */
	{ &vop_lease_desc, ufs_lease_check },		/* lease */
	{ &vop_ioctl_desc, ufs_ioctl },			/* ioctl */
	{ &vop_fcntl_desc, ufs_fcntl },			/* fcntl */
	{ &vop_poll_desc, ufs_poll },			/* poll */
	{ &vop_revoke_desc, ufs_revoke },		/* revoke */
	{ &vop_mmap_desc, ufs_mmap },			/* mmap */
	{ &vop_fsync_desc, ffs_fsync },			/* fsync */
	{ &vop_seek_desc, ufs_seek },			/* seek */
	{ &vop_remove_desc, ufs_remove },		/* remove */
	{ &vop_link_desc, ufs_link },			/* link */
	{ &vop_rename_desc, ufs_rename },		/* rename */
	{ &vop_mkdir_desc, ufs_mkdir },			/* mkdir */
	{ &vop_rmdir_desc, ufs_rmdir },			/* rmdir */
	{ &vop_symlink_desc, ufs_symlink },		/* symlink */
	{ &vop_readdir_desc, ufs_readdir },		/* readdir */
	{ &vop_readlink_desc, ufs_readlink },		/* readlink */
	{ &vop_abortop_desc, ufs_abortop },		/* abortop */
	{ &vop_inactive_desc, ufs_inactive },		/* inactive */
	{ &vop_reclaim_desc, ffs_reclaim },		/* reclaim */
	{ &vop_lock_desc, ufs_lock },			/* lock */
	{ &vop_unlock_desc, ufs_unlock },		/* unlock */
	{ &vop_bmap_desc, ufs_bmap },			/* bmap */
	{ &vop_strategy_desc, ufs_strategy },		/* strategy */
	{ &vop_print_desc, ufs_print },			/* print */
	{ &vop_islocked_desc, ufs_islocked },		/* islocked */
	{ &vop_pathconf_desc, ufs_pathconf },		/* pathconf */
	{ &vop_advlock_desc, ufs_advlock },		/* advlock */
	{ &vop_blkatoff_desc, ffs_blkatoff },		/* blkatoff */
	{ &vop_valloc_desc, ffs_valloc },		/* valloc */
	{ &vop_balloc_desc, ffs_balloc },		/* balloc */
	{ &vop_reallocblks_desc, ffs_reallocblks },	/* reallocblks */
	{ &vop_vfree_desc, ffs_vfree },			/* vfree */
	{ &vop_truncate_desc, ffs_truncate },		/* truncate */
	{ &vop_update_desc, ffs_update },		/* update */
	{ &vop_bwrite_desc, vn_bwrite },		/* bwrite */
	{ (struct vnodeop_desc*)NULL, (int(*) __P((void*)))NULL }
};
struct vnodeopv_desc ffs_vnodeop_opv_desc =
	{ &ffs_vnodeop_p, ffs_vnodeop_entries };
    124 
/*
 * Vnode operations table built around the spec_* routines (presumably
 * for device special files that live on an FFS filesystem -- confirm
 * where ffs_specop_p is installed on a vnode).
 *
 * Most operations are handed straight to spec_*.  The ones that stay with
 * the filesystem are:
 *   - access, getattr, setattr, fcntl, print           -> ufs_*
 *   - inactive, lock, unlock, islocked                 -> ufs_*
 *   - fsync, reclaim, vfree, update                    -> ffs_*
 *   - close, read, write                               -> ufsspec_*
 * Unlike ffs_vnodeop_entries, this table has no whiteout or balloc entry.
 *
 * The list is terminated by a NULL/NULL pair; ffs_specop_opv_desc ties
 * the table to ffs_specop_p.
 */
int (**ffs_specop_p) __P((void *));
struct vnodeopv_entry_desc ffs_specop_entries[] = {
	{ &vop_default_desc, vn_default_error },
	{ &vop_lookup_desc, spec_lookup },		/* lookup */
	{ &vop_create_desc, spec_create },		/* create */
	{ &vop_mknod_desc, spec_mknod },		/* mknod */
	{ &vop_open_desc, spec_open },			/* open */
	{ &vop_close_desc, ufsspec_close },		/* close */
	{ &vop_access_desc, ufs_access },		/* access */
	{ &vop_getattr_desc, ufs_getattr },		/* getattr */
	{ &vop_setattr_desc, ufs_setattr },		/* setattr */
	{ &vop_read_desc, ufsspec_read },		/* read */
	{ &vop_write_desc, ufsspec_write },		/* write */
	{ &vop_lease_desc, spec_lease_check },		/* lease */
	{ &vop_ioctl_desc, spec_ioctl },		/* ioctl */
	{ &vop_fcntl_desc, ufs_fcntl },			/* fcntl */
	{ &vop_poll_desc, spec_poll },			/* poll */
	{ &vop_revoke_desc, spec_revoke },		/* revoke */
	{ &vop_mmap_desc, spec_mmap },			/* mmap */
	{ &vop_fsync_desc, ffs_fsync },			/* fsync */
	{ &vop_seek_desc, spec_seek },			/* seek */
	{ &vop_remove_desc, spec_remove },		/* remove */
	{ &vop_link_desc, spec_link },			/* link */
	{ &vop_rename_desc, spec_rename },		/* rename */
	{ &vop_mkdir_desc, spec_mkdir },		/* mkdir */
	{ &vop_rmdir_desc, spec_rmdir },		/* rmdir */
	{ &vop_symlink_desc, spec_symlink },		/* symlink */
	{ &vop_readdir_desc, spec_readdir },		/* readdir */
	{ &vop_readlink_desc, spec_readlink },		/* readlink */
	{ &vop_abortop_desc, spec_abortop },		/* abortop */
	{ &vop_inactive_desc, ufs_inactive },		/* inactive */
	{ &vop_reclaim_desc, ffs_reclaim },		/* reclaim */
	{ &vop_lock_desc, ufs_lock },			/* lock */
	{ &vop_unlock_desc, ufs_unlock },		/* unlock */
	{ &vop_bmap_desc, spec_bmap },			/* bmap */
	{ &vop_strategy_desc, spec_strategy },		/* strategy */
	{ &vop_print_desc, ufs_print },			/* print */
	{ &vop_islocked_desc, ufs_islocked },		/* islocked */
	{ &vop_pathconf_desc, spec_pathconf },		/* pathconf */
	{ &vop_advlock_desc, spec_advlock },		/* advlock */
	{ &vop_blkatoff_desc, spec_blkatoff },		/* blkatoff */
	{ &vop_valloc_desc, spec_valloc },		/* valloc */
	{ &vop_reallocblks_desc, spec_reallocblks },	/* reallocblks */
	{ &vop_vfree_desc, ffs_vfree },			/* vfree */
	{ &vop_truncate_desc, spec_truncate },		/* truncate */
	{ &vop_update_desc, ffs_update },		/* update */
	{ &vop_bwrite_desc, vn_bwrite },		/* bwrite */
	{ (struct vnodeop_desc*)NULL, (int(*) __P((void *)))NULL }
};
struct vnodeopv_desc ffs_specop_opv_desc =
	{ &ffs_specop_p, ffs_specop_entries };
    176 
/*
 * Vnode operations table built around the fifo_* routines (presumably
 * for FIFOs that live on an FFS filesystem -- confirm where ffs_fifoop_p
 * is installed on a vnode).
 *
 * Most operations are handed straight to fifo_*.  The ones that stay with
 * the filesystem are:
 *   - access, getattr, setattr, fcntl, print           -> ufs_*
 *   - inactive, lock, unlock, islocked                 -> ufs_*
 *   - fsync, reclaim, vfree, update                    -> ffs_*
 *   - close, read, write                               -> ufsfifo_*
 * Unlike ffs_vnodeop_entries, this table has no whiteout or balloc entry.
 *
 * The list is terminated by a NULL/NULL pair; ffs_fifoop_opv_desc ties
 * the table to ffs_fifoop_p.
 */
int (**ffs_fifoop_p) __P((void *));
struct vnodeopv_entry_desc ffs_fifoop_entries[] = {
	{ &vop_default_desc, vn_default_error },
	{ &vop_lookup_desc, fifo_lookup },		/* lookup */
	{ &vop_create_desc, fifo_create },		/* create */
	{ &vop_mknod_desc, fifo_mknod },		/* mknod */
	{ &vop_open_desc, fifo_open },			/* open */
	{ &vop_close_desc, ufsfifo_close },		/* close */
	{ &vop_access_desc, ufs_access },		/* access */
	{ &vop_getattr_desc, ufs_getattr },		/* getattr */
	{ &vop_setattr_desc, ufs_setattr },		/* setattr */
	{ &vop_read_desc, ufsfifo_read },		/* read */
	{ &vop_write_desc, ufsfifo_write },		/* write */
	{ &vop_lease_desc, fifo_lease_check },		/* lease */
	{ &vop_ioctl_desc, fifo_ioctl },		/* ioctl */
	{ &vop_fcntl_desc, ufs_fcntl },			/* fcntl */
	{ &vop_poll_desc, fifo_poll },			/* poll */
	{ &vop_revoke_desc, fifo_revoke },		/* revoke */
	{ &vop_mmap_desc, fifo_mmap },			/* mmap */
	{ &vop_fsync_desc, ffs_fsync },			/* fsync */
	{ &vop_seek_desc, fifo_seek },			/* seek */
	{ &vop_remove_desc, fifo_remove },		/* remove */
	{ &vop_link_desc, fifo_link },			/* link */
	{ &vop_rename_desc, fifo_rename },		/* rename */
	{ &vop_mkdir_desc, fifo_mkdir },		/* mkdir */
	{ &vop_rmdir_desc, fifo_rmdir },		/* rmdir */
	{ &vop_symlink_desc, fifo_symlink },		/* symlink */
	{ &vop_readdir_desc, fifo_readdir },		/* readdir */
	{ &vop_readlink_desc, fifo_readlink },		/* readlink */
	{ &vop_abortop_desc, fifo_abortop },		/* abortop */
	{ &vop_inactive_desc, ufs_inactive },		/* inactive */
	{ &vop_reclaim_desc, ffs_reclaim },		/* reclaim */
	{ &vop_lock_desc, ufs_lock },			/* lock */
	{ &vop_unlock_desc, ufs_unlock },		/* unlock */
	{ &vop_bmap_desc, fifo_bmap },			/* bmap */
	{ &vop_strategy_desc, fifo_strategy },		/* strategy */
	{ &vop_print_desc, ufs_print },			/* print */
	{ &vop_islocked_desc, ufs_islocked },		/* islocked */
	{ &vop_pathconf_desc, fifo_pathconf },		/* pathconf */
	{ &vop_advlock_desc, fifo_advlock },		/* advlock */
	{ &vop_blkatoff_desc, fifo_blkatoff },		/* blkatoff */
	{ &vop_valloc_desc, fifo_valloc },		/* valloc */
	{ &vop_reallocblks_desc, fifo_reallocblks },	/* reallocblks */
	{ &vop_vfree_desc, ffs_vfree },			/* vfree */
	{ &vop_truncate_desc, fifo_truncate },		/* truncate */
	{ &vop_update_desc, ffs_update },		/* update */
	{ &vop_bwrite_desc, vn_bwrite },		/* bwrite */
	{ (struct vnodeop_desc*)NULL, (int(*) __P((void *)))NULL }
};
struct vnodeopv_desc ffs_fifoop_opv_desc =
	{ &ffs_fifoop_p, ffs_fifoop_entries };
    228 
/*
 * Cluster I/O switches, both enabled (1) by default.  Nothing in the code
 * visible in this file reads them; presumably they are consulted by the
 * read/write code pulled in from ufs_readwrite.c below -- confirm there.
 */
int doclusterread = 1;
int doclusterwrite = 1;

/*
 * Textually include the UFS read/write source file.
 * NOTE(review): ffs_read and ffs_write are referenced by
 * ffs_vnodeop_entries but are not defined in the visible part of this
 * file, so they presumably come from this include -- confirm.
 */
#include <ufs/ufs/ufs_readwrite.c>
    233 
    234 int
    235 ffs_fsync(v)
    236 	void *v;
    237 {
    238 	struct vop_fsync_args /* {
    239 		struct vnode *a_vp;
    240 		struct ucred *a_cred;
    241 		int a_flags;
    242 		off_t offlo;
    243 		off_t offhi;
    244 		struct proc *a_p;
    245 	} */ *ap = v;
    246 	struct buf *bp, *nbp, *ibp;
    247 	int s, num, error, i;
    248 	struct indir ia[NIADDR + 1];
    249 	int bsize;
    250 	daddr_t blk_low, blk_high;
    251 	struct vnode *vp;
    252 
    253 	/*
    254 	 * XXX no easy way to sync a range in a file with softdep.
    255 	 */
    256 	if ((ap->a_offlo == 0 && ap->a_offhi == 0) || DOINGSOFTDEP(ap->a_vp))
    257 		return ffs_full_fsync(v);
    258 
    259 	vp = ap->a_vp;
    260 
    261 	bsize = ap->a_vp->v_mount->mnt_stat.f_iosize;
    262 	blk_low = ap->a_offlo / bsize;
    263 	blk_high = ap->a_offhi / bsize;
    264 	if (ap->a_offhi % bsize != 0)
    265 		blk_high++;
    266 
    267 	/*
    268 	 * First, flush all data blocks in range.
    269 	 */
    270 loop:
    271 	s = splbio();
    272 	for (bp = LIST_FIRST(&vp->v_dirtyblkhd); bp; bp = nbp) {
    273 		nbp = LIST_NEXT(bp, b_vnbufs);
    274 		if ((bp->b_flags & B_BUSY))
    275 			continue;
    276 		if (bp->b_lblkno < blk_low || bp->b_lblkno > blk_high)
    277 			continue;
    278 		bp->b_flags |= B_BUSY | B_VFLUSH;
    279 		splx(s);
    280 		bawrite(bp);
    281 		goto loop;
    282 	}
    283 
    284 	/*
    285 	 * Then, flush possibly unwritten indirect blocks. Without softdeps,
    286 	 * these should be the only ones left.
    287 	 */
    288 	if (!(ap->a_flags & FSYNC_DATAONLY) && blk_high >= NDADDR) {
    289 		error = ufs_getlbns(vp, blk_high, ia, &num);
    290 		if (error != 0)
    291 			return error;
    292 		for (i = 0; i < num; i++) {
    293 			ibp = incore(vp, ia[i].in_lbn);
    294 			if (ibp != NULL && !(ibp->b_flags & B_BUSY) &&
    295 			    (ibp->b_flags & B_DELWRI)) {
    296 				ibp->b_flags |= B_BUSY | B_VFLUSH;
    297 				splx(s);
    298 				bawrite(ibp);
    299 				s = splbio();
    300 			}
    301 		}
    302 	}
    303 
    304 	if (ap->a_flags & FSYNC_WAIT) {
    305 		while (vp->v_numoutput > 0) {
    306 			vp->v_flag |= VBWAIT;
    307 			tsleep((caddr_t)&vp->v_numoutput, PRIBIO + 1,
    308 			    "fsync_range", 0);
    309 		}
    310 	}
    311 
    312 	splx(s);
    313 
    314 	return (VOP_UPDATE(vp, NULL, NULL,
    315 	    (ap->a_flags & FSYNC_WAIT) ? UPDATE_WAIT : 0));
    316 }
    317 
/*
 * Synch an open file: start writes for the dirty buffers attached to the
 * vnode and, if asked, wait for them.
 *
 * v points to a struct vop_fsync_args.  Flags consulted in a_flags:
 *   FSYNC_WAIT     - after the scan, sleep until v_numoutput is zero, call
 *                    softdep_sync_metadata(), and rescan while the dirty
 *                    list is non-empty.  There are up to NIADDR + 1
 *                    retries; on the last one the writes are synchronous
 *                    (bwrite) so that write errors are seen.
 *   FSYNC_DATAONLY - buffers with a negative logical block number are
 *                    never written.  Combined with FSYNC_WAIT the function
 *                    returns 0 as soon as the writes have drained, without
 *                    calling softdep_sync_metadata() or VOP_UPDATE().
 *
 * Returns the error from a failed bwrite() or softdep_sync_metadata();
 * otherwise the result of VOP_UPDATE() (UPDATE_WAIT when FSYNC_WAIT is
 * set).
 */
/* ARGSUSED */
static int
ffs_full_fsync(v)
	void *v;
{
	struct vop_fsync_args /* {
		struct vnode *a_vp;
		struct ucred *a_cred;
		int a_flags;
		off_t a_offlo;
		off_t a_offhi;
		struct proc *a_p;
	} */ *ap = v;
	struct vnode *vp = ap->a_vp;
	struct buf *bp, *nbp;
	int s, error, passes, skipmeta;

	/*
	 * A block device with a filesystem mounted on it that has
	 * MNT_SOFTDEP set is first handed to softdep_fsync_mountdev().
	 */
	if (vp->v_type == VBLK &&
	    vp->v_specmountpoint != NULL &&
	    (vp->v_specmountpoint->mnt_flag & MNT_SOFTDEP))
		softdep_fsync_mountdev(vp);

	/*
	 * Flush all dirty buffers associated with a vnode
	 *
	 * passes counts the remaining retries.  skipmeta makes the scan
	 * leave buffers with a negative b_lblkno alone; it starts out set
	 * whenever FSYNC_WAIT or FSYNC_DATAONLY is given.
	 */
	passes = NIADDR + 1;
	skipmeta = 0;
	if (ap->a_flags & (FSYNC_DATAONLY|FSYNC_WAIT))
		skipmeta = 1;
	s = splbio();
loop:
	/* Start each scan with every buffer unmarked. */
	for (bp = LIST_FIRST(&vp->v_dirtyblkhd); bp;
	     bp = LIST_NEXT(bp, b_vnbufs))
		bp->b_flags &= ~B_SCANNED;
	for (bp = LIST_FIRST(&vp->v_dirtyblkhd); bp; bp = nbp) {
		nbp = LIST_NEXT(bp, b_vnbufs);
		/* Skip buffers in use or already handled in this scan. */
		if (bp->b_flags & (B_BUSY | B_SCANNED))
			continue;
		if ((bp->b_flags & B_DELWRI) == 0)
			panic("ffs_fsync: not dirty");
		if (skipmeta && bp->b_lblkno < 0)
			continue;
		bp->b_flags |= B_BUSY | B_VFLUSH | B_SCANNED;
		/* The write itself is issued with the spl level restored. */
		splx(s);
		/*
		 * On our final pass through, do all I/O synchronously
		 * so that we can find out if our flush is failing
		 * because of write errors.
		 */
		if (passes > 0 || !(ap->a_flags & FSYNC_WAIT))
			(void) bawrite(bp);
		else if ((error = bwrite(bp)) != 0)
			return (error);
		s = splbio();
		/*
		 * Since we may have slept during the I/O, we need
		 * to start from a known point.
		 */
		nbp = LIST_FIRST(&vp->v_dirtyblkhd);
	}
	/*
	 * If the scan skipped negative-lblkno buffers and the caller did
	 * not ask for data only, scan once more without skipping them.
	 */
	if (skipmeta && !(ap->a_flags & FSYNC_DATAONLY)) {
		skipmeta = 0;
		goto loop;
	}
	if (ap->a_flags & FSYNC_WAIT) {
		/* Sleep until all writes outstanding on the vnode are done. */
		while (vp->v_numoutput) {
			vp->v_flag |= VBWAIT;
			(void) tsleep(&vp->v_numoutput, PRIBIO + 1,
			    "ffsfsync", 0);
		}
		/* Leave splbio here: both early returns below need it. */
		splx(s);

		if (ap->a_flags & FSYNC_DATAONLY)
			return (0);

		/*
		 * Ensure that any filesystem metadata associated
		 * with the vnode has been written.
		 */
		if ((error = softdep_sync_metadata(ap)) != 0)
			return (error);

		s = splbio();
		if (!LIST_EMPTY(&vp->v_dirtyblkhd)) {
			/*
			 * Block devices associated with filesystems may
			 * have new I/O requests posted for them even if
			 * the vnode is locked, so no amount of trying will
			 * get them clean. Thus we give block devices a
			 * good effort, then just give up. For all other file
			 * types, go around and try again until it is clean.
			 */
			if (passes > 0) {
				passes--;
				goto loop;
			}
#ifdef DIAGNOSTIC
			if (vp->v_type != VBLK)
				vprint("ffs_fsync: dirty", vp);
#endif
		}
	}
	/* Every path that reaches this point is at splbio. */
	splx(s);
	return (VOP_UPDATE(vp, NULL, NULL,
	    (ap->a_flags & FSYNC_WAIT) ? UPDATE_WAIT : 0));
}
    427 
    428 /*
    429  * Reclaim an inode so that it can be used for other purposes.
    430  */
    431 int
    432 ffs_reclaim(v)
    433 	void *v;
    434 {
    435 	struct vop_reclaim_args /* {
    436 		struct vnode *a_vp;
    437 		struct proc *a_p;
    438 	} */ *ap = v;
    439 	struct vnode *vp = ap->a_vp;
    440 	int error;
    441 
    442 	if ((error = ufs_reclaim(vp, ap->a_p)) != 0)
    443 		return (error);
    444 	/*
    445 	 * XXX MFS ends up here, too, to free an inode.  Should we create
    446 	 * XXX a separate pool for MFS inodes?
    447 	 */
    448 	pool_put(&ffs_inode_pool, vp->v_data);
    449 	vp->v_data = NULL;
    450 	return (0);
    451 }
    452