Home | History | Annotate | Line # | Download | only in lfs
lfs_inode.c revision 1.18
      1 /*	$NetBSD: lfs_inode.c,v 1.18 1999/03/10 00:20:00 perseant Exp $	*/
      2 
      3 /*-
      4  * Copyright (c) 1999 The NetBSD Foundation, Inc.
      5  * All rights reserved.
      6  *
      7  * This code is derived from software contributed to The NetBSD Foundation
      8  * by Konrad E. Schroder <perseant (at) hhhh.org>.
      9  *
     10  * Redistribution and use in source and binary forms, with or without
     11  * modification, are permitted provided that the following conditions
     12  * are met:
     13  * 1. Redistributions of source code must retain the above copyright
     14  *    notice, this list of conditions and the following disclaimer.
     15  * 2. Redistributions in binary form must reproduce the above copyright
     16  *    notice, this list of conditions and the following disclaimer in the
     17  *    documentation and/or other materials provided with the distribution.
     18  * 3. All advertising materials mentioning features or use of this software
     19  *    must display the following acknowledgement:
     20  *      This product includes software developed by the NetBSD
     21  *      Foundation, Inc. and its contributors.
     22  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23  *    contributors may be used to endorse or promote products derived
     24  *    from this software without specific prior written permission.
     25  *
     26  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36  * POSSIBILITY OF SUCH DAMAGE.
     37  */
     38 /*
     39  * Copyright (c) 1986, 1989, 1991, 1993
     40  *	The Regents of the University of California.  All rights reserved.
     41  *
     42  * Redistribution and use in source and binary forms, with or without
     43  * modification, are permitted provided that the following conditions
     44  * are met:
     45  * 1. Redistributions of source code must retain the above copyright
     46  *    notice, this list of conditions and the following disclaimer.
     47  * 2. Redistributions in binary form must reproduce the above copyright
     48  *    notice, this list of conditions and the following disclaimer in the
     49  *    documentation and/or other materials provided with the distribution.
     50  * 3. All advertising materials mentioning features or use of this software
     51  *    must display the following acknowledgement:
     52  *	This product includes software developed by the University of
     53  *	California, Berkeley and its contributors.
     54  * 4. Neither the name of the University nor the names of its contributors
     55  *    may be used to endorse or promote products derived from this software
     56  *    without specific prior written permission.
     57  *
     58  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     59  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     60  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     61  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     62  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     63  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     64  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     65  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     66  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     67  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     68  * SUCH DAMAGE.
     69  *
     70  *	@(#)lfs_inode.c	8.9 (Berkeley) 5/8/95
     71  */
     72 
     73 #if defined(_KERNEL) && !defined(_LKM)
     74 #include "opt_quota.h"
     75 #endif
     76 
     77 #include <sys/param.h>
     78 #include <sys/systm.h>
     79 #include <sys/mount.h>
     80 #include <sys/proc.h>
     81 #include <sys/file.h>
     82 #include <sys/buf.h>
     83 #include <sys/vnode.h>
     84 #include <sys/kernel.h>
     85 #include <sys/malloc.h>
     86 
     87 #include <vm/vm.h>
     88 
     89 #include <ufs/ufs/quota.h>
     90 #include <ufs/ufs/inode.h>
     91 #include <ufs/ufs/ufsmount.h>
     92 #include <ufs/ufs/ufs_extern.h>
     93 
     94 #include <ufs/lfs/lfs.h>
     95 #include <ufs/lfs/lfs_extern.h>
     96 
     97 /* Search a block for a specific dinode. */
     98 struct dinode *
     99 lfs_ifind(fs, ino, dip)
    100 	struct lfs *fs;
    101 	ino_t ino;
    102 	register struct dinode *dip;
    103 {
    104 	register int cnt;
    105 	register struct dinode *ldip;
    106 
    107 	for (cnt = INOPB(fs), ldip = dip + (cnt - 1); cnt--; --ldip)
    108 		if (ldip->di_inumber == ino)
    109 			return (ldip);
    110 
    111 	panic("lfs_ifind: dinode %u not found", ino);
    112 	/* NOTREACHED */
    113 }
    114 
    115 int
    116 lfs_update(v)
    117 	void *v;
    118 {
    119 	struct vop_update_args /* {
    120 				  struct vnode *a_vp;
    121 				  struct timespec *a_access;
    122 				  struct timespec *a_modify;
    123 				  int a_waitfor;
    124 				  } */ *ap = v;
    125 	struct inode *ip;
    126 	struct vnode *vp = ap->a_vp;
    127 	int mod, oflag;
    128 	struct timespec ts;
    129 
    130 	if (vp->v_mount->mnt_flag & MNT_RDONLY)
    131 		return (0);
    132 	ip = VTOI(vp);
    133 
    134 	/*
    135 	 * If we are called from vinvalbuf, and the file's blocks have
    136 	 * already been scheduled for writing, but the writes have not
    137 	 * yet completed, lfs_vflush will not be called, and vinvalbuf
    138 	 * will cause a panic.  So, we must wait until any pending write
    139 	 * for our inode completes, if we are called with LFS_SYNC set.
    140 	 */
    141 	while((ap->a_waitfor & LFS_SYNC) && WRITEINPROG(vp)) {
    142 		tsleep(vp, (PRIBIO+1), "lfs_update", 0);
    143 	}
    144 	mod = ip->i_flag & IN_MODIFIED;
    145 	oflag = ip->i_flag;
    146 	TIMEVAL_TO_TIMESPEC(&time, &ts);
    147 	LFS_ITIMES(ip,
    148 		   ap->a_access ? ap->a_access : &ts,
    149 		   ap->a_modify ? ap->a_modify : &ts, &ts);
    150 	if (!mod && (ip->i_flag & IN_MODIFIED))
    151 		ip->i_lfs->lfs_uinodes++;
    152 	if ((ip->i_flag & (IN_MODIFIED|IN_CLEANING)) == 0) {
    153 		return (0);
    154 	}
    155 
    156 	/* If sync, push back the vnode and any dirty blocks it may have. */
    157 	return (ap->a_waitfor & LFS_SYNC ? lfs_vflush(vp) : 0);
    158 }
    159 
/*
 * Update segment usage information when removing a block.
 *
 * If a segment is being tracked (lastseg != -1), look up its segment
 * usage entry, subtract the `num' bytes accumulated for it, write the
 * entry back with VOP_BWRITE() (result left in e1), and add the freed
 * fragments to fragsreleased.
 *
 * Uses these names from the expanding scope: fs, sup, sup_bp, lastseg,
 * num, e1 and fragsreleased.
 *
 * The body is wrapped in do { } while (0) so that "UPDATE_SEGUSE;" is a
 * single statement and can be used as the body of an if/else.  The
 * assignment after panic() is only a fallback should panic() return.
 */
#define UPDATE_SEGUSE do { \
	if (lastseg != -1) { \
		LFS_SEGENTRY(sup, fs, lastseg, sup_bp); \
		if (num > sup->su_nbytes) { \
			panic("lfs_truncate: negative bytes in segment %d\n", \
			      lastseg); \
			sup->su_nbytes = 0; \
		} else \
			sup->su_nbytes -= num; \
		e1 = VOP_BWRITE(sup_bp); \
		fragsreleased += numfrags(fs, num); \
	} \
} while (0)
    173 
/*
 * Account for S bytes freed from the block at disk address `daddr'.
 *
 * A daddr of 0 is ignored.  If the block lies in a different segment
 * than the one being tracked in lastseg, the running total is flushed
 * with UPDATE_SEGUSE and a new total is started for the new segment;
 * otherwise S is added to the running total `num'.
 *
 * Uses daddr, seg, lastseg, num and fs from the expanding scope, plus
 * whatever UPDATE_SEGUSE needs.  Wrapped in do { } while (0) so that
 * "SEGDEC(x);" is a single statement and can be used in an if/else.
 */
#define SEGDEC(S) do { \
	if (daddr != 0) { \
		if (lastseg != (seg = datosn(fs, daddr))) { \
			UPDATE_SEGUSE; \
			num = (S); \
			lastseg = seg; \
		} else \
			num += (S); \
	} \
} while (0)
    184 
     185 /*
     186  * Truncate the inode ip to at most length size.  Update segment usage
     187  * table information.
          *
          * v points to a struct vop_truncate_args.  a_vp is the vnode to
          * truncate and a_length the new length; a_cred and a_p are handed to
          * vinvalbuf().  a_flags is not examined here.
          *
          * A symbolic link on a mount with mnt_maxsymlinklen > 0 is cleared in
          * place in the inode.  If the file is already no longer than a_length,
          * only IN_CHANGE and IN_UPDATE are set and the inode is updated.
          * Otherwise the partial last block (if any) is zeroed past the new end,
          * the segment usage byte counts of every released block are reduced,
          * the inode's block count and the file system's free and available
          * counts are adjusted, and the vnode's buffers are invalidated.
          *
          * Returns 0 or an error from getinoquota(), bread(), VOP_BWRITE(),
          * vinvalbuf() or VOP_UPDATE().  A failed read of an indirect block
          * panics.
     188  */
     189 /* ARGSUSED */
     190 int
     191 lfs_truncate(v)
     192 	void *v;
     193 {
     194 	struct vop_truncate_args /* {
     195 		struct vnode *a_vp;
     196 		off_t a_length;
     197 		int a_flags;
     198 		struct ucred *a_cred;
     199 		struct proc *a_p;
     200 	} */ *ap = v;
     201 	register struct indir *inp;
     202 	register int i;
     203 	register ufs_daddr_t *daddrp;
     204 	register struct vnode *vp = ap->a_vp;
     205 	off_t length = ap->a_length;
     206 	struct buf *bp, *sup_bp;
     207 	struct ifile *ifp;
     208 	struct inode *ip;
     209 	struct lfs *fs;
     210 	struct indir a[NIADDR + 2], a_end[NIADDR + 2];
     211 	SEGUSE *sup;
     212 	ufs_daddr_t daddr, lastblock, lbn, olastblock;
     213 	ufs_daddr_t oldsize_lastblock, oldsize_newlast, newsize;
     214 	long off, a_released, fragsreleased, i_released;
     215 	int e1, e2, depth, lastseg, num, offset, seg, freesize;
     216 
     217 	ip = VTOI(vp);
     218 
         	/*
         	 * Symbolic link on a mount that allows in-inode link text: zero
         	 * the i_ffs_shortlink area, set the size to 0 and update the inode.
         	 */
     219 	if (vp->v_type == VLNK && vp->v_mount->mnt_maxsymlinklen > 0) {
     220 #ifdef DIAGNOSTIC
     221 		if (length != 0)
     222 			panic("lfs_truncate: partial truncate of symlink");
     223 #endif
     224 		bzero((char *)&ip->i_ffs_shortlink, (u_int)ip->i_ffs_size);
     225 		ip->i_ffs_size = 0;
     226 		ip->i_flag |= IN_CHANGE | IN_UPDATE;
     227 		return (VOP_UPDATE(vp, NULL, NULL, 0));
     228 	}
         	/* Tell the VM system the new size (done before the size check below). */
     229 #ifdef UVM
     230 	uvm_vnp_setsize(vp, length);
     231 #else
     232 	vnode_pager_setsize(vp, length);
     233 #endif
     234 
     235 	fs = ip->i_lfs;
     236 	lfs_imtime(fs);
     237 
     238 	/* If length is larger than the file, just update the times. */
     239 	if (ip->i_ffs_size <= length) {
     240 		ip->i_flag |= IN_CHANGE | IN_UPDATE;
     241 		return (VOP_UPDATE(vp, NULL, NULL, 0));
     242 	}
     243 
     244 #if 0
     245 	/*
     246 	 * Make sure no writes happen while we're truncating
     247 	 * XXX KS - I don't remember why....
     248 	 */
     249 	while(fs->lfs_seglock) {
     250 		tsleep(&fs->lfs_seglock, (PRIBIO+1), "lfs_truncate", 0);
     251 	}
     252 #endif
     253 
     254 	/*
     255 	 * Calculate index into inode's block list of last direct and indirect
     256 	 * blocks (if any) which we want to keep.  Lastblock is 0 when the
     257 	 * file is truncated to 0.
         	 *
         	 * lastblock is the first logical block to release; olastblock is
         	 * the last logical block of the file at its current size.
     258 	 */
     259 	lastblock = lblkno(fs, length + fs->lfs_bsize - 1);
     260 	olastblock = lblkno(fs, ip->i_ffs_size + fs->lfs_bsize - 1) - 1;
     261 
     262 	/*
     263 	 * Update the size of the file. If the file is not being truncated to
     264 	 * a block boundary, the contents of the partial block following the end
         	 * of the file must be zeroed in case it ever becomes accessible again
     265 	 * because of subsequent file growth.  For this part of the code,
     266 	 * oldsize_newlast refers to the old size of the new last block in the
     267 	 * file.
     268 	 */
     269 	offset = blkoff(fs, length);
     270 	lbn = lblkno(fs, length);
     271 	oldsize_newlast = blksize(fs, ip, lbn);
     272 
     273 	/* Now set oldsize to the current size of the current last block */
     274 	oldsize_lastblock = blksize(fs, ip, olastblock);
     275 	if (offset == 0)
     276 		ip->i_ffs_size = length;
     277 	else {
         		/*
         		 * NOTE(review): the early returns in this branch happen after
         		 * the pager has already been told the new size above; confirm
         		 * callers can cope with that on error.
         		 */
     278 #ifdef QUOTA
     279 		if ((e1 = getinoquota(ip)) != 0)
     280 			return (e1);
     281 #endif
         		/* Read the block that will become the new last block. */
     282 		if ((e1 = bread(vp, lbn, oldsize_newlast, NOCRED, &bp)) != 0) {
     283 			printf("lfs_truncate: bread: %d\n",e1);
     284 			brelse(bp);
     285 			return (e1);
     286 		}
     287 		ip->i_ffs_size = length;
     288 #if defined(UVM)
     289 		(void)uvm_vnp_uncache(vp);
     290 #else
     291 		(void)vnode_pager_uncache(vp);
     292 #endif
         		/*
         		 * With the size updated, blksize() now gives the new size of
         		 * this block.  Zero from the new end of file to the end of
         		 * that size, then resize the buffer to match.
         		 */
     293 		newsize = blksize(fs, ip, lbn);
     294 		bzero((char *)bp->b_data + offset, (u_int)(newsize - offset));
     295 #ifdef DEBUG
     296 		if(bp->b_flags & B_CALL)
     297 		    panic("Can't allocbuf malloced buffer!");
     298 		else
     299 #endif
     300 			allocbuf(bp, newsize);
         		/* The last block shrank: give back the difference in disk blocks. */
     301 		if(oldsize_newlast > newsize)
     302 			ip->i_ffs_blocks -= btodb(oldsize_newlast - newsize);
     303 		if ((e1 = VOP_BWRITE(bp)) != 0) {
     304 			printf("lfs_truncate: bwrite: %d\n",e1);
     305 			return (e1);
     306 		}
     307 	}
     308 	/*
     309 	 * Modify sup->su_nbyte counters for each deleted block; keep track
     310 	 * of number of blocks removed for ip->i_ffs_blocks.
         	 *
         	 * num accumulates bytes freed in segment lastseg; SEGDEC flushes
         	 * it through UPDATE_SEGUSE whenever the segment changes.
     311 	 */
     312 	fragsreleased = 0;
     313 	num = 0;
     314 	lastseg = -1;
     315 
         	/* Walk logical blocks backwards from olastblock down to lastblock. */
     316 	for (lbn = olastblock; lbn >= lastblock;) {
     317 		/* XXX use run length from bmap array to make this faster */
     318 		ufs_bmaparray(vp, lbn, &daddr, a, &depth, NULL);
         		/*
         		 * First pass: remember the indirection path of the old last
         		 * block in a_end, and free only the old last block's actual
         		 * size.  Every other block is counted as a full block.
         		 */
     319 		if (lbn == olastblock) {
     320 			for (i = NIADDR + 2; i--;)
     321 				a_end[i] = a[i];
     322 			freesize = oldsize_lastblock;
     323 		} else
     324 			freesize = fs->lfs_bsize;
     325 		switch (depth) {
     326 		case 0:		/* Direct block. */
         			/* Account for the block, clear its pointer, step back one. */
     327 			daddr = ip->i_ffs_db[lbn];
     328 			SEGDEC(freesize);
     329 			ip->i_ffs_db[lbn] = 0;
     330 			--lbn;
     331 			break;
     332 #ifdef DIAGNOSTIC
     333 		case 1:		/* An indirect block. */
     334 			panic("lfs_truncate: ufs_bmaparray returned depth 1");
     335 			/* NOTREACHED */
     336 #endif
     337 		default:	/* Chain of indirect blocks. */
         			/* inp: last entry of the path filled in by ufs_bmaparray. */
     338 			inp = a + --depth;
         			/*
         			 * Not at offset 0 of this indirect block and not yet at
         			 * lastblock: move lbn back by in_off, but never past
         			 * lastblock, and look the new lbn up again.
         			 */
     339 			if (inp->in_off > 0 && lbn != lastblock) {
     340 				lbn -= inp->in_off < lbn - lastblock ?
     341 					inp->in_off : lbn - lastblock;
     342 				break;
     343 			}
         			/*
         			 * Climb the chain towards the inode for as long as the
         			 * entry is at offset 0 or lbn has reached lastblock.
         			 */
     344 			for (; depth && (inp->in_off == 0 || lbn == lastblock);
     345 			     --inp, --depth) {
     346 				if (bread(vp,
     347 					  inp->in_lbn, fs->lfs_bsize, NOCRED, &bp))
     348 					panic("lfs_truncate: bread bno %d",
     349 					      inp->in_lbn);
         				/*
         				 * Account for every pointer in this indirect
         				 * block from in_off through a_end[depth].in_off.
         				 */
     350 				daddrp = (ufs_daddr_t *)bp->b_data + inp->in_off;
     351 				for (i = inp->in_off;
     352 				     i++ <= a_end[depth].in_off;) {
     353 					daddr = *daddrp++;
     354 					SEGDEC(freesize);
     355 				}
         				/*
         				 * Subsequent passes at this depth run to the last
         				 * slot of the indirect block (presumably because
         				 * only the old last block's path ends early).
         				 */
     356 				a_end[depth].in_off = NINDIR(fs) - 1;
         				/*
         				 * At offset 0 the buffer is released unmodified;
         				 * otherwise the pointers from in_off onward are
         				 * zeroed and the block is written back.
         				 * NOTE(review): a write error here returns with the
         				 * truncation only partly accounted for.
         				 */
     357 				if (inp->in_off == 0)
     358 					brelse (bp);
     359 				else {
     360 					bzero((ufs_daddr_t *)bp->b_data +
     361 					      inp->in_off, fs->lfs_bsize -
     362 					      inp->in_off * sizeof(ufs_daddr_t));
     363 					if ((e1 = VOP_BWRITE(bp)) != 0) {
     364 						printf("lfs_truncate: indir bwrite: %d\n",e1);
     365 						return (e1);
     366 					}
     367 				}
     368 			}
         			/*
         			 * The climb reached the inode and the top-level indirect
         			 * block is at offset 0: account for the inode's indirect
         			 * pointer a[0].in_off and clear it.
         			 */
     369 			if (depth == 0 && a[1].in_off == 0) {
     370 				off = a[0].in_off;
     371 				daddr = ip->i_ffs_ib[off];
     372 				SEGDEC(freesize);
     373 				ip->i_ffs_ib[off] = 0;
     374 			}
         			/*
         			 * Step back one block at the boundary cases, otherwise
         			 * by a whole indirect block, clamped to lastblock.
         			 */
     375 			if (lbn == lastblock || lbn <= NDADDR)
     376 				--lbn;
     377 			else {
     378 				lbn -= NINDIR(fs);
     379 				if (lbn < lastblock)
     380 					lbn = lastblock;
     381 			}
     382 		}
     383 	}
         	/* Flush the byte count still pending for the last segment seen. */
     384 	UPDATE_SEGUSE;
     385 
     386 	/* If truncating the file to 0, update the version number. */
     387 	if (length == 0) {
     388 		LFS_IENTRY(ifp, fs, ip->i_number, bp);
     389 		++ifp->if_version;
     390 		(void) VOP_BWRITE(bp);
     391 	}
     392 #ifdef DIAGNOSTIC
         	/* The assignment after panic() only matters if panic() returns. */
     393 	if (ip->i_ffs_blocks < fragstodb(fs, fragsreleased)) {
     394 		panic("lfs_truncate: frag count < 0 (%d<%ld), ino %d\n",
     395 			    ip->i_ffs_blocks, fragstodb(fs, fragsreleased),
     396 			    ip->i_number);
     397 		fragsreleased = dbtofrags(fs, ip->i_ffs_blocks);
     398 	}
     399 #endif
         	/* Credit the released on-disk fragments to the inode and the fs. */
     400 	ip->i_ffs_blocks -= fragstodb(fs, fragsreleased);
     401 	fs->lfs_bfree +=  fragstodb(fs, fragsreleased);
     402 	ip->i_flag |= IN_CHANGE | IN_UPDATE;
     403 	/*
     404 	 * Traverse dirty block list counting number of dirty buffers
     405 	 * that are being deleted out of the cache, so that the lfs_avail
     406 	 * field can be updated.
         	 *
         	 * a_released counts every B_LOCKED dirty buffer; i_released counts
         	 * only those whose b_blkno still equals b_lblkno.
     407 	 */
     408 	a_released = 0;
     409 	i_released = 0;
     410 	for (bp = vp->v_dirtyblkhd.lh_first; bp; bp = bp->b_vnbufs.le_next) {
     411 		if (bp->b_flags & B_LOCKED) {
     412 			a_released += numfrags(fs, bp->b_bcount);
     413 			/*
     414 			 * XXX
     415 			 * When buffers are created in the cache, their block
     416 			 * number is set equal to their logical block number.
     417 			 * If that is still true, we are assuming that the
     418 			 * blocks are new (not yet on disk) and weren't
     419 			 * counted above.  However, there is a slight chance
     420 			 * that a block's disk address is equal to its logical
     421 			 * block number in which case, we'll get an overcounting
     422 			 * here.
     423 			 */
     424 			if (bp->b_blkno == bp->b_lblkno) {
     425 				i_released += numfrags(fs, bp->b_bcount);
     426 			}
     427 		}
     428 	}
         	/* Second credit: fragments of in-cache blocks not counted above. */
     429 	fragsreleased = i_released;
     430 #ifdef DIAGNOSTIC
     431 	if (fragsreleased > dbtofrags(fs, ip->i_ffs_blocks)) {
     432 		printf("lfs_inode: %ld frags released > %d in inode %d\n",
     433 		       fragsreleased, dbtofrags(fs, ip->i_ffs_blocks),
     434 		       ip->i_number);
     435 		fragsreleased = dbtofrags(fs, ip->i_ffs_blocks);
     436 	}
     437 #endif
     438 	fs->lfs_bfree += fragstodb(fs, fragsreleased);
     439 	ip->i_ffs_blocks -= fragstodb(fs, fragsreleased);
     440 #ifdef DIAGNOSTIC
     441 	if (length == 0 && ip->i_ffs_blocks != 0) {
     442 		printf("lfs_inode: trunc to zero, but %d blocks left on inode %d\n",
     443 		       ip->i_ffs_blocks, ip->i_number);
     444 		panic("lfs_inode\n");
     445 	}
     446 #endif
     447 	fs->lfs_avail += fragstodb(fs, a_released);
         	/*
         	 * Invalidate the vnode's buffers, passing V_SAVE unless truncating
         	 * to zero, then update the inode.  Both results are logged; the
         	 * vinvalbuf() error takes precedence in the return value.
         	 */
     448 	e1 = vinvalbuf(vp, (length > 0) ? V_SAVE : 0, ap->a_cred, ap->a_p,
     449 		       0, 0);
     450 	e2 = VOP_UPDATE(vp, NULL, NULL, 0);
     451 	if(e1)
     452 		printf("lfs_truncate: vinvalbuf: %d\n",e1);
     453 	if(e2)
     454 		printf("lfs_truncate: update: %d\n",e2);
     455 
     456 	return (e1 ? e1 : e2 ? e2 : 0);
     457 }
    458