Home | History | Annotate | Line # | Download | only in lfs
lfs_balloc.c revision 1.15
      1  1.15  perseant /*	$NetBSD: lfs_balloc.c,v 1.15 2000/04/23 21:10:26 perseant Exp $	*/
      2   1.2       cgd 
      3  1.11  perseant /*-
      4  1.11  perseant  * Copyright (c) 1999 The NetBSD Foundation, Inc.
      5  1.11  perseant  * All rights reserved.
      6  1.11  perseant  *
      7  1.11  perseant  * This code is derived from software contributed to The NetBSD Foundation
      8  1.11  perseant  * by Konrad E. Schroder <perseant (at) hhhh.org>.
      9  1.11  perseant  *
     10  1.11  perseant  * Redistribution and use in source and binary forms, with or without
     11  1.11  perseant  * modification, are permitted provided that the following conditions
     12  1.11  perseant  * are met:
     13  1.11  perseant  * 1. Redistributions of source code must retain the above copyright
     14  1.11  perseant  *    notice, this list of conditions and the following disclaimer.
     15  1.11  perseant  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.11  perseant  *    notice, this list of conditions and the following disclaimer in the
     17  1.11  perseant  *    documentation and/or other materials provided with the distribution.
     18  1.11  perseant  * 3. All advertising materials mentioning features or use of this software
     19  1.11  perseant  *    must display the following acknowledgement:
     20  1.11  perseant  *      This product includes software developed by the NetBSD
     21  1.11  perseant  *      Foundation, Inc. and its contributors.
     22  1.11  perseant  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23  1.11  perseant  *    contributors may be used to endorse or promote products derived
     24  1.11  perseant  *    from this software without specific prior written permission.
     25  1.11  perseant  *
     26  1.11  perseant  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27  1.11  perseant  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28  1.11  perseant  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29  1.11  perseant  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30  1.11  perseant  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31  1.11  perseant  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32  1.11  perseant  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33  1.11  perseant  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34  1.11  perseant  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35  1.11  perseant  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36  1.11  perseant  * POSSIBILITY OF SUCH DAMAGE.
     37  1.11  perseant  */
     38   1.1   mycroft /*
     39   1.1   mycroft  * Copyright (c) 1989, 1991, 1993
     40   1.1   mycroft  *	The Regents of the University of California.  All rights reserved.
     41   1.1   mycroft  *
     42   1.1   mycroft  * Redistribution and use in source and binary forms, with or without
     43   1.1   mycroft  * modification, are permitted provided that the following conditions
     44   1.1   mycroft  * are met:
     45   1.1   mycroft  * 1. Redistributions of source code must retain the above copyright
     46   1.1   mycroft  *    notice, this list of conditions and the following disclaimer.
     47   1.1   mycroft  * 2. Redistributions in binary form must reproduce the above copyright
     48   1.1   mycroft  *    notice, this list of conditions and the following disclaimer in the
     49   1.1   mycroft  *    documentation and/or other materials provided with the distribution.
     50   1.1   mycroft  * 3. All advertising materials mentioning features or use of this software
     51   1.1   mycroft  *    must display the following acknowledgement:
     52   1.1   mycroft  *	This product includes software developed by the University of
     53   1.1   mycroft  *	California, Berkeley and its contributors.
     54   1.1   mycroft  * 4. Neither the name of the University nor the names of its contributors
     55   1.1   mycroft  *    may be used to endorse or promote products derived from this software
     56   1.1   mycroft  *    without specific prior written permission.
     57   1.1   mycroft  *
     58   1.1   mycroft  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     59   1.1   mycroft  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     60   1.1   mycroft  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     61   1.1   mycroft  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     62   1.1   mycroft  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     63   1.1   mycroft  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     64   1.1   mycroft  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     65   1.1   mycroft  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     66   1.1   mycroft  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     67   1.1   mycroft  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     68   1.1   mycroft  * SUCH DAMAGE.
     69   1.1   mycroft  *
     70   1.5      fvdl  *	@(#)lfs_balloc.c	8.4 (Berkeley) 5/8/95
     71   1.1   mycroft  */
     72   1.8    scottr 
     73   1.9    scottr #if defined(_KERNEL) && !defined(_LKM)
     74   1.8    scottr #include "opt_quota.h"
     75   1.9    scottr #endif
     76   1.8    scottr 
     77   1.1   mycroft #include <sys/param.h>
     78   1.3  christos #include <sys/systm.h>
     79   1.1   mycroft #include <sys/buf.h>
     80   1.1   mycroft #include <sys/proc.h>
     81   1.1   mycroft #include <sys/vnode.h>
     82   1.1   mycroft #include <sys/mount.h>
     83   1.1   mycroft #include <sys/resourcevar.h>
     84   1.1   mycroft #include <sys/trace.h>
     85   1.1   mycroft 
     86   1.1   mycroft #include <miscfs/specfs/specdev.h>
     87   1.1   mycroft 
     88   1.1   mycroft #include <ufs/ufs/quota.h>
     89   1.1   mycroft #include <ufs/ufs/inode.h>
     90   1.1   mycroft #include <ufs/ufs/ufsmount.h>
     91   1.3  christos #include <ufs/ufs/ufs_extern.h>
     92   1.1   mycroft 
     93   1.1   mycroft #include <ufs/lfs/lfs.h>
     94   1.1   mycroft #include <ufs/lfs/lfs_extern.h>
     95   1.1   mycroft 
     96   1.5      fvdl #include <vm/vm.h>
     97  1.12       mrg 
     98  1.12       mrg #include <uvm/uvm_extern.h>
     99   1.5      fvdl 
    100   1.5      fvdl int lfs_fragextend __P((struct vnode *, int, int, ufs_daddr_t, struct buf **));
    101   1.5      fvdl 
    102   1.1   mycroft int
    103  1.14      fvdl lfs_balloc(v)
    104  1.14      fvdl 	void *v;
    105  1.14      fvdl {
    106  1.14      fvdl 	struct vop_balloc_args /* {
    107  1.14      fvdl 		struct vnode *a_vp;
    108  1.14      fvdl 		off_t a_startoffset;
    109  1.14      fvdl 		int a_size;
    110  1.14      fvdl 		struct ucred *a_cred;
    111  1.14      fvdl 		int a_flags;
    112  1.14      fvdl 		struct buf *a_bpp;
    113  1.14      fvdl 	} */ *ap = v;
    114   1.1   mycroft 	struct vnode *vp;
    115   1.5      fvdl 	int offset;
    116   1.1   mycroft 	u_long iosize;
    117  1.14      fvdl 	daddr_t lbn;
    118   1.1   mycroft 	struct buf *ibp, *bp;
    119   1.1   mycroft 	struct inode *ip;
    120   1.1   mycroft 	struct lfs *fs;
    121   1.1   mycroft 	struct indir indirs[NIADDR+2];
    122   1.5      fvdl 	ufs_daddr_t	daddr, lastblock;
    123  1.11  perseant 	int bb;		/* number of disk blocks in a block disk blocks */
    124  1.11  perseant 	int error, frags, i, nsize, osize, num;
    125  1.14      fvdl 
    126  1.14      fvdl 	vp = ap->a_vp;
    127   1.1   mycroft 	ip = VTOI(vp);
    128   1.1   mycroft 	fs = ip->i_lfs;
    129  1.14      fvdl 	offset = blkoff(fs, ap->a_startoffset);
    130  1.14      fvdl 	iosize = ap->a_size;
    131  1.14      fvdl 	lbn = lblkno(fs, ap->a_startoffset);
    132  1.14      fvdl 	(void)lfs_check(vp, lbn, 0);
    133  1.11  perseant 
    134  1.11  perseant #ifdef DEBUG
    135  1.11  perseant 	if(!VOP_ISLOCKED(vp)) {
    136  1.11  perseant 		printf("lfs_balloc: warning: ino %d not locked\n",ip->i_number);
    137  1.11  perseant 	}
    138  1.11  perseant #endif
    139  1.11  perseant 
    140   1.1   mycroft 	/*
    141   1.1   mycroft 	 * Three cases: it's a block beyond the end of file, it's a block in
    142   1.1   mycroft 	 * the file that may or may not have been assigned a disk address or
    143   1.1   mycroft 	 * we're writing an entire block.  Note, if the daddr is unassigned,
    144   1.1   mycroft 	 * the block might still have existed in the cache (if it was read
    145  1.11  perseant 	 * or written earlier).	 If it did, make sure we don't count it as a
    146  1.11  perseant 	 * new block or zero out its contents.	If it did not, make sure
    147   1.1   mycroft 	 * we allocate any necessary indirect blocks.
    148   1.5      fvdl 	 * If we are writing a block beyond the end of the file, we need to
    149  1.11  perseant 	 * check if the old last block was a fragment.	If it was, we need
    150   1.5      fvdl 	 * to rewrite it.
    151   1.1   mycroft 	 */
    152  1.11  perseant 
    153  1.14      fvdl 	*ap->a_bpp = NULL;
    154   1.5      fvdl 	error = ufs_bmaparray(vp, lbn, &daddr, &indirs[0], &num, NULL );
    155   1.3  christos 	if (error)
    156   1.1   mycroft 		return (error);
    157  1.11  perseant 
    158   1.5      fvdl 	/* Check for block beyond end of file and fragment extension needed. */
    159   1.5      fvdl 	lastblock = lblkno(fs, ip->i_ffs_size);
    160   1.5      fvdl 	if (lastblock < NDADDR && lastblock < lbn) {
    161   1.5      fvdl 		osize = blksize(fs, ip, lastblock);
    162   1.5      fvdl 		if (osize < fs->lfs_bsize && osize > 0) {
    163   1.5      fvdl 			if ((error = lfs_fragextend(vp, osize, fs->lfs_bsize,
    164  1.11  perseant 						    lastblock, &bp)))
    165   1.5      fvdl 				return(error);
    166   1.5      fvdl 			ip->i_ffs_size = (lastblock + 1) * fs->lfs_bsize;
    167   1.7  drochner 			uvm_vnp_setsize(vp, ip->i_ffs_size);
    168   1.5      fvdl 			ip->i_flag |= IN_CHANGE | IN_UPDATE;
    169   1.5      fvdl 			VOP_BWRITE(bp);
    170   1.5      fvdl 		}
    171   1.5      fvdl 	}
    172  1.11  perseant 
    173   1.1   mycroft 	bb = VFSTOUFS(vp->v_mount)->um_seqinc;
    174   1.1   mycroft 	if (daddr == UNASSIGNED)
    175   1.1   mycroft 		/* May need to allocate indirect blocks */
    176   1.1   mycroft 		for (i = 1; i < num; ++i)
    177   1.1   mycroft 			if (!indirs[i].in_exists) {
    178   1.5      fvdl 				ibp = getblk(vp, indirs[i].in_lbn, fs->lfs_bsize,
    179  1.11  perseant 					     0, 0);
    180   1.5      fvdl 				if ((ibp->b_flags & (B_DONE | B_DELWRI)))
    181   1.1   mycroft 					panic ("Indirect block should not exist");
    182   1.5      fvdl 
    183   1.5      fvdl 				if (!ISSPACE(fs, bb, curproc->p_ucred)){
    184   1.5      fvdl 					ibp->b_flags |= B_INVAL;
    185   1.5      fvdl 					brelse(ibp);
    186   1.5      fvdl 					return(ENOSPC);
    187   1.5      fvdl 				} else {
    188   1.5      fvdl 					ip->i_ffs_blocks += bb;
    189   1.5      fvdl 					ip->i_lfs->lfs_bfree -= bb;
    190   1.5      fvdl 					clrbuf(ibp);
    191   1.5      fvdl 					if ((error = VOP_BWRITE(ibp)))
    192   1.5      fvdl 						return(error);
    193   1.5      fvdl 				}
    194   1.1   mycroft 			}
    195  1.11  perseant 
    196   1.5      fvdl 	/*
    197   1.5      fvdl 	 * If the block we are writing is a direct block, it's the last
    198   1.5      fvdl 	 * block in the file, and offset + iosize is less than a full
    199   1.5      fvdl 	 * block, we can write one or more fragments.  There are two cases:
    200   1.5      fvdl 	 * the block is brand new and we should allocate it the correct
    201   1.5      fvdl 	 * size or it already exists and contains some fragments and
    202   1.5      fvdl 	 * may need to extend it.
    203   1.5      fvdl 	 */
    204  1.11  perseant 	if (lbn < NDADDR && lblkno(fs, ip->i_ffs_size) <= lbn) {
    205  1.11  perseant 		osize = blksize(fs, ip, lbn);
    206   1.5      fvdl 		nsize = fragroundup(fs, offset + iosize);
    207   1.5      fvdl 		frags = numfrags(fs, nsize);
    208   1.5      fvdl 		bb = fragstodb(fs, frags);
    209  1.11  perseant 		if (lblktosize(fs, lbn) >= ip->i_ffs_size)
    210   1.5      fvdl 			/* Brand new block or fragment */
    211  1.14      fvdl 			*ap->a_bpp = bp = getblk(vp, lbn, nsize, 0, 0);
    212   1.5      fvdl 		else {
    213  1.11  perseant 			if (nsize <= osize) {
    214  1.11  perseant 				/* No need to extend */
    215  1.11  perseant 				/* XXX KS - Are we wasting space? */
    216  1.11  perseant 				if ((error = bread(vp, lbn, osize, NOCRED, &bp)))
    217  1.11  perseant 					return error;
    218  1.11  perseant 			} else {
    219  1.11  perseant 				/* Extend existing block */
    220  1.11  perseant 				if ((error =
    221  1.11  perseant 				     lfs_fragextend(vp, osize, nsize, lbn, &bp)))
    222  1.11  perseant 					return(error);
    223  1.11  perseant 			}
    224  1.14      fvdl 			*ap->a_bpp = bp;
    225   1.5      fvdl 		}
    226   1.5      fvdl 	} else {
    227   1.5      fvdl 		/*
    228   1.5      fvdl 		 * Get the existing block from the cache either because the
    229  1.11  perseant 		 * block 1) is not a direct block or 2) is not the last
    230   1.5      fvdl 		 * block in the file.
    231   1.5      fvdl 		 */
    232   1.5      fvdl 		frags = dbtofrags(fs, bb);
    233  1.14      fvdl 		*ap->a_bpp = bp = getblk(vp, lbn, blksize(fs, ip, lbn), 0, 0);
    234   1.1   mycroft 	}
    235  1.11  perseant 
    236   1.5      fvdl 	/*
    237   1.5      fvdl 	 * The block we are writing may be a brand new block
    238   1.5      fvdl 	 * in which case we need to do accounting (i.e. check
    239   1.5      fvdl 	 * for free space and update the inode number of blocks.
    240  1.15  perseant 	 *
    241  1.15  perseant 	 * We can tell a truly new block because (1) ufs_bmaparray
    242  1.15  perseant 	 * will say it is UNASSIGNED; and (2) it will not be marked
    243  1.15  perseant 	 * with B_DELWRI.  (It might be marked B_DONE, if it was
    244  1.15  perseant 	 * read into the cache before it existed on disk.)
    245   1.5      fvdl 	 */
    246  1.15  perseant 	if ((!(bp->b_flags & B_DELWRI)) && daddr == UNASSIGNED) {
    247  1.15  perseant 		if (!ISSPACE(fs, bb, curproc->p_ucred)) {
    248  1.15  perseant 			bp->b_flags |= B_INVAL;
    249  1.15  perseant 			brelse(bp);
    250  1.15  perseant 			return(ENOSPC);
    251  1.15  perseant 		} else {
    252  1.15  perseant 			ip->i_ffs_blocks += bb;
    253  1.15  perseant 			ip->i_lfs->lfs_bfree -= bb;
    254  1.15  perseant 			if (iosize != fs->lfs_bsize)
    255  1.15  perseant 				clrbuf(bp);
    256  1.15  perseant 		}
    257  1.15  perseant 	} else if (!(bp->b_flags & (B_DONE|B_DELWRI))) {
    258  1.15  perseant 		/*
    259  1.15  perseant 		 * Not a brand new block, also not in the cache;
    260  1.15  perseant 		 * read it in from disk.
    261  1.15  perseant 		 */
    262  1.15  perseant 		if (iosize == fs->lfs_bsize)
    263   1.5      fvdl 			/* Optimization: I/O is unnecessary. */
    264   1.5      fvdl 			bp->b_blkno = daddr;
    265  1.15  perseant 		else {
    266   1.5      fvdl 			/*
    267   1.5      fvdl 			 * We need to read the block to preserve the
    268   1.5      fvdl 			 * existing bytes.
    269   1.5      fvdl 			 */
    270   1.1   mycroft 			bp->b_blkno = daddr;
    271   1.1   mycroft 			bp->b_flags |= B_READ;
    272   1.1   mycroft 			VOP_STRATEGY(bp);
    273   1.1   mycroft 			return(biowait(bp));
    274   1.1   mycroft 		}
    275   1.1   mycroft 	}
    276  1.11  perseant 
    277   1.5      fvdl 	return (0);
    278   1.5      fvdl }
    279   1.5      fvdl 
    280   1.5      fvdl int
    281   1.5      fvdl lfs_fragextend(vp, osize, nsize, lbn, bpp)
    282   1.5      fvdl 	struct vnode *vp;
    283   1.5      fvdl 	int osize;
    284   1.5      fvdl 	int nsize;
    285   1.5      fvdl 	ufs_daddr_t lbn;
    286   1.5      fvdl 	struct buf **bpp;
    287   1.5      fvdl {
    288   1.5      fvdl 	struct inode *ip;
    289   1.5      fvdl 	struct lfs *fs;
    290   1.5      fvdl 	long bb;
    291   1.5      fvdl 	int error;
    292  1.11  perseant 	extern long locked_queue_bytes;
    293  1.13  perseant 	struct buf *ibp;
    294  1.13  perseant 	SEGUSE *sup;
    295   1.5      fvdl 
    296   1.5      fvdl 	ip = VTOI(vp);
    297   1.5      fvdl 	fs = ip->i_lfs;
    298  1.11  perseant 
    299   1.5      fvdl 	bb = (long)fragstodb(fs, numfrags(fs, nsize - osize));
    300  1.11  perseant  top:
    301   1.5      fvdl 	if (!ISSPACE(fs, bb, curproc->p_ucred)) {
    302   1.5      fvdl 		return(ENOSPC);
    303   1.5      fvdl 	}
    304   1.5      fvdl 	if ((error = bread(vp, lbn, osize, NOCRED, bpp))) {
    305   1.5      fvdl 		brelse(*bpp);
    306   1.5      fvdl 		return(error);
    307   1.5      fvdl 	}
    308  1.13  perseant 
    309  1.13  perseant 	/*
    310  1.13  perseant  	 * Fix the allocation for this fragment so that it looks like the
    311  1.13  perseant          * source segment contained a block of the new size.  This overcounts;
    312  1.13  perseant 	 * but the overcount only lasts until the block in question
    313  1.13  perseant 	 * is written, so the on-disk live bytes count is always correct.
    314  1.13  perseant 	 */
    315  1.13  perseant 	LFS_SEGENTRY(sup, fs, datosn(fs,(*bpp)->b_blkno), ibp);
    316  1.13  perseant 	sup->su_nbytes += (nsize-osize);
    317  1.13  perseant 	VOP_BWRITE(ibp);
    318  1.13  perseant 
    319   1.5      fvdl #ifdef QUOTA
    320   1.5      fvdl 	if ((error = chkdq(ip, bb, curproc->p_ucred, 0))) {
    321   1.5      fvdl 		brelse(*bpp);
    322   1.5      fvdl 		return (error);
    323   1.5      fvdl 	}
    324   1.5      fvdl #endif
    325  1.11  perseant 	/*
    326  1.11  perseant 	 * XXX - KS - Don't change size while we're gathered, as we could
    327  1.11  perseant 	 * then overlap another buffer in lfs_writeseg.
    328  1.11  perseant 	 */
    329  1.11  perseant 	if((*bpp)->b_flags & B_GATHERED) {
    330  1.11  perseant 		(*bpp)->b_flags |= B_NEEDCOMMIT; /* XXX KS - what flag to use? */
    331  1.11  perseant 		brelse(*bpp);
    332  1.11  perseant 		tsleep(*bpp, (PRIBIO+1), "lfs_fragextend", 0);
    333  1.11  perseant 		goto top;
    334  1.11  perseant 	}
    335   1.5      fvdl 	ip->i_ffs_blocks += bb;
    336   1.5      fvdl 	ip->i_flag |= IN_CHANGE | IN_UPDATE;
    337   1.5      fvdl 	fs->lfs_bfree -= fragstodb(fs, numfrags(fs, (nsize - osize)));
    338  1.11  perseant 	if((*bpp)->b_flags & B_LOCKED)
    339  1.11  perseant 		locked_queue_bytes += (nsize - osize);
    340   1.5      fvdl 	allocbuf(*bpp, nsize);
    341   1.5      fvdl 	bzero((char *)((*bpp)->b_data) + osize, (u_int)(nsize - osize));
    342  1.11  perseant 
    343   1.5      fvdl 	return(0);
    344   1.1   mycroft }
    345