Home | History | Annotate | Line # | Download | only in lfs
lfs_alloc.c revision 1.106.10.3
      1  1.106.10.3      yamt /*	$NetBSD: lfs_alloc.c,v 1.106.10.3 2010/03/11 15:04:44 yamt Exp $	*/
      2         1.2       cgd 
      3        1.17  perseant /*-
      4       1.100        ad  * Copyright (c) 1999, 2000, 2001, 2002, 2003, 2007 The NetBSD Foundation, Inc.
      5        1.17  perseant  * All rights reserved.
      6        1.17  perseant  *
      7        1.17  perseant  * This code is derived from software contributed to The NetBSD Foundation
      8        1.17  perseant  * by Konrad E. Schroder <perseant (at) hhhh.org>.
      9        1.17  perseant  *
     10        1.17  perseant  * Redistribution and use in source and binary forms, with or without
     11        1.17  perseant  * modification, are permitted provided that the following conditions
     12        1.17  perseant  * are met:
     13        1.17  perseant  * 1. Redistributions of source code must retain the above copyright
     14        1.17  perseant  *    notice, this list of conditions and the following disclaimer.
     15        1.17  perseant  * 2. Redistributions in binary form must reproduce the above copyright
     16        1.17  perseant  *    notice, this list of conditions and the following disclaimer in the
     17        1.17  perseant  *    documentation and/or other materials provided with the distribution.
     18        1.17  perseant  *
     19        1.17  perseant  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20        1.17  perseant  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21        1.17  perseant  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22        1.17  perseant  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23        1.17  perseant  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24        1.17  perseant  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25        1.17  perseant  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26        1.17  perseant  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27        1.17  perseant  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28        1.17  perseant  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29        1.17  perseant  * POSSIBILITY OF SUCH DAMAGE.
     30        1.17  perseant  */
     31         1.1   mycroft /*
     32         1.1   mycroft  * Copyright (c) 1991, 1993
     33         1.1   mycroft  *	The Regents of the University of California.  All rights reserved.
     34         1.1   mycroft  *
     35         1.1   mycroft  * Redistribution and use in source and binary forms, with or without
     36         1.1   mycroft  * modification, are permitted provided that the following conditions
     37         1.1   mycroft  * are met:
     38         1.1   mycroft  * 1. Redistributions of source code must retain the above copyright
     39         1.1   mycroft  *    notice, this list of conditions and the following disclaimer.
     40         1.1   mycroft  * 2. Redistributions in binary form must reproduce the above copyright
     41         1.1   mycroft  *    notice, this list of conditions and the following disclaimer in the
     42         1.1   mycroft  *    documentation and/or other materials provided with the distribution.
     43        1.71       agc  * 3. Neither the name of the University nor the names of its contributors
     44         1.1   mycroft  *    may be used to endorse or promote products derived from this software
     45         1.1   mycroft  *    without specific prior written permission.
     46         1.1   mycroft  *
     47         1.1   mycroft  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     48         1.1   mycroft  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     49         1.1   mycroft  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     50         1.1   mycroft  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     51         1.1   mycroft  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     52         1.1   mycroft  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     53         1.1   mycroft  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     54         1.1   mycroft  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     55         1.1   mycroft  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     56         1.1   mycroft  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     57         1.1   mycroft  * SUCH DAMAGE.
     58         1.1   mycroft  *
     59         1.2       cgd  *	@(#)lfs_alloc.c	8.4 (Berkeley) 1/4/94
     60         1.1   mycroft  */
     61        1.52     lukem 
     62        1.52     lukem #include <sys/cdefs.h>
     63  1.106.10.3      yamt __KERNEL_RCSID(0, "$NetBSD: lfs_alloc.c,v 1.106.10.3 2010/03/11 15:04:44 yamt Exp $");
     64        1.12    scottr 
     65        1.47       mrg #if defined(_KERNEL_OPT)
     66        1.12    scottr #include "opt_quota.h"
     67        1.13    scottr #endif
     68         1.1   mycroft 
     69         1.1   mycroft #include <sys/param.h>
     70         1.3  christos #include <sys/systm.h>
     71         1.1   mycroft #include <sys/kernel.h>
     72         1.1   mycroft #include <sys/buf.h>
     73        1.56  perseant #include <sys/lock.h>
     74         1.1   mycroft #include <sys/vnode.h>
     75         1.1   mycroft #include <sys/syslog.h>
     76         1.1   mycroft #include <sys/mount.h>
     77        1.87  perseant #include <sys/malloc.h>
     78        1.15   thorpej #include <sys/pool.h>
     79        1.50       chs #include <sys/proc.h>
     80        1.81  perseant #include <sys/tree.h>
     81        1.94      elad #include <sys/kauth.h>
     82         1.1   mycroft 
     83         1.1   mycroft #include <ufs/ufs/quota.h>
     84         1.1   mycroft #include <ufs/ufs/inode.h>
     85         1.1   mycroft #include <ufs/ufs/ufsmount.h>
     86         1.3  christos #include <ufs/ufs/ufs_extern.h>
     87         1.1   mycroft 
     88         1.1   mycroft #include <ufs/lfs/lfs.h>
     89         1.1   mycroft #include <ufs/lfs/lfs_extern.h>
     90         1.1   mycroft 
/*
 * Constants and helpers for the in-core inode free bitmap.
 *
 * Inode I is tracked by bit (I & BMMASK) of word (I >> BMSHIFT) of
 * (F)->lfs_ino_bitmap; a set bit means the inode is free.
 *
 * The single-bit masks are built from an unsigned constant (1U): with a
 * plain int 1, selecting bit 31 would left-shift into the sign bit, which
 * is undefined behaviour in C.
 *
 * All three macros evaluate their I argument more than once, so it must
 * not have side effects.
 */
#define BMSHIFT 5	/* 2 ** 5 = 32 */
#define BMMASK  ((1 << BMSHIFT) - 1)

/* Mark inode I as free in F's bitmap (and log it). */
#define SET_BITMAP_FREE(F, I) do { \
	DLOG((DLOG_ALLOC, "lfs: ino %d wrd %d bit %d set\n", (int)(I), 	\
	     (int)((I) >> BMSHIFT), (int)((I) & BMMASK)));		\
	(F)->lfs_ino_bitmap[(I) >> BMSHIFT] |= (1U << ((I) & BMMASK));	\
} while (0)

/* Mark inode I as in use in F's bitmap (and log it). */
#define CLR_BITMAP_FREE(F, I) do { \
	DLOG((DLOG_ALLOC, "lfs: ino %d wrd %d bit %d clr\n", (int)(I), 	\
	     (int)((I) >> BMSHIFT), (int)((I) & BMMASK)));		\
	(F)->lfs_ino_bitmap[(I) >> BMSHIFT] &= ~(1U << ((I) & BMMASK));	\
} while(0)

/* Nonzero iff inode I is marked free in F's bitmap. */
#define ISSET_BITMAP_FREE(F, I) \
	((F)->lfs_ino_bitmap[(I) >> BMSHIFT] & (1U << ((I) & BMMASK)))
    107        1.87  perseant 
    108        1.44  perseant /*
    109        1.65  perseant  * Add a new block to the Ifile, to accommodate future file creations.
    110        1.65  perseant  * Called with the segment lock held.
    111        1.56  perseant  */
    112        1.96  perseant int
    113        1.96  perseant lfs_extend_ifile(struct lfs *fs, kauth_cred_t cred)
    114        1.44  perseant {
    115        1.44  perseant 	struct vnode *vp;
    116        1.44  perseant 	struct inode *ip;
    117        1.44  perseant 	IFILE *ifp;
    118        1.48  perseant 	IFILE_V1 *ifp_v1;
    119        1.48  perseant 	struct buf *bp, *cbp;
    120        1.44  perseant 	int error;
    121        1.83  christos 	daddr_t i, blkno, xmax;
    122        1.87  perseant 	ino_t oldlast, maxino;
    123        1.48  perseant 	CLEANERINFO *cip;
    124        1.44  perseant 
    125        1.78  perseant 	ASSERT_SEGLOCK(fs);
    126        1.78  perseant 
    127        1.44  perseant 	vp = fs->lfs_ivnode;
    128        1.44  perseant 	ip = VTOI(vp);
    129        1.66      fvdl 	blkno = lblkno(fs, ip->i_size);
    130        1.85      yamt 	if ((error = lfs_balloc(vp, ip->i_size, fs->lfs_bsize, cred, 0,
    131        1.44  perseant 				&bp)) != 0) {
    132        1.44  perseant 		return (error);
    133        1.44  perseant 	}
    134        1.66      fvdl 	ip->i_size += fs->lfs_bsize;
    135        1.66      fvdl 	ip->i_ffs1_size = ip->i_size;
    136        1.66      fvdl 	uvm_vnp_setsize(vp, ip->i_size);
    137        1.75     perry 
    138        1.88  perseant 	maxino = ((ip->i_size >> fs->lfs_bshift) - fs->lfs_cleansz -
    139        1.88  perseant 		  fs->lfs_segtabsz) * fs->lfs_ifpb;
    140        1.88  perseant 	fs->lfs_ino_bitmap = (lfs_bm_t *)
    141        1.88  perseant 		realloc(fs->lfs_ino_bitmap, ((maxino + BMMASK) >> BMSHIFT) *
    142        1.88  perseant 			sizeof(lfs_bm_t), M_SEGMENT, M_WAITOK);
    143        1.88  perseant 	KASSERT(fs->lfs_ino_bitmap != NULL);
    144        1.87  perseant 
    145        1.44  perseant 	i = (blkno - fs->lfs_segtabsz - fs->lfs_cleansz) *
    146        1.44  perseant 		fs->lfs_ifpb;
    147        1.87  perseant 
    148        1.87  perseant 	/*
    149        1.87  perseant 	 * We insert the new inodes at the head of the free list.
    150        1.87  perseant 	 * Under normal circumstances, the free list is empty here,
    151        1.87  perseant 	 * so we are also incidentally placing them at the end (which
    152        1.87  perseant 	 * we must do if we are to keep them in order).
    153        1.87  perseant 	 */
    154        1.48  perseant 	LFS_GET_HEADFREE(fs, cip, cbp, &oldlast);
    155        1.48  perseant 	LFS_PUT_HEADFREE(fs, cip, cbp, i);
    156        1.44  perseant #ifdef DIAGNOSTIC
    157        1.63  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM)
    158        1.44  perseant 		panic("inode 0 allocated [2]");
    159        1.44  perseant #endif /* DIAGNOSTIC */
    160        1.83  christos 	xmax = i + fs->lfs_ifpb;
    161        1.48  perseant 
    162        1.53       chs 	if (fs->lfs_version == 1) {
    163        1.83  christos 		for (ifp_v1 = (IFILE_V1 *)bp->b_data; i < xmax; ++ifp_v1) {
    164        1.89  perseant 			SET_BITMAP_FREE(fs, i);
    165        1.48  perseant 			ifp_v1->if_version = 1;
    166        1.48  perseant 			ifp_v1->if_daddr = LFS_UNUSED_DADDR;
    167        1.48  perseant 			ifp_v1->if_nextfree = ++i;
    168        1.48  perseant 		}
    169        1.48  perseant 		ifp_v1--;
    170        1.48  perseant 		ifp_v1->if_nextfree = oldlast;
    171        1.48  perseant 	} else {
    172        1.83  christos 		for (ifp = (IFILE *)bp->b_data; i < xmax; ++ifp) {
    173        1.89  perseant 			SET_BITMAP_FREE(fs, i);
    174        1.48  perseant 			ifp->if_version = 1;
    175        1.48  perseant 			ifp->if_daddr = LFS_UNUSED_DADDR;
    176        1.48  perseant 			ifp->if_nextfree = ++i;
    177        1.48  perseant 		}
    178        1.48  perseant 		ifp--;
    179        1.48  perseant 		ifp->if_nextfree = oldlast;
    180        1.44  perseant 	}
    181        1.83  christos 	LFS_PUT_TAILFREE(fs, cip, cbp, xmax - 1);
    182        1.48  perseant 
    183        1.56  perseant 	(void) LFS_BWRITE_LOG(bp); /* Ifile */
    184        1.44  perseant 
    185        1.44  perseant 	return 0;
    186        1.44  perseant }
    187        1.44  perseant 
    188         1.1   mycroft /* Allocate a new inode. */
    189         1.1   mycroft /* ARGSUSED */
    190        1.43  perseant /* VOP_BWRITE 2i times */
    191         1.1   mycroft int
    192        1.99  christos lfs_valloc(struct vnode *pvp, int mode, kauth_cred_t cred,
    193        1.98  christos     struct vnode **vpp)
    194         1.3  christos {
    195         1.1   mycroft 	struct lfs *fs;
    196        1.48  perseant 	struct buf *bp, *cbp;
    197         1.1   mycroft 	struct ifile *ifp;
    198         1.1   mycroft 	ino_t new_ino;
    199         1.1   mycroft 	int error;
    200        1.36  perseant 	int new_gen;
    201        1.48  perseant 	CLEANERINFO *cip;
    202         1.1   mycroft 
    203        1.85      yamt 	fs = VTOI(pvp)->i_lfs;
    204        1.38  perseant 	if (fs->lfs_ronly)
    205        1.38  perseant 		return EROFS;
    206        1.75     perry 
    207        1.78  perseant 	ASSERT_NO_SEGLOCK(fs);
    208        1.78  perseant 
    209        1.56  perseant 	lfs_seglock(fs, SEGM_PROT);
    210        1.78  perseant 	vn_lock(fs->lfs_ivnode, LK_EXCLUSIVE);
    211        1.17  perseant 
    212         1.1   mycroft 	/* Get the head of the freelist. */
    213        1.48  perseant 	LFS_GET_HEADFREE(fs, cip, cbp, &new_ino);
    214        1.87  perseant 	KASSERT(new_ino != LFS_UNUSED_INUM && new_ino != LFS_IFILE_INUM);
    215        1.48  perseant 
    216        1.87  perseant 	DLOG((DLOG_ALLOC, "lfs_valloc: allocate inode %lld\n",
    217        1.87  perseant 	     (long long)new_ino));
    218        1.75     perry 
    219         1.1   mycroft 	/*
    220         1.1   mycroft 	 * Remove the inode from the free list and write the new start
    221         1.1   mycroft 	 * of the free list into the superblock.
    222         1.1   mycroft 	 */
    223        1.87  perseant 	CLR_BITMAP_FREE(fs, new_ino);
    224         1.1   mycroft 	LFS_IENTRY(ifp, fs, new_ino, bp);
    225         1.1   mycroft 	if (ifp->if_daddr != LFS_UNUSED_DADDR)
    226        1.84  christos 		panic("lfs_valloc: inuse inode %llu on the free list",
    227        1.84  christos 		    (unsigned long long)new_ino);
    228        1.48  perseant 	LFS_PUT_HEADFREE(fs, cip, cbp, ifp->if_nextfree);
    229        1.87  perseant 	DLOG((DLOG_ALLOC, "lfs_valloc: headfree %lld -> %lld\n",
    230        1.87  perseant 	     (long long)new_ino, (long long)ifp->if_nextfree));
    231        1.48  perseant 
    232        1.37  perseant 	new_gen = ifp->if_version; /* version was updated by vfree */
    233       1.102        ad 	brelse(bp, 0);
    234        1.30  perseant 
    235         1.1   mycroft 	/* Extend IFILE so that the next lfs_valloc will succeed. */
    236        1.63  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM) {
    237        1.96  perseant 		if ((error = lfs_extend_ifile(fs, cred)) != 0) {
    238        1.48  perseant 			LFS_PUT_HEADFREE(fs, cip, cbp, new_ino);
    239        1.78  perseant 			VOP_UNLOCK(fs->lfs_ivnode, 0);
    240        1.56  perseant 			lfs_segunlock(fs);
    241        1.44  perseant 			return error;
    242         1.1   mycroft 		}
    243         1.1   mycroft 	}
    244        1.17  perseant #ifdef DIAGNOSTIC
    245        1.63  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM)
    246        1.17  perseant 		panic("inode 0 allocated [3]");
    247        1.17  perseant #endif /* DIAGNOSTIC */
    248        1.48  perseant 
    249        1.78  perseant 	/* Set superblock modified bit and increment file count. */
    250       1.105        ad 	mutex_enter(&lfs_lock);
    251        1.78  perseant 	fs->lfs_fmod = 1;
    252       1.105        ad 	mutex_exit(&lfs_lock);
    253        1.78  perseant 	++fs->lfs_nfiles;
    254        1.78  perseant 
    255        1.78  perseant 	VOP_UNLOCK(fs->lfs_ivnode, 0);
    256        1.56  perseant 	lfs_segunlock(fs);
    257        1.63  perseant 
    258        1.85      yamt 	return lfs_ialloc(fs, pvp, new_ino, new_gen, vpp);
    259        1.44  perseant }
    260        1.44  perseant 
    261        1.65  perseant /*
    262        1.65  perseant  * Finish allocating a new inode, given an inode and generation number.
    263        1.65  perseant  */
    264        1.96  perseant int
    265        1.44  perseant lfs_ialloc(struct lfs *fs, struct vnode *pvp, ino_t new_ino, int new_gen,
    266        1.44  perseant 	   struct vnode **vpp)
    267        1.44  perseant {
    268        1.44  perseant 	struct inode *ip;
    269        1.44  perseant 	struct vnode *vp;
    270        1.40      fvdl 
    271        1.78  perseant 	ASSERT_NO_SEGLOCK(fs);
    272        1.78  perseant 
    273        1.77  perseant 	vp = *vpp;
    274       1.100        ad 	mutex_enter(&ufs_hashlock);
    275        1.40      fvdl 	/* Create an inode to associate with the vnode. */
    276        1.44  perseant 	lfs_vcreate(pvp->v_mount, new_ino, vp);
    277        1.51       chs 
    278         1.1   mycroft 	ip = VTOI(vp);
    279       1.105        ad 	mutex_enter(&lfs_lock);
    280        1.73   mycroft 	LFS_SET_UINO(ip, IN_CHANGE);
    281       1.105        ad 	mutex_exit(&lfs_lock);
    282        1.66      fvdl 	/* on-disk structure has been zeroed out by lfs_vcreate */
    283        1.66      fvdl 	ip->i_din.ffs1_din->di_inumber = new_ino;
    284        1.51       chs 
    285        1.79  perseant 	/* Note no blocks yet */
    286        1.79  perseant 	ip->i_lfs_hiblk = -1;
    287        1.79  perseant 
    288         1.1   mycroft 	/* Set a new generation number for this inode. */
    289        1.66      fvdl 	if (new_gen) {
    290        1.66      fvdl 		ip->i_gen = new_gen;
    291        1.66      fvdl 		ip->i_ffs1_gen = new_gen;
    292        1.66      fvdl 	}
    293        1.51       chs 
    294         1.1   mycroft 	/* Insert into the inode hash table. */
    295         1.1   mycroft 	ufs_ihashins(ip);
    296       1.100        ad 	mutex_exit(&ufs_hashlock);
    297        1.44  perseant 
    298        1.77  perseant 	ufs_vinit(vp->v_mount, lfs_specop_p, lfs_fifoop_p, vpp);
    299        1.77  perseant 	vp = *vpp;
    300        1.44  perseant 	ip = VTOI(vp);
    301        1.57      yamt 
    302        1.57      yamt 	memset(ip->i_lfs_fragsize, 0, NDADDR * sizeof(*ip->i_lfs_fragsize));
    303        1.51       chs 
    304        1.51       chs 	uvm_vnp_setsize(vp, 0);
    305        1.72      yamt 	lfs_mark_vnode(vp);
    306        1.54       chs 	genfs_node_init(vp, &lfs_genfsops);
    307  1.106.10.3      yamt 	vref(ip->i_devvp);
    308         1.1   mycroft 	return (0);
    309         1.1   mycroft }
    310         1.1   mycroft 
    311         1.1   mycroft /* Create a new vnode/inode pair and initialize what fields we can. */
    312        1.40      fvdl void
    313        1.48  perseant lfs_vcreate(struct mount *mp, ino_t ino, struct vnode *vp)
    314         1.1   mycroft {
    315         1.1   mycroft 	struct inode *ip;
    316        1.66      fvdl 	struct ufs1_dinode *dp;
    317         1.1   mycroft 	struct ufsmount *ump;
    318        1.75     perry 
    319         1.1   mycroft 	/* Get a pointer to the private mount structure. */
    320         1.1   mycroft 	ump = VFSTOUFS(mp);
    321        1.75     perry 
    322        1.78  perseant 	ASSERT_NO_SEGLOCK(ump->um_lfs);
    323        1.78  perseant 
    324         1.1   mycroft 	/* Initialize the inode. */
    325        1.15   thorpej 	ip = pool_get(&lfs_inode_pool, PR_WAITOK);
    326        1.66      fvdl 	memset(ip, 0, sizeof(*ip));
    327        1.66      fvdl 	dp = pool_get(&lfs_dinode_pool, PR_WAITOK);
    328        1.66      fvdl 	memset(dp, 0, sizeof(*dp));
    329        1.63  perseant 	ip->inode_ext.lfs = pool_get(&lfs_inoext_pool, PR_WAITOK);
    330        1.74  perseant 	memset(ip->inode_ext.lfs, 0, sizeof(*ip->inode_ext.lfs));
    331        1.40      fvdl 	vp->v_data = ip;
    332        1.66      fvdl 	ip->i_din.ffs1_din = dp;
    333        1.66      fvdl 	ip->i_ump = ump;
    334        1.40      fvdl 	ip->i_vnode = vp;
    335         1.1   mycroft 	ip->i_devvp = ump->um_devvp;
    336         1.1   mycroft 	ip->i_dev = ump->um_dev;
    337        1.66      fvdl 	ip->i_number = dp->di_inumber = ino;
    338         1.1   mycroft 	ip->i_lfs = ump->um_lfs;
    339        1.66      fvdl 	ip->i_lfs_effnblks = 0;
    340        1.81  perseant 	SPLAY_INIT(&ip->i_lfs_lbtree);
    341        1.82  perseant 	ip->i_lfs_nbtree = 0;
    342        1.91  perseant 	LIST_INIT(&ip->i_lfs_segdhd);
    343         1.1   mycroft #ifdef QUOTA
    344       1.101   hannken 	ufsquota_init(ip);
    345         1.1   mycroft #endif
    346         1.1   mycroft }
    347         1.1   mycroft 
#if 0
/*
 * Return the highest-numbered inode that is not marked free in the
 * bitmap, scanning downward from the last inode the Ifile can describe.
 * Returns LFS_UNUSED_INUM if every inode above it is free.
 * Intended for shrinking the Ifile; currently compiled out.
 */
static inline ino_t
lfs_last_alloc_ino(struct lfs *fs)
{
	ino_t cand, maxino;

	maxino = ((fs->lfs_ivnode->v_size >> fs->lfs_bshift) -
		  fs->lfs_cleansz - fs->lfs_segtabsz) * fs->lfs_ifpb;

	cand = maxino - 1;
	while (cand > LFS_UNUSED_INUM && ISSET_BITMAP_FREE(fs, cand) != 0)
		--cand;

	return cand;
}
#endif
    367        1.87  perseant 
    368        1.87  perseant /*
    369        1.87  perseant  * Find the previous (next lowest numbered) free inode, if any.
    370        1.87  perseant  * If there is none, return LFS_UNUSED_INUM.
    371        1.87  perseant  */
    372        1.87  perseant static inline ino_t
    373        1.87  perseant lfs_freelist_prev(struct lfs *fs, ino_t ino)
    374        1.87  perseant {
    375        1.88  perseant 	ino_t tino, bound, bb, freehdbb;
    376        1.88  perseant 
    377        1.88  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM)	 /* No free inodes at all */
    378        1.88  perseant 		return LFS_UNUSED_INUM;
    379        1.88  perseant 
    380        1.88  perseant 	/* Search our own word first */
    381        1.88  perseant 	bound = ino & ~BMMASK;
    382        1.89  perseant 	for (tino = ino - 1; tino >= bound && tino > LFS_UNUSED_INUM; tino--)
    383        1.88  perseant 		if (ISSET_BITMAP_FREE(fs, tino))
    384        1.88  perseant 			return tino;
    385        1.88  perseant 	/* If there are no lower words to search, just return */
    386        1.88  perseant 	if (ino >> BMSHIFT == 0)
    387        1.88  perseant 		return LFS_UNUSED_INUM;
    388        1.88  perseant 
    389        1.88  perseant 	/*
    390        1.88  perseant 	 * Find a word with a free inode in it.  We have to be a bit
    391        1.88  perseant 	 * careful here since ino_t is unsigned.
    392        1.88  perseant 	 */
    393        1.88  perseant 	freehdbb = (fs->lfs_freehd >> BMSHIFT);
    394        1.88  perseant 	for (bb = (ino >> BMSHIFT) - 1; bb >= freehdbb && bb > 0; --bb)
    395        1.88  perseant 		if (fs->lfs_ino_bitmap[bb])
    396        1.88  perseant 			break;
    397        1.88  perseant 	if (fs->lfs_ino_bitmap[bb] == 0)
    398        1.88  perseant 		return LFS_UNUSED_INUM;
    399        1.88  perseant 
    400        1.88  perseant 	/* Search the word we found */
    401        1.89  perseant 	for (tino = (bb << BMSHIFT) | BMMASK; tino >= (bb << BMSHIFT) &&
    402        1.89  perseant 	     tino > LFS_UNUSED_INUM; tino--)
    403        1.88  perseant 		if (ISSET_BITMAP_FREE(fs, tino))
    404        1.88  perseant 			break;
    405        1.87  perseant 
    406        1.87  perseant 	if (tino <= LFS_IFILE_INUM)
    407        1.87  perseant 		tino = LFS_UNUSED_INUM;
    408        1.87  perseant 
    409        1.87  perseant 	return tino;
    410        1.87  perseant }
    411        1.87  perseant 
    412         1.1   mycroft /* Free an inode. */
    413         1.1   mycroft /* ARGSUSED */
    414        1.43  perseant /* VOP_BWRITE 2i times */
    415         1.1   mycroft int
    416        1.99  christos lfs_vfree(struct vnode *vp, ino_t ino, int mode)
    417         1.3  christos {
    418         1.1   mycroft 	SEGUSE *sup;
    419        1.48  perseant 	CLEANERINFO *cip;
    420        1.48  perseant 	struct buf *cbp, *bp;
    421         1.1   mycroft 	struct ifile *ifp;
    422         1.1   mycroft 	struct inode *ip;
    423         1.1   mycroft 	struct lfs *fs;
    424        1.59      fvdl 	daddr_t old_iaddr;
    425        1.85      yamt 	ino_t otail;
    426        1.75     perry 
    427         1.1   mycroft 	/* Get the inode number and file system. */
    428        1.30  perseant 	ip = VTOI(vp);
    429         1.1   mycroft 	fs = ip->i_lfs;
    430         1.1   mycroft 	ino = ip->i_number;
    431        1.34  perseant 
    432        1.78  perseant 	ASSERT_NO_SEGLOCK(fs);
    433        1.88  perseant 	DLOG((DLOG_ALLOC, "lfs_vfree: free ino %lld\n", (long long)ino));
    434        1.78  perseant 
    435        1.48  perseant 	/* Drain of pending writes */
    436       1.105        ad 	mutex_enter(&vp->v_interlock);
    437       1.105        ad 	while (fs->lfs_version > 1 && WRITEINPROG(vp)) {
    438       1.105        ad 		cv_wait(&vp->v_cv, &vp->v_interlock);
    439       1.105        ad 	}
    440       1.105        ad 	mutex_exit(&vp->v_interlock);
    441        1.48  perseant 
    442        1.63  perseant 	lfs_seglock(fs, SEGM_PROT);
    443        1.78  perseant 	vn_lock(fs->lfs_ivnode, LK_EXCLUSIVE);
    444        1.75     perry 
    445        1.72      yamt 	lfs_unmark_vnode(vp);
    446       1.105        ad 	mutex_enter(&lfs_lock);
    447       1.103        ad 	if (vp->v_uflag & VU_DIROP) {
    448       1.103        ad 		vp->v_uflag &= ~VU_DIROP;
    449        1.30  perseant 		--lfs_dirvcount;
    450        1.92  perseant 		--fs->lfs_dirvcount;
    451        1.63  perseant 		TAILQ_REMOVE(&fs->lfs_dchainhd, ip, i_lfs_dchain);
    452        1.92  perseant 		wakeup(&fs->lfs_dirvcount);
    453        1.30  perseant 		wakeup(&lfs_dirvcount);
    454       1.105        ad 		mutex_exit(&lfs_lock);
    455        1.30  perseant 		lfs_vunref(vp);
    456        1.90  perseant 
    457        1.90  perseant 		/*
    458        1.90  perseant 		 * If this inode is not going to be written any more, any
    459        1.90  perseant 		 * segment accounting left over from its truncation needs
    460        1.90  perseant 		 * to occur at the end of the next dirops flush.  Attach
    461        1.90  perseant 		 * them to the fs-wide list for that purpose.
    462        1.90  perseant 		 */
    463        1.90  perseant 		if (LIST_FIRST(&ip->i_lfs_segdhd) != NULL) {
    464        1.90  perseant 			struct segdelta *sd;
    465        1.90  perseant 
    466        1.90  perseant 			while((sd = LIST_FIRST(&ip->i_lfs_segdhd)) != NULL) {
    467        1.90  perseant 				LIST_REMOVE(sd, list);
    468        1.90  perseant 				LIST_INSERT_HEAD(&fs->lfs_segdhd, sd, list);
    469        1.90  perseant 			}
    470        1.90  perseant 		}
    471        1.90  perseant 	} else {
    472        1.90  perseant 		/*
    473        1.90  perseant 		 * If it's not a dirop, we can finalize right away.
    474        1.90  perseant 		 */
    475       1.105        ad 		mutex_exit(&lfs_lock);
    476        1.90  perseant 		lfs_finalize_ino_seguse(fs, ip);
    477        1.38  perseant 	}
    478        1.30  perseant 
    479       1.105        ad 	mutex_enter(&lfs_lock);
    480        1.42  perseant 	LFS_CLR_UINO(ip, IN_ACCESSED|IN_CLEANING|IN_MODIFIED);
    481       1.105        ad 	mutex_exit(&lfs_lock);
    482        1.33  perseant 	ip->i_flag &= ~IN_ALLMOD;
    483        1.93  perseant 	ip->i_lfs_iflags |= LFSI_DELETED;
    484        1.93  perseant 
    485         1.1   mycroft 	/*
    486         1.1   mycroft 	 * Set the ifile's inode entry to unused, increment its version number
    487        1.48  perseant 	 * and link it onto the free chain.
    488         1.1   mycroft 	 */
    489        1.87  perseant 	SET_BITMAP_FREE(fs, ino);
    490         1.1   mycroft 	LFS_IENTRY(ifp, fs, ino, bp);
    491         1.1   mycroft 	old_iaddr = ifp->if_daddr;
    492         1.1   mycroft 	ifp->if_daddr = LFS_UNUSED_DADDR;
    493         1.1   mycroft 	++ifp->if_version;
    494        1.48  perseant 	if (fs->lfs_version == 1) {
    495        1.48  perseant 		LFS_GET_HEADFREE(fs, cip, cbp, &(ifp->if_nextfree));
    496        1.48  perseant 		LFS_PUT_HEADFREE(fs, cip, cbp, ino);
    497        1.56  perseant 		(void) LFS_BWRITE_LOG(bp); /* Ifile */
    498        1.48  perseant 	} else {
    499        1.87  perseant 		ino_t tino, onf;
    500        1.87  perseant 
    501        1.48  perseant 		ifp->if_nextfree = LFS_UNUSED_INUM;
    502        1.56  perseant 		(void) LFS_BWRITE_LOG(bp); /* Ifile */
    503        1.87  perseant 
    504        1.87  perseant 		tino = lfs_freelist_prev(fs, ino);
    505        1.87  perseant 		if (tino == LFS_UNUSED_INUM) {
    506        1.87  perseant 			/* Nothing free below us, put us on the head */
    507        1.87  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    508        1.87  perseant 			LFS_GET_HEADFREE(fs, cip, cbp, &(ifp->if_nextfree));
    509        1.87  perseant 			LFS_PUT_HEADFREE(fs, cip, cbp, ino);
    510        1.88  perseant 			DLOG((DLOG_ALLOC, "lfs_vfree: headfree %lld -> %lld\n",
    511        1.87  perseant 			     (long long)ifp->if_nextfree, (long long)ino));
    512        1.87  perseant 			LFS_BWRITE_LOG(bp); /* Ifile */
    513        1.87  perseant 
    514        1.87  perseant 			/* If the list was empty, set tail too */
    515        1.87  perseant 			LFS_GET_TAILFREE(fs, cip, cbp, &otail);
    516        1.87  perseant 			if (otail == LFS_UNUSED_INUM) {
    517        1.87  perseant 				LFS_PUT_TAILFREE(fs, cip, cbp, ino);
    518        1.87  perseant 				DLOG((DLOG_ALLOC, "lfs_vfree: tailfree %lld "
    519        1.87  perseant 				      "-> %lld\n", (long long)otail,
    520        1.87  perseant 				      (long long)ino));
    521        1.87  perseant 			}
    522        1.87  perseant 		} else {
    523        1.87  perseant 			/*
    524        1.87  perseant 			 * Insert this inode into the list after tino.
    525        1.87  perseant 			 * We hold the segment lock so we don't have to
    526        1.87  perseant 			 * worry about blocks being written out of order.
    527        1.87  perseant 			 */
    528        1.87  perseant 			DLOG((DLOG_ALLOC, "lfs_vfree: insert ino %lld "
    529        1.87  perseant 			      " after %lld\n", ino, tino));
    530        1.87  perseant 
    531        1.87  perseant 			LFS_IENTRY(ifp, fs, tino, bp);
    532        1.87  perseant 			onf = ifp->if_nextfree;
    533        1.87  perseant 			ifp->if_nextfree = ino;
    534        1.87  perseant 			LFS_BWRITE_LOG(bp);	/* Ifile */
    535        1.87  perseant 
    536        1.87  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    537        1.87  perseant 			ifp->if_nextfree = onf;
    538        1.87  perseant 			LFS_BWRITE_LOG(bp);	/* Ifile */
    539        1.87  perseant 
    540        1.87  perseant 			/* If we're last, put us on the tail */
    541        1.87  perseant 			if (onf == LFS_UNUSED_INUM) {
    542        1.87  perseant 				LFS_GET_TAILFREE(fs, cip, cbp, &otail);
    543        1.87  perseant 				LFS_PUT_TAILFREE(fs, cip, cbp, ino);
    544        1.87  perseant 				DLOG((DLOG_ALLOC, "lfs_vfree: tailfree %lld "
    545        1.87  perseant 				      "-> %lld\n", (long long)otail,
    546        1.87  perseant 				      (long long)ino));
    547        1.87  perseant 			}
    548        1.87  perseant 		}
    549        1.48  perseant 	}
    550        1.17  perseant #ifdef DIAGNOSTIC
    551        1.53       chs 	if (ino == LFS_UNUSED_INUM) {
    552        1.17  perseant 		panic("inode 0 freed");
    553        1.17  perseant 	}
    554        1.17  perseant #endif /* DIAGNOSTIC */
    555         1.1   mycroft 	if (old_iaddr != LFS_UNUSED_DADDR) {
    556        1.48  perseant 		LFS_SEGENTRY(sup, fs, dtosn(fs, old_iaddr), bp);
    557        1.22  perseant #ifdef DIAGNOSTIC
    558        1.66      fvdl 		if (sup->su_nbytes < sizeof (struct ufs1_dinode)) {
    559        1.43  perseant 			printf("lfs_vfree: negative byte count"
    560        1.62      yamt 			       " (segment %" PRIu32 " short by %d)\n",
    561        1.48  perseant 			       dtosn(fs, old_iaddr),
    562        1.66      fvdl 			       (int)sizeof (struct ufs1_dinode) -
    563        1.66      fvdl 				    sup->su_nbytes);
    564        1.22  perseant 			panic("lfs_vfree: negative byte count");
    565        1.66      fvdl 			sup->su_nbytes = sizeof (struct ufs1_dinode);
    566        1.17  perseant 		}
    567        1.22  perseant #endif
    568        1.66      fvdl 		sup->su_nbytes -= sizeof (struct ufs1_dinode);
    569        1.63  perseant 		LFS_WRITESEGENTRY(sup, fs, dtosn(fs, old_iaddr), bp); /* Ifile */
    570         1.1   mycroft 	}
    571        1.75     perry 
    572         1.1   mycroft 	/* Set superblock modified bit and decrement file count. */
    573       1.105        ad 	mutex_enter(&lfs_lock);
    574         1.1   mycroft 	fs->lfs_fmod = 1;
    575       1.105        ad 	mutex_exit(&lfs_lock);
    576         1.1   mycroft 	--fs->lfs_nfiles;
    577        1.75     perry 
    578        1.78  perseant 	VOP_UNLOCK(fs->lfs_ivnode, 0);
    579        1.56  perseant 	lfs_segunlock(fs);
    580        1.63  perseant 
    581         1.1   mycroft 	return (0);
    582         1.1   mycroft }
    583        1.87  perseant 
    584        1.87  perseant /*
    585        1.87  perseant  * Sort the freelist and set up the free-inode bitmap.
    586        1.87  perseant  * To be called by lfs_mountfs().
                               *
                               * Asserts that the segment lock is not already held, then holds it
                               * (SEGM_PROT) for the whole pass and drops it before returning.
                               *
                               * Every ifile entry from inode 0 up to (but not including) maxino is
                               * visited in ascending order.  Inode LFS_UNUSED_INUM and the ifile's
                               * own inode are skipped.  Entries whose if_daddr is LFS_UNUSED_DADDR
                               * are linked through if_nextfree in that order and passed to
                               * SET_BITMAP_FREE(); the first and last such inodes are stored as the
                               * free-list head and tail.  If none is found, both head and tail are
                               * set to LFS_UNUSED_INUM.
                               *
                               * NOTE(review): the if_nextfree of the final free entry is not
                               * rewritten here; it keeps whatever value was already in the ifile.
                               * Confirm that this is always LFS_UNUSED_INUM or otherwise harmless.
    587        1.87  perseant  */
    588        1.87  perseant void
    589        1.87  perseant lfs_order_freelist(struct lfs *fs)
    590        1.87  perseant {
                              	/* Never assigned here; presumably set inside LFS_PUT_*FREE -- confirm. */
    591        1.87  perseant 	CLEANERINFO *cip;
    592        1.87  perseant 	IFILE *ifp = NULL;
    593        1.87  perseant 	struct buf *bp;
                              	/* firstino/lastino: lowest and most recent free inode seen so far. */
    594        1.87  perseant 	ino_t ino, firstino, lastino, maxino;
    595        1.97  perseant #ifdef notyet
    596        1.97  perseant 	struct vnode *vp;
    597        1.97  perseant #endif
    598        1.87  perseant 
    599        1.95  perseant 	ASSERT_NO_SEGLOCK(fs);
    600        1.95  perseant 	lfs_seglock(fs, SEGM_PROT);
    601        1.95  perseant 
                              	/*
                              	 * Ifile size in blocks, less lfs_cleansz and lfs_segtabsz blocks
                              	 * (presumably the cleaner-info and segment-table areas), times
                              	 * lfs_ifpb entries per block.  maxino is therefore always a
                              	 * multiple of lfs_ifpb.
                              	 */
    602        1.87  perseant 	maxino = ((fs->lfs_ivnode->v_size >> fs->lfs_bshift) -
    603        1.87  perseant 		  fs->lfs_cleansz - fs->lfs_segtabsz) * fs->lfs_ifpb;
                              	/*
                              	 * Zero-filled bitmap, sized by rounding maxino up to a whole
                              	 * number of lfs_bm_t words.  Allocated with M_WAITOK, so the
                              	 * KASSERT below is presumably just a sanity check.
                              	 */
    604        1.88  perseant 	fs->lfs_ino_bitmap = (lfs_bm_t *)
    605        1.88  perseant 		malloc(((maxino + BMMASK) >> BMSHIFT) * sizeof(lfs_bm_t),
    606        1.88  perseant 		       M_SEGMENT, M_WAITOK | M_ZERO);
    607        1.88  perseant 	KASSERT(fs->lfs_ino_bitmap != NULL);
    608        1.87  perseant 
    609        1.87  perseant 	firstino = lastino = LFS_UNUSED_INUM;
    610        1.87  perseant 	for (ino = 0; ino < maxino; ino++) {
                              		/*
                              		 * On the first entry of each ifile block fetch that block;
                              		 * otherwise step to the next entry in the buffer already held.
                              		 */
    611        1.87  perseant 		if (ino % fs->lfs_ifpb == 0)
    612        1.87  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    613        1.87  perseant 		else
    614        1.87  perseant 			++ifp;
    615        1.87  perseant 
    616        1.87  perseant 		/* Don't put zero or ifile on the free list */
                              		/*
                              		 * NOTE(review): this continue also bypasses the end-of-block
                              		 * brelse() at the bottom of the loop, so it relies on neither
                              		 * of these inodes being the last entry of an ifile block.
                              		 */
    617        1.87  perseant 		if (ino == LFS_UNUSED_INUM || ino == LFS_IFILE_INUM)
    618        1.87  perseant 			continue;
    619        1.87  perseant 
    620        1.97  perseant #ifdef notyet
                              		/*
                              		 * NOTE(review): disabled code.  It uses `sup', which is not
                              		 * declared in this function, so it would not compile as-is
                              		 * if notyet were defined.
                              		 */
    621        1.97  perseant 		/* Address orphaned files */
    622        1.97  perseant 		if (ifp->if_nextfree == LFS_ORPHAN_NEXTFREE &&
    623        1.97  perseant 		    VFS_VGET(fs->lfs_ivnode->v_mount, ino, &vp) == 0) {
    624       1.104        he 			lfs_truncate(vp, 0, 0, NOCRED);
    625        1.97  perseant 			vput(vp);
    626        1.97  perseant 			LFS_SEGENTRY(sup, fs, dtosn(fs, ifp->if_daddr), bp);
    627        1.97  perseant 			KASSERT(sup->su_nbytes >= DINODE1_SIZE);
    628        1.97  perseant 			sup->su_nbytes -= DINODE1_SIZE;
    629        1.97  perseant 			LFS_WRITESEGENTRY(sup, fs, dtosn(fs, ifp->if_daddr), bp);
    630        1.97  perseant 
    631        1.97  perseant 			/* Set up to fall through to next section */
    632        1.97  perseant 			ifp->if_daddr = LFS_UNUSED_DADDR;
    633        1.97  perseant 			LFS_BWRITE_LOG(bp);
    634        1.97  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    635        1.97  perseant 		}
    636        1.97  perseant #endif
    637        1.97  perseant 
                              		/* An entry with no disk address is treated as a free inode. */
    638        1.87  perseant 		if (ifp->if_daddr == LFS_UNUSED_DADDR) {
    639        1.87  perseant 			if (firstino == LFS_UNUSED_INUM)
    640        1.87  perseant 				firstino = ino;
    641        1.87  perseant 			else {
                              				/*
                              				 * Append to the chain: drop the buffer held
                              				 * for ino, point the previous free entry at
                              				 * ino and write it, then fetch ino's entry
                              				 * again so ifp/bp are usable for the rest of
                              				 * this iteration and the following ones.
                              				 */
    642       1.102        ad 				brelse(bp, 0);
    643        1.87  perseant 
    644        1.87  perseant 				LFS_IENTRY(ifp, fs, lastino, bp);
    645        1.87  perseant 				ifp->if_nextfree = ino;
    646        1.87  perseant 				LFS_BWRITE_LOG(bp);
    647        1.87  perseant 
    648        1.87  perseant 				LFS_IENTRY(ifp, fs, ino, bp);
    649        1.87  perseant 			}
    650        1.87  perseant 			lastino = ino;
    651        1.87  perseant 
    652        1.87  perseant 			SET_BITMAP_FREE(fs, ino);
    653        1.87  perseant 		}
    654        1.87  perseant 
                              		/* Last entry of this ifile block: release the buffer. */
    655        1.87  perseant 		if ((ino + 1) % fs->lfs_ifpb == 0)
    656       1.102        ad 			brelse(bp, 0);
    657        1.87  perseant 	}
    658        1.87  perseant 
                              	/* Record the ends of the rebuilt list (LFS_UNUSED_INUM if empty). */
    659        1.87  perseant 	LFS_PUT_HEADFREE(fs, cip, bp, firstino);
    660        1.87  perseant 	LFS_PUT_TAILFREE(fs, cip, bp, lastino);
    661        1.95  perseant 
    662        1.95  perseant 	lfs_segunlock(fs);
    663        1.87  perseant }
    664        1.97  perseant 
                              /*
                               * Mark inode `ino' as orphaned in the ifile: fetch its entry, set
                               * if_nextfree to LFS_ORPHAN_NEXTFREE, and hand the buffer to
                               * LFS_BWRITE_LOG().  The disabled (#ifdef notyet) code in
                               * lfs_order_freelist() tests for this same marker value.
                               *
                               * No lock is taken here and no result is returned.
                               * NOTE(review): presumably the caller holds whatever lock protects the
                               * ifile -- confirm against the call sites.
                               */
    665        1.97  perseant void
    666        1.97  perseant lfs_orphan(struct lfs *fs, ino_t ino)
    667        1.97  perseant {
    668        1.97  perseant 	IFILE *ifp;
    669        1.97  perseant 	struct buf *bp;
    670        1.97  perseant 
    671        1.97  perseant 	LFS_IENTRY(ifp, fs, ino, bp);
    672        1.97  perseant 	ifp->if_nextfree = LFS_ORPHAN_NEXTFREE;
    673        1.97  perseant 	LFS_BWRITE_LOG(bp);
    674        1.97  perseant }
    675