Home | History | Annotate | Line # | Download | only in lfs
lfs_alloc.c revision 1.111
      1  1.111     rmind /*	$NetBSD: lfs_alloc.c,v 1.111 2011/06/12 03:36:01 rmind Exp $	*/
      2    1.2       cgd 
      3   1.17  perseant /*-
      4  1.100        ad  * Copyright (c) 1999, 2000, 2001, 2002, 2003, 2007 The NetBSD Foundation, Inc.
      5   1.17  perseant  * All rights reserved.
      6   1.17  perseant  *
      7   1.17  perseant  * This code is derived from software contributed to The NetBSD Foundation
      8   1.17  perseant  * by Konrad E. Schroder <perseant (at) hhhh.org>.
      9   1.17  perseant  *
     10   1.17  perseant  * Redistribution and use in source and binary forms, with or without
     11   1.17  perseant  * modification, are permitted provided that the following conditions
     12   1.17  perseant  * are met:
     13   1.17  perseant  * 1. Redistributions of source code must retain the above copyright
     14   1.17  perseant  *    notice, this list of conditions and the following disclaimer.
     15   1.17  perseant  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.17  perseant  *    notice, this list of conditions and the following disclaimer in the
     17   1.17  perseant  *    documentation and/or other materials provided with the distribution.
     18   1.17  perseant  *
     19   1.17  perseant  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.17  perseant  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.17  perseant  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.17  perseant  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.17  perseant  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.17  perseant  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.17  perseant  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.17  perseant  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.17  perseant  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.17  perseant  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.17  perseant  * POSSIBILITY OF SUCH DAMAGE.
     30   1.17  perseant  */
     31    1.1   mycroft /*
     32    1.1   mycroft  * Copyright (c) 1991, 1993
     33    1.1   mycroft  *	The Regents of the University of California.  All rights reserved.
     34    1.1   mycroft  *
     35    1.1   mycroft  * Redistribution and use in source and binary forms, with or without
     36    1.1   mycroft  * modification, are permitted provided that the following conditions
     37    1.1   mycroft  * are met:
     38    1.1   mycroft  * 1. Redistributions of source code must retain the above copyright
     39    1.1   mycroft  *    notice, this list of conditions and the following disclaimer.
     40    1.1   mycroft  * 2. Redistributions in binary form must reproduce the above copyright
     41    1.1   mycroft  *    notice, this list of conditions and the following disclaimer in the
     42    1.1   mycroft  *    documentation and/or other materials provided with the distribution.
     43   1.71       agc  * 3. Neither the name of the University nor the names of its contributors
     44    1.1   mycroft  *    may be used to endorse or promote products derived from this software
     45    1.1   mycroft  *    without specific prior written permission.
     46    1.1   mycroft  *
     47    1.1   mycroft  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     48    1.1   mycroft  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     49    1.1   mycroft  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     50    1.1   mycroft  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     51    1.1   mycroft  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     52    1.1   mycroft  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     53    1.1   mycroft  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     54    1.1   mycroft  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     55    1.1   mycroft  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     56    1.1   mycroft  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     57    1.1   mycroft  * SUCH DAMAGE.
     58    1.1   mycroft  *
     59    1.2       cgd  *	@(#)lfs_alloc.c	8.4 (Berkeley) 1/4/94
     60    1.1   mycroft  */
     61   1.52     lukem 
     62   1.52     lukem #include <sys/cdefs.h>
     63  1.111     rmind __KERNEL_RCSID(0, "$NetBSD: lfs_alloc.c,v 1.111 2011/06/12 03:36:01 rmind Exp $");
     64   1.12    scottr 
     65   1.47       mrg #if defined(_KERNEL_OPT)
     66   1.12    scottr #include "opt_quota.h"
     67   1.13    scottr #endif
     68    1.1   mycroft 
     69    1.1   mycroft #include <sys/param.h>
     70    1.3  christos #include <sys/systm.h>
     71    1.1   mycroft #include <sys/kernel.h>
     72    1.1   mycroft #include <sys/buf.h>
     73   1.56  perseant #include <sys/lock.h>
     74    1.1   mycroft #include <sys/vnode.h>
     75    1.1   mycroft #include <sys/syslog.h>
     76    1.1   mycroft #include <sys/mount.h>
     77   1.87  perseant #include <sys/malloc.h>
     78   1.15   thorpej #include <sys/pool.h>
     79   1.50       chs #include <sys/proc.h>
     80   1.81  perseant #include <sys/tree.h>
     81   1.94      elad #include <sys/kauth.h>
     82    1.1   mycroft 
     83    1.1   mycroft #include <ufs/ufs/quota.h>
     84    1.1   mycroft #include <ufs/ufs/inode.h>
     85    1.1   mycroft #include <ufs/ufs/ufsmount.h>
     86    1.3  christos #include <ufs/ufs/ufs_extern.h>
     87    1.1   mycroft 
     88    1.1   mycroft #include <ufs/lfs/lfs.h>
     89    1.1   mycroft #include <ufs/lfs/lfs_extern.h>
     90    1.1   mycroft 
     91   1.87  perseant /* Constants for inode free bitmap */
     92   1.88  perseant #define BMSHIFT 5	/* 2 ** 5 = 32 */
     93   1.88  perseant #define BMMASK  ((1 << BMSHIFT) - 1)
     94   1.88  perseant #define SET_BITMAP_FREE(F, I) do { \
     95   1.88  perseant 	DLOG((DLOG_ALLOC, "lfs: ino %d wrd %d bit %d set\n", (int)(I), 	\
     96   1.88  perseant 	     (int)((I) >> BMSHIFT), (int)((I) & BMMASK)));		\
     97   1.88  perseant 	(F)->lfs_ino_bitmap[(I) >> BMSHIFT] |= (1 << ((I) & BMMASK));	\
     98   1.88  perseant } while (0)
     99   1.88  perseant #define CLR_BITMAP_FREE(F, I) do { \
    100   1.88  perseant 	DLOG((DLOG_ALLOC, "lfs: ino %d wrd %d bit %d clr\n", (int)(I), 	\
    101   1.88  perseant 	     (int)((I) >> BMSHIFT), (int)((I) & BMMASK)));		\
    102   1.88  perseant 	(F)->lfs_ino_bitmap[(I) >> BMSHIFT] &= ~(1 << ((I) & BMMASK));	\
    103   1.88  perseant } while(0)
    104   1.88  perseant 
    105   1.87  perseant #define ISSET_BITMAP_FREE(F, I) \
    106   1.88  perseant 	((F)->lfs_ino_bitmap[(I) >> BMSHIFT] & (1 << ((I) & BMMASK)))
    107   1.87  perseant 
    108   1.44  perseant /*
    109   1.65  perseant  * Add a new block to the Ifile, to accommodate future file creations.
    110   1.65  perseant  * Called with the segment lock held.
    111   1.56  perseant  */
    112   1.96  perseant int
    113   1.96  perseant lfs_extend_ifile(struct lfs *fs, kauth_cred_t cred)
    114   1.44  perseant {
    115   1.44  perseant 	struct vnode *vp;
    116   1.44  perseant 	struct inode *ip;
    117   1.44  perseant 	IFILE *ifp;
    118   1.48  perseant 	IFILE_V1 *ifp_v1;
    119   1.48  perseant 	struct buf *bp, *cbp;
    120   1.44  perseant 	int error;
    121   1.83  christos 	daddr_t i, blkno, xmax;
    122   1.87  perseant 	ino_t oldlast, maxino;
    123   1.48  perseant 	CLEANERINFO *cip;
    124   1.44  perseant 
    125   1.78  perseant 	ASSERT_SEGLOCK(fs);
    126   1.78  perseant 
    127   1.44  perseant 	vp = fs->lfs_ivnode;
    128   1.44  perseant 	ip = VTOI(vp);
    129   1.66      fvdl 	blkno = lblkno(fs, ip->i_size);
    130   1.85      yamt 	if ((error = lfs_balloc(vp, ip->i_size, fs->lfs_bsize, cred, 0,
    131   1.44  perseant 				&bp)) != 0) {
    132   1.44  perseant 		return (error);
    133   1.44  perseant 	}
    134   1.66      fvdl 	ip->i_size += fs->lfs_bsize;
    135   1.66      fvdl 	ip->i_ffs1_size = ip->i_size;
    136   1.66      fvdl 	uvm_vnp_setsize(vp, ip->i_size);
    137   1.75     perry 
    138   1.88  perseant 	maxino = ((ip->i_size >> fs->lfs_bshift) - fs->lfs_cleansz -
    139   1.88  perseant 		  fs->lfs_segtabsz) * fs->lfs_ifpb;
    140   1.88  perseant 	fs->lfs_ino_bitmap = (lfs_bm_t *)
    141   1.88  perseant 		realloc(fs->lfs_ino_bitmap, ((maxino + BMMASK) >> BMSHIFT) *
    142   1.88  perseant 			sizeof(lfs_bm_t), M_SEGMENT, M_WAITOK);
    143   1.88  perseant 	KASSERT(fs->lfs_ino_bitmap != NULL);
    144   1.87  perseant 
    145   1.44  perseant 	i = (blkno - fs->lfs_segtabsz - fs->lfs_cleansz) *
    146   1.44  perseant 		fs->lfs_ifpb;
    147   1.87  perseant 
    148   1.87  perseant 	/*
    149   1.87  perseant 	 * We insert the new inodes at the head of the free list.
    150   1.87  perseant 	 * Under normal circumstances, the free list is empty here,
    151   1.87  perseant 	 * so we are also incidentally placing them at the end (which
    152   1.87  perseant 	 * we must do if we are to keep them in order).
    153   1.87  perseant 	 */
    154   1.48  perseant 	LFS_GET_HEADFREE(fs, cip, cbp, &oldlast);
    155   1.48  perseant 	LFS_PUT_HEADFREE(fs, cip, cbp, i);
    156   1.44  perseant #ifdef DIAGNOSTIC
    157   1.63  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM)
    158   1.44  perseant 		panic("inode 0 allocated [2]");
    159   1.44  perseant #endif /* DIAGNOSTIC */
    160   1.83  christos 	xmax = i + fs->lfs_ifpb;
    161   1.48  perseant 
    162   1.53       chs 	if (fs->lfs_version == 1) {
    163   1.83  christos 		for (ifp_v1 = (IFILE_V1 *)bp->b_data; i < xmax; ++ifp_v1) {
    164   1.89  perseant 			SET_BITMAP_FREE(fs, i);
    165   1.48  perseant 			ifp_v1->if_version = 1;
    166   1.48  perseant 			ifp_v1->if_daddr = LFS_UNUSED_DADDR;
    167   1.48  perseant 			ifp_v1->if_nextfree = ++i;
    168   1.48  perseant 		}
    169   1.48  perseant 		ifp_v1--;
    170   1.48  perseant 		ifp_v1->if_nextfree = oldlast;
    171   1.48  perseant 	} else {
    172   1.83  christos 		for (ifp = (IFILE *)bp->b_data; i < xmax; ++ifp) {
    173   1.89  perseant 			SET_BITMAP_FREE(fs, i);
    174   1.48  perseant 			ifp->if_version = 1;
    175   1.48  perseant 			ifp->if_daddr = LFS_UNUSED_DADDR;
    176   1.48  perseant 			ifp->if_nextfree = ++i;
    177   1.48  perseant 		}
    178   1.48  perseant 		ifp--;
    179   1.48  perseant 		ifp->if_nextfree = oldlast;
    180   1.44  perseant 	}
    181   1.83  christos 	LFS_PUT_TAILFREE(fs, cip, cbp, xmax - 1);
    182   1.48  perseant 
    183   1.56  perseant 	(void) LFS_BWRITE_LOG(bp); /* Ifile */
    184   1.44  perseant 
    185   1.44  perseant 	return 0;
    186   1.44  perseant }
    187   1.44  perseant 
    188    1.1   mycroft /* Allocate a new inode. */
    189    1.1   mycroft /* ARGSUSED */
    190   1.43  perseant /* VOP_BWRITE 2i times */
    191    1.1   mycroft int
    192   1.99  christos lfs_valloc(struct vnode *pvp, int mode, kauth_cred_t cred,
    193   1.98  christos     struct vnode **vpp)
    194    1.3  christos {
    195    1.1   mycroft 	struct lfs *fs;
    196   1.48  perseant 	struct buf *bp, *cbp;
    197    1.1   mycroft 	struct ifile *ifp;
    198    1.1   mycroft 	ino_t new_ino;
    199    1.1   mycroft 	int error;
    200   1.36  perseant 	int new_gen;
    201   1.48  perseant 	CLEANERINFO *cip;
    202    1.1   mycroft 
    203   1.85      yamt 	fs = VTOI(pvp)->i_lfs;
    204   1.38  perseant 	if (fs->lfs_ronly)
    205   1.38  perseant 		return EROFS;
    206   1.75     perry 
    207   1.78  perseant 	ASSERT_NO_SEGLOCK(fs);
    208   1.78  perseant 
    209   1.56  perseant 	lfs_seglock(fs, SEGM_PROT);
    210   1.78  perseant 	vn_lock(fs->lfs_ivnode, LK_EXCLUSIVE);
    211   1.17  perseant 
    212    1.1   mycroft 	/* Get the head of the freelist. */
    213   1.48  perseant 	LFS_GET_HEADFREE(fs, cip, cbp, &new_ino);
    214   1.87  perseant 	KASSERT(new_ino != LFS_UNUSED_INUM && new_ino != LFS_IFILE_INUM);
    215   1.48  perseant 
    216   1.87  perseant 	DLOG((DLOG_ALLOC, "lfs_valloc: allocate inode %lld\n",
    217   1.87  perseant 	     (long long)new_ino));
    218   1.75     perry 
    219    1.1   mycroft 	/*
    220    1.1   mycroft 	 * Remove the inode from the free list and write the new start
    221    1.1   mycroft 	 * of the free list into the superblock.
    222    1.1   mycroft 	 */
    223   1.87  perseant 	CLR_BITMAP_FREE(fs, new_ino);
    224    1.1   mycroft 	LFS_IENTRY(ifp, fs, new_ino, bp);
    225    1.1   mycroft 	if (ifp->if_daddr != LFS_UNUSED_DADDR)
    226   1.84  christos 		panic("lfs_valloc: inuse inode %llu on the free list",
    227   1.84  christos 		    (unsigned long long)new_ino);
    228   1.48  perseant 	LFS_PUT_HEADFREE(fs, cip, cbp, ifp->if_nextfree);
    229   1.87  perseant 	DLOG((DLOG_ALLOC, "lfs_valloc: headfree %lld -> %lld\n",
    230   1.87  perseant 	     (long long)new_ino, (long long)ifp->if_nextfree));
    231   1.48  perseant 
    232   1.37  perseant 	new_gen = ifp->if_version; /* version was updated by vfree */
    233  1.102        ad 	brelse(bp, 0);
    234   1.30  perseant 
    235    1.1   mycroft 	/* Extend IFILE so that the next lfs_valloc will succeed. */
    236   1.63  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM) {
    237   1.96  perseant 		if ((error = lfs_extend_ifile(fs, cred)) != 0) {
    238   1.48  perseant 			LFS_PUT_HEADFREE(fs, cip, cbp, new_ino);
    239  1.110   hannken 			VOP_UNLOCK(fs->lfs_ivnode);
    240   1.56  perseant 			lfs_segunlock(fs);
    241   1.44  perseant 			return error;
    242    1.1   mycroft 		}
    243    1.1   mycroft 	}
    244   1.17  perseant #ifdef DIAGNOSTIC
    245   1.63  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM)
    246   1.17  perseant 		panic("inode 0 allocated [3]");
    247   1.17  perseant #endif /* DIAGNOSTIC */
    248   1.48  perseant 
    249   1.78  perseant 	/* Set superblock modified bit and increment file count. */
    250  1.105        ad 	mutex_enter(&lfs_lock);
    251   1.78  perseant 	fs->lfs_fmod = 1;
    252  1.105        ad 	mutex_exit(&lfs_lock);
    253   1.78  perseant 	++fs->lfs_nfiles;
    254   1.78  perseant 
    255  1.110   hannken 	VOP_UNLOCK(fs->lfs_ivnode);
    256   1.56  perseant 	lfs_segunlock(fs);
    257   1.63  perseant 
    258   1.85      yamt 	return lfs_ialloc(fs, pvp, new_ino, new_gen, vpp);
    259   1.44  perseant }
    260   1.44  perseant 
    261   1.65  perseant /*
    262   1.65  perseant  * Finish allocating a new inode, given an inode and generation number.
    263   1.65  perseant  */
    264   1.96  perseant int
    265   1.44  perseant lfs_ialloc(struct lfs *fs, struct vnode *pvp, ino_t new_ino, int new_gen,
    266   1.44  perseant 	   struct vnode **vpp)
    267   1.44  perseant {
    268   1.44  perseant 	struct inode *ip;
    269   1.44  perseant 	struct vnode *vp;
    270   1.40      fvdl 
    271   1.78  perseant 	ASSERT_NO_SEGLOCK(fs);
    272   1.78  perseant 
    273   1.77  perseant 	vp = *vpp;
    274  1.100        ad 	mutex_enter(&ufs_hashlock);
    275   1.40      fvdl 	/* Create an inode to associate with the vnode. */
    276   1.44  perseant 	lfs_vcreate(pvp->v_mount, new_ino, vp);
    277   1.51       chs 
    278    1.1   mycroft 	ip = VTOI(vp);
    279  1.105        ad 	mutex_enter(&lfs_lock);
    280   1.73   mycroft 	LFS_SET_UINO(ip, IN_CHANGE);
    281  1.105        ad 	mutex_exit(&lfs_lock);
    282   1.66      fvdl 	/* on-disk structure has been zeroed out by lfs_vcreate */
    283   1.66      fvdl 	ip->i_din.ffs1_din->di_inumber = new_ino;
    284   1.51       chs 
    285   1.79  perseant 	/* Note no blocks yet */
    286   1.79  perseant 	ip->i_lfs_hiblk = -1;
    287   1.79  perseant 
    288    1.1   mycroft 	/* Set a new generation number for this inode. */
    289   1.66      fvdl 	if (new_gen) {
    290   1.66      fvdl 		ip->i_gen = new_gen;
    291   1.66      fvdl 		ip->i_ffs1_gen = new_gen;
    292   1.66      fvdl 	}
    293   1.51       chs 
    294    1.1   mycroft 	/* Insert into the inode hash table. */
    295    1.1   mycroft 	ufs_ihashins(ip);
    296  1.100        ad 	mutex_exit(&ufs_hashlock);
    297   1.44  perseant 
    298   1.77  perseant 	ufs_vinit(vp->v_mount, lfs_specop_p, lfs_fifoop_p, vpp);
    299   1.77  perseant 	vp = *vpp;
    300   1.44  perseant 	ip = VTOI(vp);
    301   1.57      yamt 
    302   1.57      yamt 	memset(ip->i_lfs_fragsize, 0, NDADDR * sizeof(*ip->i_lfs_fragsize));
    303   1.51       chs 
    304   1.51       chs 	uvm_vnp_setsize(vp, 0);
    305   1.72      yamt 	lfs_mark_vnode(vp);
    306   1.54       chs 	genfs_node_init(vp, &lfs_genfsops);
    307  1.109     pooka 	vref(ip->i_devvp);
    308    1.1   mycroft 	return (0);
    309    1.1   mycroft }
    310    1.1   mycroft 
    311    1.1   mycroft /* Create a new vnode/inode pair and initialize what fields we can. */
    312   1.40      fvdl void
    313   1.48  perseant lfs_vcreate(struct mount *mp, ino_t ino, struct vnode *vp)
    314    1.1   mycroft {
    315    1.1   mycroft 	struct inode *ip;
    316   1.66      fvdl 	struct ufs1_dinode *dp;
    317    1.1   mycroft 	struct ufsmount *ump;
    318   1.75     perry 
    319    1.1   mycroft 	/* Get a pointer to the private mount structure. */
    320    1.1   mycroft 	ump = VFSTOUFS(mp);
    321   1.75     perry 
    322   1.78  perseant 	ASSERT_NO_SEGLOCK(ump->um_lfs);
    323   1.78  perseant 
    324    1.1   mycroft 	/* Initialize the inode. */
    325   1.15   thorpej 	ip = pool_get(&lfs_inode_pool, PR_WAITOK);
    326   1.66      fvdl 	memset(ip, 0, sizeof(*ip));
    327   1.66      fvdl 	dp = pool_get(&lfs_dinode_pool, PR_WAITOK);
    328   1.66      fvdl 	memset(dp, 0, sizeof(*dp));
    329   1.63  perseant 	ip->inode_ext.lfs = pool_get(&lfs_inoext_pool, PR_WAITOK);
    330   1.74  perseant 	memset(ip->inode_ext.lfs, 0, sizeof(*ip->inode_ext.lfs));
    331   1.40      fvdl 	vp->v_data = ip;
    332   1.66      fvdl 	ip->i_din.ffs1_din = dp;
    333   1.66      fvdl 	ip->i_ump = ump;
    334   1.40      fvdl 	ip->i_vnode = vp;
    335    1.1   mycroft 	ip->i_devvp = ump->um_devvp;
    336    1.1   mycroft 	ip->i_dev = ump->um_dev;
    337   1.66      fvdl 	ip->i_number = dp->di_inumber = ino;
    338    1.1   mycroft 	ip->i_lfs = ump->um_lfs;
    339   1.66      fvdl 	ip->i_lfs_effnblks = 0;
    340   1.81  perseant 	SPLAY_INIT(&ip->i_lfs_lbtree);
    341   1.82  perseant 	ip->i_lfs_nbtree = 0;
    342   1.91  perseant 	LIST_INIT(&ip->i_lfs_segdhd);
    343    1.1   mycroft #ifdef QUOTA
    344  1.101   hannken 	ufsquota_init(ip);
    345    1.1   mycroft #endif
    346    1.1   mycroft }
    347    1.1   mycroft 
    348   1.87  perseant #if 0
    349   1.87  perseant /*
    350   1.87  perseant  * Find the highest-numbered allocated inode.
    351   1.87  perseant  * This will be used to shrink the Ifile.
    352   1.87  perseant  */
    353   1.87  perseant static inline ino_t
    354   1.87  perseant lfs_last_alloc_ino(struct lfs *fs)
    355   1.87  perseant {
    356   1.87  perseant 	ino_t ino, maxino;
    357   1.87  perseant 
    358   1.87  perseant 	maxino = ((fs->lfs_ivnode->v_size >> fs->lfs_bshift) -
    359   1.87  perseant 		  fs->lfs_cleansz - fs->lfs_segtabsz) * fs->lfs_ifpb;
    360   1.87  perseant 	for (ino = maxino - 1; ino > LFS_UNUSED_INUM; --ino) {
    361   1.87  perseant 		if (ISSET_BITMAP_FREE(fs, ino) == 0)
    362   1.87  perseant 			break;
    363   1.87  perseant 	}
    364   1.87  perseant 	return ino;
    365   1.87  perseant }
    366   1.87  perseant #endif
    367   1.87  perseant 
    368   1.87  perseant /*
    369   1.87  perseant  * Find the previous (next lowest numbered) free inode, if any.
    370   1.87  perseant  * If there is none, return LFS_UNUSED_INUM.
    371   1.87  perseant  */
    372   1.87  perseant static inline ino_t
    373   1.87  perseant lfs_freelist_prev(struct lfs *fs, ino_t ino)
    374   1.87  perseant {
    375   1.88  perseant 	ino_t tino, bound, bb, freehdbb;
    376   1.88  perseant 
    377   1.88  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM)	 /* No free inodes at all */
    378   1.88  perseant 		return LFS_UNUSED_INUM;
    379   1.88  perseant 
    380   1.88  perseant 	/* Search our own word first */
    381   1.88  perseant 	bound = ino & ~BMMASK;
    382   1.89  perseant 	for (tino = ino - 1; tino >= bound && tino > LFS_UNUSED_INUM; tino--)
    383   1.88  perseant 		if (ISSET_BITMAP_FREE(fs, tino))
    384   1.88  perseant 			return tino;
    385   1.88  perseant 	/* If there are no lower words to search, just return */
    386   1.88  perseant 	if (ino >> BMSHIFT == 0)
    387   1.88  perseant 		return LFS_UNUSED_INUM;
    388   1.88  perseant 
    389   1.88  perseant 	/*
    390   1.88  perseant 	 * Find a word with a free inode in it.  We have to be a bit
    391   1.88  perseant 	 * careful here since ino_t is unsigned.
    392   1.88  perseant 	 */
    393   1.88  perseant 	freehdbb = (fs->lfs_freehd >> BMSHIFT);
    394   1.88  perseant 	for (bb = (ino >> BMSHIFT) - 1; bb >= freehdbb && bb > 0; --bb)
    395   1.88  perseant 		if (fs->lfs_ino_bitmap[bb])
    396   1.88  perseant 			break;
    397   1.88  perseant 	if (fs->lfs_ino_bitmap[bb] == 0)
    398   1.88  perseant 		return LFS_UNUSED_INUM;
    399   1.88  perseant 
    400   1.88  perseant 	/* Search the word we found */
    401   1.89  perseant 	for (tino = (bb << BMSHIFT) | BMMASK; tino >= (bb << BMSHIFT) &&
    402   1.89  perseant 	     tino > LFS_UNUSED_INUM; tino--)
    403   1.88  perseant 		if (ISSET_BITMAP_FREE(fs, tino))
    404   1.88  perseant 			break;
    405   1.87  perseant 
    406   1.87  perseant 	if (tino <= LFS_IFILE_INUM)
    407   1.87  perseant 		tino = LFS_UNUSED_INUM;
    408   1.87  perseant 
    409   1.87  perseant 	return tino;
    410   1.87  perseant }
    411   1.87  perseant 
    412    1.1   mycroft /* Free an inode. */
    413    1.1   mycroft /* ARGUSED */
    414   1.43  perseant /* VOP_BWRITE 2i times */
    415    1.1   mycroft int
    416   1.99  christos lfs_vfree(struct vnode *vp, ino_t ino, int mode)
    417    1.3  christos {
    418    1.1   mycroft 	SEGUSE *sup;
    419   1.48  perseant 	CLEANERINFO *cip;
    420   1.48  perseant 	struct buf *cbp, *bp;
    421    1.1   mycroft 	struct ifile *ifp;
    422    1.1   mycroft 	struct inode *ip;
    423    1.1   mycroft 	struct lfs *fs;
    424   1.59      fvdl 	daddr_t old_iaddr;
    425   1.85      yamt 	ino_t otail;
    426   1.75     perry 
    427    1.1   mycroft 	/* Get the inode number and file system. */
    428   1.30  perseant 	ip = VTOI(vp);
    429    1.1   mycroft 	fs = ip->i_lfs;
    430    1.1   mycroft 	ino = ip->i_number;
    431   1.34  perseant 
    432   1.78  perseant 	ASSERT_NO_SEGLOCK(fs);
    433   1.88  perseant 	DLOG((DLOG_ALLOC, "lfs_vfree: free ino %lld\n", (long long)ino));
    434   1.78  perseant 
    435   1.48  perseant 	/* Drain of pending writes */
    436  1.111     rmind 	mutex_enter(vp->v_interlock);
    437  1.105        ad 	while (fs->lfs_version > 1 && WRITEINPROG(vp)) {
    438  1.111     rmind 		cv_wait(&vp->v_cv, vp->v_interlock);
    439  1.105        ad 	}
    440  1.111     rmind 	mutex_exit(vp->v_interlock);
    441   1.48  perseant 
    442   1.63  perseant 	lfs_seglock(fs, SEGM_PROT);
    443   1.78  perseant 	vn_lock(fs->lfs_ivnode, LK_EXCLUSIVE);
    444   1.75     perry 
    445   1.72      yamt 	lfs_unmark_vnode(vp);
    446  1.105        ad 	mutex_enter(&lfs_lock);
    447  1.103        ad 	if (vp->v_uflag & VU_DIROP) {
    448  1.103        ad 		vp->v_uflag &= ~VU_DIROP;
    449   1.30  perseant 		--lfs_dirvcount;
    450   1.92  perseant 		--fs->lfs_dirvcount;
    451   1.63  perseant 		TAILQ_REMOVE(&fs->lfs_dchainhd, ip, i_lfs_dchain);
    452   1.92  perseant 		wakeup(&fs->lfs_dirvcount);
    453   1.30  perseant 		wakeup(&lfs_dirvcount);
    454  1.105        ad 		mutex_exit(&lfs_lock);
    455   1.30  perseant 		lfs_vunref(vp);
    456   1.90  perseant 
    457   1.90  perseant 		/*
    458   1.90  perseant 		 * If this inode is not going to be written any more, any
    459   1.90  perseant 		 * segment accounting left over from its truncation needs
    460   1.90  perseant 		 * to occur at the end of the next dirops flush.  Attach
    461   1.90  perseant 		 * them to the fs-wide list for that purpose.
    462   1.90  perseant 		 */
    463   1.90  perseant 		if (LIST_FIRST(&ip->i_lfs_segdhd) != NULL) {
    464   1.90  perseant 			struct segdelta *sd;
    465   1.90  perseant 
    466   1.90  perseant 			while((sd = LIST_FIRST(&ip->i_lfs_segdhd)) != NULL) {
    467   1.90  perseant 				LIST_REMOVE(sd, list);
    468   1.90  perseant 				LIST_INSERT_HEAD(&fs->lfs_segdhd, sd, list);
    469   1.90  perseant 			}
    470   1.90  perseant 		}
    471   1.90  perseant 	} else {
    472   1.90  perseant 		/*
    473   1.90  perseant 		 * If it's not a dirop, we can finalize right away.
    474   1.90  perseant 		 */
    475  1.105        ad 		mutex_exit(&lfs_lock);
    476   1.90  perseant 		lfs_finalize_ino_seguse(fs, ip);
    477   1.38  perseant 	}
    478   1.30  perseant 
    479  1.105        ad 	mutex_enter(&lfs_lock);
    480   1.42  perseant 	LFS_CLR_UINO(ip, IN_ACCESSED|IN_CLEANING|IN_MODIFIED);
    481  1.105        ad 	mutex_exit(&lfs_lock);
    482   1.33  perseant 	ip->i_flag &= ~IN_ALLMOD;
    483   1.93  perseant 	ip->i_lfs_iflags |= LFSI_DELETED;
    484   1.93  perseant 
    485    1.1   mycroft 	/*
    486    1.1   mycroft 	 * Set the ifile's inode entry to unused, increment its version number
    487   1.48  perseant 	 * and link it onto the free chain.
    488    1.1   mycroft 	 */
    489   1.87  perseant 	SET_BITMAP_FREE(fs, ino);
    490    1.1   mycroft 	LFS_IENTRY(ifp, fs, ino, bp);
    491    1.1   mycroft 	old_iaddr = ifp->if_daddr;
    492    1.1   mycroft 	ifp->if_daddr = LFS_UNUSED_DADDR;
    493    1.1   mycroft 	++ifp->if_version;
    494   1.48  perseant 	if (fs->lfs_version == 1) {
    495   1.48  perseant 		LFS_GET_HEADFREE(fs, cip, cbp, &(ifp->if_nextfree));
    496   1.48  perseant 		LFS_PUT_HEADFREE(fs, cip, cbp, ino);
    497   1.56  perseant 		(void) LFS_BWRITE_LOG(bp); /* Ifile */
    498   1.48  perseant 	} else {
    499   1.87  perseant 		ino_t tino, onf;
    500   1.87  perseant 
    501   1.48  perseant 		ifp->if_nextfree = LFS_UNUSED_INUM;
    502   1.56  perseant 		(void) LFS_BWRITE_LOG(bp); /* Ifile */
    503   1.87  perseant 
    504   1.87  perseant 		tino = lfs_freelist_prev(fs, ino);
    505   1.87  perseant 		if (tino == LFS_UNUSED_INUM) {
    506   1.87  perseant 			/* Nothing free below us, put us on the head */
    507   1.87  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    508   1.87  perseant 			LFS_GET_HEADFREE(fs, cip, cbp, &(ifp->if_nextfree));
    509   1.87  perseant 			LFS_PUT_HEADFREE(fs, cip, cbp, ino);
    510   1.88  perseant 			DLOG((DLOG_ALLOC, "lfs_vfree: headfree %lld -> %lld\n",
    511   1.87  perseant 			     (long long)ifp->if_nextfree, (long long)ino));
    512   1.87  perseant 			LFS_BWRITE_LOG(bp); /* Ifile */
    513   1.87  perseant 
    514   1.87  perseant 			/* If the list was empty, set tail too */
    515   1.87  perseant 			LFS_GET_TAILFREE(fs, cip, cbp, &otail);
    516   1.87  perseant 			if (otail == LFS_UNUSED_INUM) {
    517   1.87  perseant 				LFS_PUT_TAILFREE(fs, cip, cbp, ino);
    518   1.87  perseant 				DLOG((DLOG_ALLOC, "lfs_vfree: tailfree %lld "
    519   1.87  perseant 				      "-> %lld\n", (long long)otail,
    520   1.87  perseant 				      (long long)ino));
    521   1.87  perseant 			}
    522   1.87  perseant 		} else {
    523   1.87  perseant 			/*
    524   1.87  perseant 			 * Insert this inode into the list after tino.
    525   1.87  perseant 			 * We hold the segment lock so we don't have to
    526   1.87  perseant 			 * worry about blocks being written out of order.
    527   1.87  perseant 			 */
    528   1.87  perseant 			DLOG((DLOG_ALLOC, "lfs_vfree: insert ino %lld "
    529   1.87  perseant 			      " after %lld\n", ino, tino));
    530   1.87  perseant 
    531   1.87  perseant 			LFS_IENTRY(ifp, fs, tino, bp);
    532   1.87  perseant 			onf = ifp->if_nextfree;
    533   1.87  perseant 			ifp->if_nextfree = ino;
    534   1.87  perseant 			LFS_BWRITE_LOG(bp);	/* Ifile */
    535   1.87  perseant 
    536   1.87  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    537   1.87  perseant 			ifp->if_nextfree = onf;
    538   1.87  perseant 			LFS_BWRITE_LOG(bp);	/* Ifile */
    539   1.87  perseant 
    540   1.87  perseant 			/* If we're last, put us on the tail */
    541   1.87  perseant 			if (onf == LFS_UNUSED_INUM) {
    542   1.87  perseant 				LFS_GET_TAILFREE(fs, cip, cbp, &otail);
    543   1.87  perseant 				LFS_PUT_TAILFREE(fs, cip, cbp, ino);
    544   1.87  perseant 				DLOG((DLOG_ALLOC, "lfs_vfree: tailfree %lld "
    545   1.87  perseant 				      "-> %lld\n", (long long)otail,
    546   1.87  perseant 				      (long long)ino));
    547   1.87  perseant 			}
    548   1.87  perseant 		}
    549   1.48  perseant 	}
    550   1.17  perseant #ifdef DIAGNOSTIC
    551   1.53       chs 	if (ino == LFS_UNUSED_INUM) {
    552   1.17  perseant 		panic("inode 0 freed");
    553   1.17  perseant 	}
    554   1.17  perseant #endif /* DIAGNOSTIC */
    555    1.1   mycroft 	if (old_iaddr != LFS_UNUSED_DADDR) {
    556   1.48  perseant 		LFS_SEGENTRY(sup, fs, dtosn(fs, old_iaddr), bp);
    557   1.22  perseant #ifdef DIAGNOSTIC
    558   1.66      fvdl 		if (sup->su_nbytes < sizeof (struct ufs1_dinode)) {
    559   1.43  perseant 			printf("lfs_vfree: negative byte count"
    560   1.62      yamt 			       " (segment %" PRIu32 " short by %d)\n",
    561   1.48  perseant 			       dtosn(fs, old_iaddr),
    562   1.66      fvdl 			       (int)sizeof (struct ufs1_dinode) -
    563   1.66      fvdl 				    sup->su_nbytes);
    564   1.22  perseant 			panic("lfs_vfree: negative byte count");
    565   1.66      fvdl 			sup->su_nbytes = sizeof (struct ufs1_dinode);
    566   1.17  perseant 		}
    567   1.22  perseant #endif
    568   1.66      fvdl 		sup->su_nbytes -= sizeof (struct ufs1_dinode);
    569   1.63  perseant 		LFS_WRITESEGENTRY(sup, fs, dtosn(fs, old_iaddr), bp); /* Ifile */
    570    1.1   mycroft 	}
    571   1.75     perry 
    572    1.1   mycroft 	/* Set superblock modified bit and decrement file count. */
    573  1.105        ad 	mutex_enter(&lfs_lock);
    574    1.1   mycroft 	fs->lfs_fmod = 1;
    575  1.105        ad 	mutex_exit(&lfs_lock);
    576    1.1   mycroft 	--fs->lfs_nfiles;
    577   1.75     perry 
    578  1.110   hannken 	VOP_UNLOCK(fs->lfs_ivnode);
    579   1.56  perseant 	lfs_segunlock(fs);
    580   1.63  perseant 
    581    1.1   mycroft 	return (0);
    582    1.1   mycroft }
    583   1.87  perseant 
    584   1.87  perseant /*
    585   1.87  perseant  * Sort the freelist and set up the free-inode bitmap.
    586   1.87  perseant  * To be called by lfs_mountfs().
    587   1.87  perseant  */
    588   1.87  perseant void
    589   1.87  perseant lfs_order_freelist(struct lfs *fs)
    590   1.87  perseant {
    591   1.87  perseant 	CLEANERINFO *cip;
    592   1.87  perseant 	IFILE *ifp = NULL;
    593   1.87  perseant 	struct buf *bp;
    594   1.87  perseant 	ino_t ino, firstino, lastino, maxino;
    595   1.97  perseant #ifdef notyet
    596   1.97  perseant 	struct vnode *vp;
    597   1.97  perseant #endif
    598   1.87  perseant 
    599   1.95  perseant 	ASSERT_NO_SEGLOCK(fs);
    600   1.95  perseant 	lfs_seglock(fs, SEGM_PROT);
    601   1.95  perseant 
    602   1.87  perseant 	maxino = ((fs->lfs_ivnode->v_size >> fs->lfs_bshift) -
    603   1.87  perseant 		  fs->lfs_cleansz - fs->lfs_segtabsz) * fs->lfs_ifpb;
    604   1.88  perseant 	fs->lfs_ino_bitmap = (lfs_bm_t *)
    605   1.88  perseant 		malloc(((maxino + BMMASK) >> BMSHIFT) * sizeof(lfs_bm_t),
    606   1.88  perseant 		       M_SEGMENT, M_WAITOK | M_ZERO);
    607   1.88  perseant 	KASSERT(fs->lfs_ino_bitmap != NULL);
    608   1.87  perseant 
    609   1.87  perseant 	firstino = lastino = LFS_UNUSED_INUM;
    610   1.87  perseant 	for (ino = 0; ino < maxino; ino++) {
    611   1.87  perseant 		if (ino % fs->lfs_ifpb == 0)
    612   1.87  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    613   1.87  perseant 		else
    614   1.87  perseant 			++ifp;
    615   1.87  perseant 
    616   1.87  perseant 		/* Don't put zero or ifile on the free list */
    617   1.87  perseant 		if (ino == LFS_UNUSED_INUM || ino == LFS_IFILE_INUM)
    618   1.87  perseant 			continue;
    619   1.87  perseant 
    620   1.97  perseant #ifdef notyet
    621   1.97  perseant 		/* Address orphaned files */
    622   1.97  perseant 		if (ifp->if_nextfree == LFS_ORPHAN_NEXTFREE &&
    623   1.97  perseant 		    VFS_VGET(fs->lfs_ivnode->v_mount, ino, &vp) == 0) {
    624  1.104        he 			lfs_truncate(vp, 0, 0, NOCRED);
    625   1.97  perseant 			vput(vp);
    626   1.97  perseant 			LFS_SEGENTRY(sup, fs, dtosn(fs, ifp->if_daddr), bp);
    627   1.97  perseant 			KASSERT(sup->su_nbytes >= DINODE1_SIZE);
    628   1.97  perseant 			sup->su_nbytes -= DINODE1_SIZE;
    629   1.97  perseant 			LFS_WRITESEGENTRY(sup, fs, dtosn(fs, ifp->if_daddr), bp);
    630   1.97  perseant 
    631   1.97  perseant 			/* Set up to fall through to next section */
    632   1.97  perseant 			ifp->if_daddr = LFS_UNUSED_DADDR;
    633   1.97  perseant 			LFS_BWRITE_LOG(bp);
    634   1.97  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    635   1.97  perseant 		}
    636   1.97  perseant #endif
    637   1.97  perseant 
    638   1.87  perseant 		if (ifp->if_daddr == LFS_UNUSED_DADDR) {
    639   1.87  perseant 			if (firstino == LFS_UNUSED_INUM)
    640   1.87  perseant 				firstino = ino;
    641   1.87  perseant 			else {
    642  1.102        ad 				brelse(bp, 0);
    643   1.87  perseant 
    644   1.87  perseant 				LFS_IENTRY(ifp, fs, lastino, bp);
    645   1.87  perseant 				ifp->if_nextfree = ino;
    646   1.87  perseant 				LFS_BWRITE_LOG(bp);
    647   1.87  perseant 
    648   1.87  perseant 				LFS_IENTRY(ifp, fs, ino, bp);
    649   1.87  perseant 			}
    650   1.87  perseant 			lastino = ino;
    651   1.87  perseant 
    652   1.87  perseant 			SET_BITMAP_FREE(fs, ino);
    653   1.87  perseant 		}
    654   1.87  perseant 
    655   1.87  perseant 		if ((ino + 1) % fs->lfs_ifpb == 0)
    656  1.102        ad 			brelse(bp, 0);
    657   1.87  perseant 	}
    658   1.87  perseant 
    659   1.87  perseant 	LFS_PUT_HEADFREE(fs, cip, bp, firstino);
    660   1.87  perseant 	LFS_PUT_TAILFREE(fs, cip, bp, lastino);
    661   1.95  perseant 
    662   1.95  perseant 	lfs_segunlock(fs);
    663   1.87  perseant }
    664   1.97  perseant 
    665   1.97  perseant void
    666   1.97  perseant lfs_orphan(struct lfs *fs, ino_t ino)
    667   1.97  perseant {
    668   1.97  perseant 	IFILE *ifp;
    669   1.97  perseant 	struct buf *bp;
    670   1.97  perseant 
    671   1.97  perseant 	LFS_IENTRY(ifp, fs, ino, bp);
    672   1.97  perseant 	ifp->if_nextfree = LFS_ORPHAN_NEXTFREE;
    673   1.97  perseant 	LFS_BWRITE_LOG(bp);
    674   1.97  perseant }
    675