Home | History | Annotate | Line # | Download | only in lfs
lfs_alloc.c revision 1.107
      1  1.107    martin /*	$NetBSD: lfs_alloc.c,v 1.107 2008/04/28 20:24:11 martin Exp $	*/
      2    1.2       cgd 
      3   1.17  perseant /*-
      4  1.100        ad  * Copyright (c) 1999, 2000, 2001, 2002, 2003, 2007 The NetBSD Foundation, Inc.
      5   1.17  perseant  * All rights reserved.
      6   1.17  perseant  *
      7   1.17  perseant  * This code is derived from software contributed to The NetBSD Foundation
      8   1.17  perseant  * by Konrad E. Schroder <perseant (at) hhhh.org>.
      9   1.17  perseant  *
     10   1.17  perseant  * Redistribution and use in source and binary forms, with or without
     11   1.17  perseant  * modification, are permitted provided that the following conditions
     12   1.17  perseant  * are met:
     13   1.17  perseant  * 1. Redistributions of source code must retain the above copyright
     14   1.17  perseant  *    notice, this list of conditions and the following disclaimer.
     15   1.17  perseant  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.17  perseant  *    notice, this list of conditions and the following disclaimer in the
     17   1.17  perseant  *    documentation and/or other materials provided with the distribution.
     18   1.17  perseant  *
     19   1.17  perseant  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.17  perseant  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.17  perseant  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.17  perseant  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.17  perseant  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.17  perseant  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.17  perseant  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.17  perseant  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.17  perseant  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.17  perseant  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.17  perseant  * POSSIBILITY OF SUCH DAMAGE.
     30   1.17  perseant  */
     31    1.1   mycroft /*
     32    1.1   mycroft  * Copyright (c) 1991, 1993
     33    1.1   mycroft  *	The Regents of the University of California.  All rights reserved.
     34    1.1   mycroft  *
     35    1.1   mycroft  * Redistribution and use in source and binary forms, with or without
     36    1.1   mycroft  * modification, are permitted provided that the following conditions
     37    1.1   mycroft  * are met:
     38    1.1   mycroft  * 1. Redistributions of source code must retain the above copyright
     39    1.1   mycroft  *    notice, this list of conditions and the following disclaimer.
     40    1.1   mycroft  * 2. Redistributions in binary form must reproduce the above copyright
     41    1.1   mycroft  *    notice, this list of conditions and the following disclaimer in the
     42    1.1   mycroft  *    documentation and/or other materials provided with the distribution.
     43   1.71       agc  * 3. Neither the name of the University nor the names of its contributors
     44    1.1   mycroft  *    may be used to endorse or promote products derived from this software
     45    1.1   mycroft  *    without specific prior written permission.
     46    1.1   mycroft  *
     47    1.1   mycroft  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     48    1.1   mycroft  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     49    1.1   mycroft  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     50    1.1   mycroft  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     51    1.1   mycroft  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     52    1.1   mycroft  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     53    1.1   mycroft  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     54    1.1   mycroft  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     55    1.1   mycroft  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     56    1.1   mycroft  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     57    1.1   mycroft  * SUCH DAMAGE.
     58    1.1   mycroft  *
     59    1.2       cgd  *	@(#)lfs_alloc.c	8.4 (Berkeley) 1/4/94
     60    1.1   mycroft  */
     61   1.52     lukem 
     62   1.52     lukem #include <sys/cdefs.h>
     63  1.107    martin __KERNEL_RCSID(0, "$NetBSD: lfs_alloc.c,v 1.107 2008/04/28 20:24:11 martin Exp $");
     64   1.12    scottr 
     65   1.47       mrg #if defined(_KERNEL_OPT)
     66   1.12    scottr #include "opt_quota.h"
     67   1.13    scottr #endif
     68    1.1   mycroft 
     69    1.1   mycroft #include <sys/param.h>
     70    1.3  christos #include <sys/systm.h>
     71    1.1   mycroft #include <sys/kernel.h>
     72    1.1   mycroft #include <sys/buf.h>
     73   1.56  perseant #include <sys/lock.h>
     74    1.1   mycroft #include <sys/vnode.h>
     75    1.1   mycroft #include <sys/syslog.h>
     76    1.1   mycroft #include <sys/mount.h>
     77   1.87  perseant #include <sys/malloc.h>
     78   1.15   thorpej #include <sys/pool.h>
     79   1.50       chs #include <sys/proc.h>
     80   1.81  perseant #include <sys/tree.h>
     81   1.94      elad #include <sys/kauth.h>
     82    1.1   mycroft 
     83    1.1   mycroft #include <ufs/ufs/quota.h>
     84    1.1   mycroft #include <ufs/ufs/inode.h>
     85    1.1   mycroft #include <ufs/ufs/ufsmount.h>
     86    1.3  christos #include <ufs/ufs/ufs_extern.h>
     87    1.1   mycroft 
     88    1.1   mycroft #include <ufs/lfs/lfs.h>
     89    1.1   mycroft #include <ufs/lfs/lfs_extern.h>
     90    1.1   mycroft 
     91  1.100        ad extern kmutex_t ufs_hashlock;
     92   1.17  perseant 
/*
 * Constants and helpers for the in-core free-inode bitmap.
 *
 * fs->lfs_ino_bitmap holds one bit per inode number: inode I lives in
 * word (I >> BMSHIFT), bit (I & BMMASK).  A set bit means the inode is
 * on the free list; a clear bit means it is allocated.
 *
 * The single-bit masks are built from an lfs_bm_t-typed 1 rather than a
 * plain int 1: shifting a signed 1 left by 31 to select the top bit of a
 * word is undefined behaviour in C.
 */
#define BMSHIFT 5	/* 2 ** 5 = 32 */
#define BMMASK  ((1 << BMSHIFT) - 1)

/* Mark inode I as free in F's bitmap. */
#define SET_BITMAP_FREE(F, I) do { \
	DLOG((DLOG_ALLOC, "lfs: ino %d wrd %d bit %d set\n", (int)(I), 	\
	     (int)((I) >> BMSHIFT), (int)((I) & BMMASK)));		\
	(F)->lfs_ino_bitmap[(I) >> BMSHIFT] |=				\
	    ((lfs_bm_t)1 << ((I) & BMMASK));				\
} while (0)

/* Mark inode I as allocated (not free) in F's bitmap. */
#define CLR_BITMAP_FREE(F, I) do { \
	DLOG((DLOG_ALLOC, "lfs: ino %d wrd %d bit %d clr\n", (int)(I), 	\
	     (int)((I) >> BMSHIFT), (int)((I) & BMMASK)));		\
	(F)->lfs_ino_bitmap[(I) >> BMSHIFT] &=				\
	    ~((lfs_bm_t)1 << ((I) & BMMASK));				\
} while (0)

/* Nonzero iff inode I is marked free in F's bitmap. */
#define ISSET_BITMAP_FREE(F, I) \
	((F)->lfs_ino_bitmap[(I) >> BMSHIFT] & ((lfs_bm_t)1 << ((I) & BMMASK)))
    109   1.87  perseant 
    110   1.44  perseant /*
    111   1.65  perseant  * Add a new block to the Ifile, to accommodate future file creations.
    112   1.65  perseant  * Called with the segment lock held.
 *
 * fs:   file system whose Ifile (fs->lfs_ivnode) is grown by one block.
 * cred: credentials handed to lfs_balloc() for the new block.
 *
 * The inode entries described by the new block are initialised as free,
 * chained together through if_nextfree, and placed at the head of the
 * free list; the in-core free bitmap is enlarged to cover them.
 *
 * Returns 0 on success, or the error reported by lfs_balloc().  The
 * result of writing the new Ifile block is deliberately discarded.
    113   1.56  perseant  */
    114   1.96  perseant int
    115   1.96  perseant lfs_extend_ifile(struct lfs *fs, kauth_cred_t cred)
    116   1.44  perseant {
    117   1.44  perseant 	struct vnode *vp;
    118   1.44  perseant 	struct inode *ip;
    119   1.44  perseant 	IFILE *ifp;
    120   1.48  perseant 	IFILE_V1 *ifp_v1;
    121   1.48  perseant 	struct buf *bp, *cbp;
    122   1.44  perseant 	int error;
    123   1.83  christos 	daddr_t i, blkno, xmax;
    124   1.87  perseant 	ino_t oldlast, maxino;
    125   1.48  perseant 	CLEANERINFO *cip;
    126   1.44  perseant 
    127   1.78  perseant 	ASSERT_SEGLOCK(fs);
    128   1.78  perseant 
    129   1.44  perseant 	vp = fs->lfs_ivnode;
    130   1.44  perseant 	ip = VTOI(vp);
	/* Block index of the current end of the Ifile, i.e. of the new block. */
    131   1.66      fvdl 	blkno = lblkno(fs, ip->i_size);
    132   1.85      yamt 	if ((error = lfs_balloc(vp, ip->i_size, fs->lfs_bsize, cred, 0,
    133   1.44  perseant 				&bp)) != 0) {
    134   1.44  perseant 		return (error);
    135   1.44  perseant 	}
	/* Account for the new block in both size fields and tell UVM. */
    136   1.66      fvdl 	ip->i_size += fs->lfs_bsize;
    137   1.66      fvdl 	ip->i_ffs1_size = ip->i_size;
    138   1.66      fvdl 	uvm_vnp_setsize(vp, ip->i_size);
    139   1.75     perry 
	/*
	 * Number of inodes the Ifile can now describe: its block count less
	 * the cleaner-info and segment-table blocks, times entries per block.
	 * Grow the bitmap to one bit per such inode.
	 * NOTE(review): no M_ZERO is passed, so added bitmap words are
	 * presumably uninitialised until bits are ORed in below -- confirm.
	 */
    140   1.88  perseant 	maxino = ((ip->i_size >> fs->lfs_bshift) - fs->lfs_cleansz -
    141   1.88  perseant 		  fs->lfs_segtabsz) * fs->lfs_ifpb;
    142   1.88  perseant 	fs->lfs_ino_bitmap = (lfs_bm_t *)
    143   1.88  perseant 		realloc(fs->lfs_ino_bitmap, ((maxino + BMMASK) >> BMSHIFT) *
    144   1.88  perseant 			sizeof(lfs_bm_t), M_SEGMENT, M_WAITOK);
    145   1.88  perseant 	KASSERT(fs->lfs_ino_bitmap != NULL);
    146   1.87  perseant 
	/* First inode number described by the new block. */
    147   1.44  perseant 	i = (blkno - fs->lfs_segtabsz - fs->lfs_cleansz) *
    148   1.44  perseant 		fs->lfs_ifpb;
    149   1.87  perseant 
    150   1.87  perseant 	/*
    151   1.87  perseant 	 * We insert the new inodes at the head of the free list.
    152   1.87  perseant 	 * Under normal circumstances, the free list is empty here,
    153   1.87  perseant 	 * so we are also incidentally placing them at the end (which
    154   1.87  perseant 	 * we must do if we are to keep them in order).
    155   1.87  perseant 	 */
	/* oldlast remembers the previous head; it becomes the chain's end. */
    156   1.48  perseant 	LFS_GET_HEADFREE(fs, cip, cbp, &oldlast);
    157   1.48  perseant 	LFS_PUT_HEADFREE(fs, cip, cbp, i);
    158   1.44  perseant #ifdef DIAGNOSTIC
    159   1.63  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM)
    160   1.44  perseant 		panic("inode 0 allocated [2]");
    161   1.44  perseant #endif /* DIAGNOSTIC */
	/* One past the last inode number described by the new block. */
    162   1.83  christos 	xmax = i + fs->lfs_ifpb;
    163   1.48  perseant 
	/*
	 * Initialise every entry in the new block as a free inode whose
	 * successor is the next inode number, then repoint the final entry
	 * at the old head.  The two branches differ only in the entry
	 * layout (IFILE_V1 versus IFILE).
	 */
    164   1.53       chs 	if (fs->lfs_version == 1) {
    165   1.83  christos 		for (ifp_v1 = (IFILE_V1 *)bp->b_data; i < xmax; ++ifp_v1) {
    166   1.89  perseant 			SET_BITMAP_FREE(fs, i);
    167   1.48  perseant 			ifp_v1->if_version = 1;
    168   1.48  perseant 			ifp_v1->if_daddr = LFS_UNUSED_DADDR;
    169   1.48  perseant 			ifp_v1->if_nextfree = ++i;
    170   1.48  perseant 		}
    171   1.48  perseant 		ifp_v1--;
    172   1.48  perseant 		ifp_v1->if_nextfree = oldlast;
    173   1.48  perseant 	} else {
    174   1.83  christos 		for (ifp = (IFILE *)bp->b_data; i < xmax; ++ifp) {
    175   1.89  perseant 			SET_BITMAP_FREE(fs, i);
    176   1.48  perseant 			ifp->if_version = 1;
    177   1.48  perseant 			ifp->if_daddr = LFS_UNUSED_DADDR;
    178   1.48  perseant 			ifp->if_nextfree = ++i;
    179   1.48  perseant 		}
    180   1.48  perseant 		ifp--;
    181   1.48  perseant 		ifp->if_nextfree = oldlast;
    182   1.44  perseant 	}
	/*
	 * NOTE(review): the tail is set to the last new inode unconditionally;
	 * that is only the real tail when the old list was empty (oldlast ==
	 * LFS_UNUSED_INUM) -- confirm callers guarantee this.
	 */
    183   1.83  christos 	LFS_PUT_TAILFREE(fs, cip, cbp, xmax - 1);
    184   1.48  perseant 
    185   1.56  perseant 	(void) LFS_BWRITE_LOG(bp); /* Ifile */
    186   1.44  perseant 
    187   1.44  perseant 	return 0;
    188   1.44  perseant }
    189   1.44  perseant 
    190    1.1   mycroft /* Allocate a new inode. */
    191    1.1   mycroft /* ARGSUSED */
    192   1.43  perseant /* VOP_BWRITE 2i times */
    193    1.1   mycroft int
    194   1.99  christos lfs_valloc(struct vnode *pvp, int mode, kauth_cred_t cred,
    195   1.98  christos     struct vnode **vpp)
    196    1.3  christos {
    197    1.1   mycroft 	struct lfs *fs;
    198   1.48  perseant 	struct buf *bp, *cbp;
    199    1.1   mycroft 	struct ifile *ifp;
    200    1.1   mycroft 	ino_t new_ino;
    201    1.1   mycroft 	int error;
    202   1.36  perseant 	int new_gen;
    203   1.48  perseant 	CLEANERINFO *cip;
    204    1.1   mycroft 
    205   1.85      yamt 	fs = VTOI(pvp)->i_lfs;
    206   1.38  perseant 	if (fs->lfs_ronly)
    207   1.38  perseant 		return EROFS;
    208   1.75     perry 
    209   1.78  perseant 	ASSERT_NO_SEGLOCK(fs);
    210   1.78  perseant 
    211   1.56  perseant 	lfs_seglock(fs, SEGM_PROT);
    212   1.78  perseant 	vn_lock(fs->lfs_ivnode, LK_EXCLUSIVE);
    213   1.17  perseant 
    214    1.1   mycroft 	/* Get the head of the freelist. */
    215   1.48  perseant 	LFS_GET_HEADFREE(fs, cip, cbp, &new_ino);
    216   1.87  perseant 	KASSERT(new_ino != LFS_UNUSED_INUM && new_ino != LFS_IFILE_INUM);
    217   1.48  perseant 
    218   1.87  perseant 	DLOG((DLOG_ALLOC, "lfs_valloc: allocate inode %lld\n",
    219   1.87  perseant 	     (long long)new_ino));
    220   1.75     perry 
    221    1.1   mycroft 	/*
    222    1.1   mycroft 	 * Remove the inode from the free list and write the new start
    223    1.1   mycroft 	 * of the free list into the superblock.
    224    1.1   mycroft 	 */
    225   1.87  perseant 	CLR_BITMAP_FREE(fs, new_ino);
    226    1.1   mycroft 	LFS_IENTRY(ifp, fs, new_ino, bp);
    227    1.1   mycroft 	if (ifp->if_daddr != LFS_UNUSED_DADDR)
    228   1.84  christos 		panic("lfs_valloc: inuse inode %llu on the free list",
    229   1.84  christos 		    (unsigned long long)new_ino);
    230   1.48  perseant 	LFS_PUT_HEADFREE(fs, cip, cbp, ifp->if_nextfree);
    231   1.87  perseant 	DLOG((DLOG_ALLOC, "lfs_valloc: headfree %lld -> %lld\n",
    232   1.87  perseant 	     (long long)new_ino, (long long)ifp->if_nextfree));
    233   1.48  perseant 
    234   1.37  perseant 	new_gen = ifp->if_version; /* version was updated by vfree */
    235  1.102        ad 	brelse(bp, 0);
    236   1.30  perseant 
    237    1.1   mycroft 	/* Extend IFILE so that the next lfs_valloc will succeed. */
    238   1.63  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM) {
    239   1.96  perseant 		if ((error = lfs_extend_ifile(fs, cred)) != 0) {
    240   1.48  perseant 			LFS_PUT_HEADFREE(fs, cip, cbp, new_ino);
    241   1.78  perseant 			VOP_UNLOCK(fs->lfs_ivnode, 0);
    242   1.56  perseant 			lfs_segunlock(fs);
    243   1.44  perseant 			return error;
    244    1.1   mycroft 		}
    245    1.1   mycroft 	}
    246   1.17  perseant #ifdef DIAGNOSTIC
    247   1.63  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM)
    248   1.17  perseant 		panic("inode 0 allocated [3]");
    249   1.17  perseant #endif /* DIAGNOSTIC */
    250   1.48  perseant 
    251   1.78  perseant 	/* Set superblock modified bit and increment file count. */
    252  1.105        ad 	mutex_enter(&lfs_lock);
    253   1.78  perseant 	fs->lfs_fmod = 1;
    254  1.105        ad 	mutex_exit(&lfs_lock);
    255   1.78  perseant 	++fs->lfs_nfiles;
    256   1.78  perseant 
    257   1.78  perseant 	VOP_UNLOCK(fs->lfs_ivnode, 0);
    258   1.56  perseant 	lfs_segunlock(fs);
    259   1.63  perseant 
    260   1.85      yamt 	return lfs_ialloc(fs, pvp, new_ino, new_gen, vpp);
    261   1.44  perseant }
    262   1.44  perseant 
    263   1.65  perseant /*
    264   1.65  perseant  * Finish allocating a new inode, given an inode and generation number.
 *
 * fs:      file system the inode belongs to (used here for the seglock
 *          assertion only).
 * pvp:     vnode whose v_mount identifies the mount for lfs_vcreate().
 * new_ino: inode number to give the new inode.
 * new_gen: generation number; if zero, the generation fields are left
 *          as lfs_vcreate() initialised them.
 * vpp:     on entry *vpp is the vnode to attach the inode to; it is
 *          passed to ufs_vinit() and re-read afterwards.
 *
 * Always returns 0.
    265   1.65  perseant  */
    266   1.96  perseant int
    267   1.44  perseant lfs_ialloc(struct lfs *fs, struct vnode *pvp, ino_t new_ino, int new_gen,
    268   1.44  perseant 	   struct vnode **vpp)
    269   1.44  perseant {
    270   1.44  perseant 	struct inode *ip;
    271   1.44  perseant 	struct vnode *vp;
    272   1.40      fvdl 
    273   1.78  perseant 	ASSERT_NO_SEGLOCK(fs);
    274   1.78  perseant 
    275   1.77  perseant 	vp = *vpp;
	/* The inode is built and hashed while ufs_hashlock is held. */
    276  1.100        ad 	mutex_enter(&ufs_hashlock);
    277   1.40      fvdl 	/* Create an inode to associate with the vnode. */
    278   1.44  perseant 	lfs_vcreate(pvp->v_mount, new_ino, vp);
    279   1.51       chs 
    280    1.1   mycroft 	ip = VTOI(vp);
    281  1.105        ad 	mutex_enter(&lfs_lock);
    282   1.73   mycroft 	LFS_SET_UINO(ip, IN_CHANGE);
    283  1.105        ad 	mutex_exit(&lfs_lock);
    284   1.66      fvdl 	/* on-disk structure has been zeroed out by lfs_vcreate */
    285   1.66      fvdl 	ip->i_din.ffs1_din->di_inumber = new_ino;
    286   1.51       chs 
    287   1.79  perseant 	/* Note no blocks yet */
    288   1.79  perseant 	ip->i_lfs_hiblk = -1;
    289   1.79  perseant 
    290    1.1   mycroft 	/* Set a new generation number for this inode. */
    291   1.66      fvdl 	if (new_gen) {
    292   1.66      fvdl 		ip->i_gen = new_gen;
    293   1.66      fvdl 		ip->i_ffs1_gen = new_gen;
    294   1.66      fvdl 	}
    295   1.51       chs 
    296    1.1   mycroft 	/* Insert into the inode hash table. */
    297    1.1   mycroft 	ufs_ihashins(ip);
    298  1.100        ad 	mutex_exit(&ufs_hashlock);
    299   1.44  perseant 
	/*
	 * vp and ip are reloaded after ufs_vinit(), presumably because it
	 * may substitute a different vnode through vpp -- confirm.
	 */
    300   1.77  perseant 	ufs_vinit(vp->v_mount, lfs_specop_p, lfs_fifoop_p, vpp);
    301   1.77  perseant 	vp = *vpp;
    302   1.44  perseant 	ip = VTOI(vp);
    303   1.57      yamt 
	/* Clear all NDADDR entries of the per-inode fragment-size array. */
    304   1.57      yamt 	memset(ip->i_lfs_fragsize, 0, NDADDR * sizeof(*ip->i_lfs_fragsize));
    305   1.51       chs 
    306   1.51       chs 	uvm_vnp_setsize(vp, 0);
    307   1.72      yamt 	lfs_mark_vnode(vp);
    308   1.54       chs 	genfs_node_init(vp, &lfs_genfsops);
	/* Take a reference on the device vnode recorded in the inode. */
    309   1.38  perseant 	VREF(ip->i_devvp);
    310    1.1   mycroft 	return (0);
    311    1.1   mycroft }
    312    1.1   mycroft 
    313    1.1   mycroft /* Create a new vnode/inode pair and initialize what fields we can. */
    314   1.40      fvdl void
    315   1.48  perseant lfs_vcreate(struct mount *mp, ino_t ino, struct vnode *vp)
    316    1.1   mycroft {
    317    1.1   mycroft 	struct inode *ip;
    318   1.66      fvdl 	struct ufs1_dinode *dp;
    319    1.1   mycroft 	struct ufsmount *ump;
    320   1.75     perry 
    321    1.1   mycroft 	/* Get a pointer to the private mount structure. */
    322    1.1   mycroft 	ump = VFSTOUFS(mp);
    323   1.75     perry 
    324   1.78  perseant 	ASSERT_NO_SEGLOCK(ump->um_lfs);
    325   1.78  perseant 
    326    1.1   mycroft 	/* Initialize the inode. */
    327   1.15   thorpej 	ip = pool_get(&lfs_inode_pool, PR_WAITOK);
    328   1.66      fvdl 	memset(ip, 0, sizeof(*ip));
    329   1.66      fvdl 	dp = pool_get(&lfs_dinode_pool, PR_WAITOK);
    330   1.66      fvdl 	memset(dp, 0, sizeof(*dp));
    331   1.63  perseant 	ip->inode_ext.lfs = pool_get(&lfs_inoext_pool, PR_WAITOK);
    332   1.74  perseant 	memset(ip->inode_ext.lfs, 0, sizeof(*ip->inode_ext.lfs));
    333   1.40      fvdl 	vp->v_data = ip;
    334   1.66      fvdl 	ip->i_din.ffs1_din = dp;
    335   1.66      fvdl 	ip->i_ump = ump;
    336   1.40      fvdl 	ip->i_vnode = vp;
    337    1.1   mycroft 	ip->i_devvp = ump->um_devvp;
    338    1.1   mycroft 	ip->i_dev = ump->um_dev;
    339   1.66      fvdl 	ip->i_number = dp->di_inumber = ino;
    340    1.1   mycroft 	ip->i_lfs = ump->um_lfs;
    341   1.66      fvdl 	ip->i_lfs_effnblks = 0;
    342   1.81  perseant 	SPLAY_INIT(&ip->i_lfs_lbtree);
    343   1.82  perseant 	ip->i_lfs_nbtree = 0;
    344   1.91  perseant 	LIST_INIT(&ip->i_lfs_segdhd);
    345    1.1   mycroft #ifdef QUOTA
    346  1.101   hannken 	ufsquota_init(ip);
    347    1.1   mycroft #endif
    348    1.1   mycroft }
    349    1.1   mycroft 
    350   1.87  perseant #if 0
    351   1.87  perseant /*
    352   1.87  perseant  * Find the highest-numbered allocated inode.
    353   1.87  perseant  * This will be used to shrink the Ifile.
 *
 * Currently compiled out (#if 0).  Scans the free bitmap downwards from
 * the last inode the Ifile can describe and returns the first inode whose
 * free bit is clear; if every inode above LFS_UNUSED_INUM is free, the
 * value at which the loop stopped is returned.
    354   1.87  perseant  */
    355   1.87  perseant static inline ino_t
    356   1.87  perseant lfs_last_alloc_ino(struct lfs *fs)
    357   1.87  perseant {
    358   1.87  perseant 	ino_t ino, maxino;
    359   1.87  perseant 
	/* Same capacity formula as lfs_extend_ifile()/lfs_order_freelist(). */
    360   1.87  perseant 	maxino = ((fs->lfs_ivnode->v_size >> fs->lfs_bshift) -
    361   1.87  perseant 		  fs->lfs_cleansz - fs->lfs_segtabsz) * fs->lfs_ifpb;
    362   1.87  perseant 	for (ino = maxino - 1; ino > LFS_UNUSED_INUM; --ino) {
    363   1.87  perseant 		if (ISSET_BITMAP_FREE(fs, ino) == 0)
    364   1.87  perseant 			break;
    365   1.87  perseant 	}
    366   1.87  perseant 	return ino;
    367   1.87  perseant }
    368   1.87  perseant #endif
    369   1.87  perseant 
    370   1.87  perseant /*
    371   1.87  perseant  * Find the previous (next lowest numbered) free inode, if any.
    372   1.87  perseant  * If there is none, return LFS_UNUSED_INUM.
    373   1.87  perseant  */
    374   1.87  perseant static inline ino_t
    375   1.87  perseant lfs_freelist_prev(struct lfs *fs, ino_t ino)
    376   1.87  perseant {
    377   1.88  perseant 	ino_t tino, bound, bb, freehdbb;
    378   1.88  perseant 
    379   1.88  perseant 	if (fs->lfs_freehd == LFS_UNUSED_INUM)	 /* No free inodes at all */
    380   1.88  perseant 		return LFS_UNUSED_INUM;
    381   1.88  perseant 
    382   1.88  perseant 	/* Search our own word first */
    383   1.88  perseant 	bound = ino & ~BMMASK;
    384   1.89  perseant 	for (tino = ino - 1; tino >= bound && tino > LFS_UNUSED_INUM; tino--)
    385   1.88  perseant 		if (ISSET_BITMAP_FREE(fs, tino))
    386   1.88  perseant 			return tino;
    387   1.88  perseant 	/* If there are no lower words to search, just return */
    388   1.88  perseant 	if (ino >> BMSHIFT == 0)
    389   1.88  perseant 		return LFS_UNUSED_INUM;
    390   1.88  perseant 
    391   1.88  perseant 	/*
    392   1.88  perseant 	 * Find a word with a free inode in it.  We have to be a bit
    393   1.88  perseant 	 * careful here since ino_t is unsigned.
    394   1.88  perseant 	 */
    395   1.88  perseant 	freehdbb = (fs->lfs_freehd >> BMSHIFT);
    396   1.88  perseant 	for (bb = (ino >> BMSHIFT) - 1; bb >= freehdbb && bb > 0; --bb)
    397   1.88  perseant 		if (fs->lfs_ino_bitmap[bb])
    398   1.88  perseant 			break;
    399   1.88  perseant 	if (fs->lfs_ino_bitmap[bb] == 0)
    400   1.88  perseant 		return LFS_UNUSED_INUM;
    401   1.88  perseant 
    402   1.88  perseant 	/* Search the word we found */
    403   1.89  perseant 	for (tino = (bb << BMSHIFT) | BMMASK; tino >= (bb << BMSHIFT) &&
    404   1.89  perseant 	     tino > LFS_UNUSED_INUM; tino--)
    405   1.88  perseant 		if (ISSET_BITMAP_FREE(fs, tino))
    406   1.88  perseant 			break;
    407   1.87  perseant 
    408   1.87  perseant 	if (tino <= LFS_IFILE_INUM)
    409   1.87  perseant 		tino = LFS_UNUSED_INUM;
    410   1.87  perseant 
    411   1.87  perseant 	return tino;
    412   1.87  perseant }
    413   1.87  perseant 
    414    1.1   mycroft /* Free an inode. */
    415    1.1   mycroft /* ARGUSED */
    416   1.43  perseant /* VOP_BWRITE 2i times */
    417    1.1   mycroft int
    418   1.99  christos lfs_vfree(struct vnode *vp, ino_t ino, int mode)
    419    1.3  christos {
    420    1.1   mycroft 	SEGUSE *sup;
    421   1.48  perseant 	CLEANERINFO *cip;
    422   1.48  perseant 	struct buf *cbp, *bp;
    423    1.1   mycroft 	struct ifile *ifp;
    424    1.1   mycroft 	struct inode *ip;
    425    1.1   mycroft 	struct lfs *fs;
    426   1.59      fvdl 	daddr_t old_iaddr;
    427   1.85      yamt 	ino_t otail;
    428   1.75     perry 
    429    1.1   mycroft 	/* Get the inode number and file system. */
    430   1.30  perseant 	ip = VTOI(vp);
    431    1.1   mycroft 	fs = ip->i_lfs;
    432    1.1   mycroft 	ino = ip->i_number;
    433   1.34  perseant 
    434   1.78  perseant 	ASSERT_NO_SEGLOCK(fs);
    435   1.88  perseant 	DLOG((DLOG_ALLOC, "lfs_vfree: free ino %lld\n", (long long)ino));
    436   1.78  perseant 
    437   1.48  perseant 	/* Drain of pending writes */
    438  1.105        ad 	mutex_enter(&vp->v_interlock);
    439  1.105        ad 	while (fs->lfs_version > 1 && WRITEINPROG(vp)) {
    440  1.105        ad 		cv_wait(&vp->v_cv, &vp->v_interlock);
    441  1.105        ad 	}
    442  1.105        ad 	mutex_exit(&vp->v_interlock);
    443   1.48  perseant 
    444   1.63  perseant 	lfs_seglock(fs, SEGM_PROT);
    445   1.78  perseant 	vn_lock(fs->lfs_ivnode, LK_EXCLUSIVE);
    446   1.75     perry 
    447   1.72      yamt 	lfs_unmark_vnode(vp);
    448  1.105        ad 	mutex_enter(&lfs_lock);
    449  1.103        ad 	if (vp->v_uflag & VU_DIROP) {
    450  1.103        ad 		vp->v_uflag &= ~VU_DIROP;
    451   1.30  perseant 		--lfs_dirvcount;
    452   1.92  perseant 		--fs->lfs_dirvcount;
    453   1.63  perseant 		TAILQ_REMOVE(&fs->lfs_dchainhd, ip, i_lfs_dchain);
    454   1.92  perseant 		wakeup(&fs->lfs_dirvcount);
    455   1.30  perseant 		wakeup(&lfs_dirvcount);
    456  1.105        ad 		mutex_exit(&lfs_lock);
    457   1.30  perseant 		lfs_vunref(vp);
    458   1.90  perseant 
    459   1.90  perseant 		/*
    460   1.90  perseant 		 * If this inode is not going to be written any more, any
    461   1.90  perseant 		 * segment accounting left over from its truncation needs
    462   1.90  perseant 		 * to occur at the end of the next dirops flush.  Attach
    463   1.90  perseant 		 * them to the fs-wide list for that purpose.
    464   1.90  perseant 		 */
    465   1.90  perseant 		if (LIST_FIRST(&ip->i_lfs_segdhd) != NULL) {
    466   1.90  perseant 			struct segdelta *sd;
    467   1.90  perseant 
    468   1.90  perseant 			while((sd = LIST_FIRST(&ip->i_lfs_segdhd)) != NULL) {
    469   1.90  perseant 				LIST_REMOVE(sd, list);
    470   1.90  perseant 				LIST_INSERT_HEAD(&fs->lfs_segdhd, sd, list);
    471   1.90  perseant 			}
    472   1.90  perseant 		}
    473   1.90  perseant 	} else {
    474   1.90  perseant 		/*
    475   1.90  perseant 		 * If it's not a dirop, we can finalize right away.
    476   1.90  perseant 		 */
    477  1.105        ad 		mutex_exit(&lfs_lock);
    478   1.90  perseant 		lfs_finalize_ino_seguse(fs, ip);
    479   1.38  perseant 	}
    480   1.30  perseant 
    481  1.105        ad 	mutex_enter(&lfs_lock);
    482   1.42  perseant 	LFS_CLR_UINO(ip, IN_ACCESSED|IN_CLEANING|IN_MODIFIED);
    483  1.105        ad 	mutex_exit(&lfs_lock);
    484   1.33  perseant 	ip->i_flag &= ~IN_ALLMOD;
    485   1.93  perseant 	ip->i_lfs_iflags |= LFSI_DELETED;
    486   1.93  perseant 
    487    1.1   mycroft 	/*
    488    1.1   mycroft 	 * Set the ifile's inode entry to unused, increment its version number
    489   1.48  perseant 	 * and link it onto the free chain.
    490    1.1   mycroft 	 */
    491   1.87  perseant 	SET_BITMAP_FREE(fs, ino);
    492    1.1   mycroft 	LFS_IENTRY(ifp, fs, ino, bp);
    493    1.1   mycroft 	old_iaddr = ifp->if_daddr;
    494    1.1   mycroft 	ifp->if_daddr = LFS_UNUSED_DADDR;
    495    1.1   mycroft 	++ifp->if_version;
    496   1.48  perseant 	if (fs->lfs_version == 1) {
    497   1.48  perseant 		LFS_GET_HEADFREE(fs, cip, cbp, &(ifp->if_nextfree));
    498   1.48  perseant 		LFS_PUT_HEADFREE(fs, cip, cbp, ino);
    499   1.56  perseant 		(void) LFS_BWRITE_LOG(bp); /* Ifile */
    500   1.48  perseant 	} else {
    501   1.87  perseant 		ino_t tino, onf;
    502   1.87  perseant 
    503   1.48  perseant 		ifp->if_nextfree = LFS_UNUSED_INUM;
    504   1.56  perseant 		(void) LFS_BWRITE_LOG(bp); /* Ifile */
    505   1.87  perseant 
    506   1.87  perseant 		tino = lfs_freelist_prev(fs, ino);
    507   1.87  perseant 		if (tino == LFS_UNUSED_INUM) {
    508   1.87  perseant 			/* Nothing free below us, put us on the head */
    509   1.87  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    510   1.87  perseant 			LFS_GET_HEADFREE(fs, cip, cbp, &(ifp->if_nextfree));
    511   1.87  perseant 			LFS_PUT_HEADFREE(fs, cip, cbp, ino);
    512   1.88  perseant 			DLOG((DLOG_ALLOC, "lfs_vfree: headfree %lld -> %lld\n",
    513   1.87  perseant 			     (long long)ifp->if_nextfree, (long long)ino));
    514   1.87  perseant 			LFS_BWRITE_LOG(bp); /* Ifile */
    515   1.87  perseant 
    516   1.87  perseant 			/* If the list was empty, set tail too */
    517   1.87  perseant 			LFS_GET_TAILFREE(fs, cip, cbp, &otail);
    518   1.87  perseant 			if (otail == LFS_UNUSED_INUM) {
    519   1.87  perseant 				LFS_PUT_TAILFREE(fs, cip, cbp, ino);
    520   1.87  perseant 				DLOG((DLOG_ALLOC, "lfs_vfree: tailfree %lld "
    521   1.87  perseant 				      "-> %lld\n", (long long)otail,
    522   1.87  perseant 				      (long long)ino));
    523   1.87  perseant 			}
    524   1.87  perseant 		} else {
    525   1.87  perseant 			/*
    526   1.87  perseant 			 * Insert this inode into the list after tino.
    527   1.87  perseant 			 * We hold the segment lock so we don't have to
    528   1.87  perseant 			 * worry about blocks being written out of order.
    529   1.87  perseant 			 */
    530   1.87  perseant 			DLOG((DLOG_ALLOC, "lfs_vfree: insert ino %lld "
    531   1.87  perseant 			      " after %lld\n", ino, tino));
    532   1.87  perseant 
    533   1.87  perseant 			LFS_IENTRY(ifp, fs, tino, bp);
    534   1.87  perseant 			onf = ifp->if_nextfree;
    535   1.87  perseant 			ifp->if_nextfree = ino;
    536   1.87  perseant 			LFS_BWRITE_LOG(bp);	/* Ifile */
    537   1.87  perseant 
    538   1.87  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    539   1.87  perseant 			ifp->if_nextfree = onf;
    540   1.87  perseant 			LFS_BWRITE_LOG(bp);	/* Ifile */
    541   1.87  perseant 
    542   1.87  perseant 			/* If we're last, put us on the tail */
    543   1.87  perseant 			if (onf == LFS_UNUSED_INUM) {
    544   1.87  perseant 				LFS_GET_TAILFREE(fs, cip, cbp, &otail);
    545   1.87  perseant 				LFS_PUT_TAILFREE(fs, cip, cbp, ino);
    546   1.87  perseant 				DLOG((DLOG_ALLOC, "lfs_vfree: tailfree %lld "
    547   1.87  perseant 				      "-> %lld\n", (long long)otail,
    548   1.87  perseant 				      (long long)ino));
    549   1.87  perseant 			}
    550   1.87  perseant 		}
    551   1.48  perseant 	}
    552   1.17  perseant #ifdef DIAGNOSTIC
    553   1.53       chs 	if (ino == LFS_UNUSED_INUM) {
    554   1.17  perseant 		panic("inode 0 freed");
    555   1.17  perseant 	}
    556   1.17  perseant #endif /* DIAGNOSTIC */
    557    1.1   mycroft 	if (old_iaddr != LFS_UNUSED_DADDR) {
    558   1.48  perseant 		LFS_SEGENTRY(sup, fs, dtosn(fs, old_iaddr), bp);
    559   1.22  perseant #ifdef DIAGNOSTIC
    560   1.66      fvdl 		if (sup->su_nbytes < sizeof (struct ufs1_dinode)) {
    561   1.43  perseant 			printf("lfs_vfree: negative byte count"
    562   1.62      yamt 			       " (segment %" PRIu32 " short by %d)\n",
    563   1.48  perseant 			       dtosn(fs, old_iaddr),
    564   1.66      fvdl 			       (int)sizeof (struct ufs1_dinode) -
    565   1.66      fvdl 				    sup->su_nbytes);
    566   1.22  perseant 			panic("lfs_vfree: negative byte count");
    567   1.66      fvdl 			sup->su_nbytes = sizeof (struct ufs1_dinode);
    568   1.17  perseant 		}
    569   1.22  perseant #endif
    570   1.66      fvdl 		sup->su_nbytes -= sizeof (struct ufs1_dinode);
    571   1.63  perseant 		LFS_WRITESEGENTRY(sup, fs, dtosn(fs, old_iaddr), bp); /* Ifile */
    572    1.1   mycroft 	}
    573   1.75     perry 
    574    1.1   mycroft 	/* Set superblock modified bit and decrement file count. */
    575  1.105        ad 	mutex_enter(&lfs_lock);
    576    1.1   mycroft 	fs->lfs_fmod = 1;
    577  1.105        ad 	mutex_exit(&lfs_lock);
    578    1.1   mycroft 	--fs->lfs_nfiles;
    579   1.75     perry 
    580   1.78  perseant 	VOP_UNLOCK(fs->lfs_ivnode, 0);
    581   1.56  perseant 	lfs_segunlock(fs);
    582   1.63  perseant 
    583    1.1   mycroft 	return (0);
    584    1.1   mycroft }
    585   1.87  perseant 
    586   1.87  perseant /*
    587   1.87  perseant  * Sort the freelist and set up the free-inode bitmap.
    588   1.87  perseant  * To be called by lfs_mountfs().
 *
 * Takes the segment lock for the duration.  Allocates a zeroed bitmap
 * sized for every inode the Ifile can describe, then walks all Ifile
 * entries in inode-number order: each entry whose if_daddr is
 * LFS_UNUSED_DADDR is treated as free, gets its bitmap bit set, and is
 * linked after the previously found free entry.  Finally the free-list
 * head and tail are set to the first and last free inodes found
 * (LFS_UNUSED_INUM for both if none were found).
    589   1.87  perseant  */
    590   1.87  perseant void
    591   1.87  perseant lfs_order_freelist(struct lfs *fs)
    592   1.87  perseant {
    593   1.87  perseant 	CLEANERINFO *cip;
    594   1.87  perseant 	IFILE *ifp = NULL;
    595   1.87  perseant 	struct buf *bp;
    596   1.87  perseant 	ino_t ino, firstino, lastino, maxino;
    597   1.97  perseant #ifdef notyet
    598   1.97  perseant 	struct vnode *vp;
    599   1.97  perseant #endif
    600   1.87  perseant 
    601   1.95  perseant 	ASSERT_NO_SEGLOCK(fs);
    602   1.95  perseant 	lfs_seglock(fs, SEGM_PROT);
    603   1.95  perseant 
	/*
	 * Inodes the Ifile can describe: its block count less the
	 * cleaner-info and segment-table blocks, times entries per block.
	 */
    604   1.87  perseant 	maxino = ((fs->lfs_ivnode->v_size >> fs->lfs_bshift) -
    605   1.87  perseant 		  fs->lfs_cleansz - fs->lfs_segtabsz) * fs->lfs_ifpb;
    606   1.88  perseant 	fs->lfs_ino_bitmap = (lfs_bm_t *)
    607   1.88  perseant 		malloc(((maxino + BMMASK) >> BMSHIFT) * sizeof(lfs_bm_t),
    608   1.88  perseant 		       M_SEGMENT, M_WAITOK | M_ZERO);
    609   1.88  perseant 	KASSERT(fs->lfs_ino_bitmap != NULL);
    610   1.87  perseant 
    611   1.87  perseant 	firstino = lastino = LFS_UNUSED_INUM;
    612   1.87  perseant 	for (ino = 0; ino < maxino; ino++) {
		/*
		 * Fetch the Ifile entry at the start of each block; within
		 * a block just step the entry pointer.
		 */
    613   1.87  perseant 		if (ino % fs->lfs_ifpb == 0)
    614   1.87  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    615   1.87  perseant 		else
    616   1.87  perseant 			++ifp;
    617   1.87  perseant 
    618   1.87  perseant 		/* Don't put zero or ifile on the free list */
    619   1.87  perseant 		if (ino == LFS_UNUSED_INUM || ino == LFS_IFILE_INUM)
    620   1.87  perseant 			continue;
    621   1.87  perseant 
		/*
		 * NOTE(review): this disabled section uses `sup', which is
		 * not declared in this function -- fix before enabling.
		 */
    622   1.97  perseant #ifdef notyet
    623   1.97  perseant 		/* Address orphaned files */
    624   1.97  perseant 		if (ifp->if_nextfree == LFS_ORPHAN_NEXTFREE &&
    625   1.97  perseant 		    VFS_VGET(fs->lfs_ivnode->v_mount, ino, &vp) == 0) {
    626  1.104        he 			lfs_truncate(vp, 0, 0, NOCRED);
    627   1.97  perseant 			vput(vp);
    628   1.97  perseant 			LFS_SEGENTRY(sup, fs, dtosn(fs, ifp->if_daddr), bp);
    629   1.97  perseant 			KASSERT(sup->su_nbytes >= DINODE1_SIZE);
    630   1.97  perseant 			sup->su_nbytes -= DINODE1_SIZE;
    631   1.97  perseant 			LFS_WRITESEGENTRY(sup, fs, dtosn(fs, ifp->if_daddr), bp);
    632   1.97  perseant 
    633   1.97  perseant 			/* Set up to fall through to next section */
    634   1.97  perseant 			ifp->if_daddr = LFS_UNUSED_DADDR;
    635   1.97  perseant 			LFS_BWRITE_LOG(bp);
    636   1.97  perseant 			LFS_IENTRY(ifp, fs, ino, bp);
    637   1.97  perseant 		}
    638   1.97  perseant #endif
    639   1.97  perseant 
    640   1.87  perseant 		if (ifp->if_daddr == LFS_UNUSED_DADDR) {
    641   1.87  perseant 			if (firstino == LFS_UNUSED_INUM)
    642   1.87  perseant 				firstino = ino;
    643   1.87  perseant 			else {
				/*
				 * Release the current entry's buffer, point
				 * the previous free entry at this inode, then
				 * fetch the current entry again so the walk
				 * can continue from it.
				 */
    644  1.102        ad 				brelse(bp, 0);
    645   1.87  perseant 
    646   1.87  perseant 				LFS_IENTRY(ifp, fs, lastino, bp);
    647   1.87  perseant 				ifp->if_nextfree = ino;
    648   1.87  perseant 				LFS_BWRITE_LOG(bp);
    649   1.87  perseant 
    650   1.87  perseant 				LFS_IENTRY(ifp, fs, ino, bp);
    651   1.87  perseant 			}
    652   1.87  perseant 			lastino = ino;
    653   1.87  perseant 
    654   1.87  perseant 			SET_BITMAP_FREE(fs, ino);
    655   1.87  perseant 		}
    656   1.87  perseant 
		/* Last entry of this Ifile block: release its buffer. */
    657   1.87  perseant 		if ((ino + 1) % fs->lfs_ifpb == 0)
    658  1.102        ad 			brelse(bp, 0);
    659   1.87  perseant 	}
    660   1.87  perseant 
	/*
	 * NOTE(review): the final free entry's if_nextfree is not rewritten
	 * here and keeps whatever value it already held -- confirm that is
	 * always LFS_UNUSED_INUM.
	 */
    661   1.87  perseant 	LFS_PUT_HEADFREE(fs, cip, bp, firstino);
    662   1.87  perseant 	LFS_PUT_TAILFREE(fs, cip, bp, lastino);
    663   1.95  perseant 
    664   1.95  perseant 	lfs_segunlock(fs);
    665   1.87  perseant }
    666   1.97  perseant 
    667   1.97  perseant void
    668   1.97  perseant lfs_orphan(struct lfs *fs, ino_t ino)
    669   1.97  perseant {
    670   1.97  perseant 	IFILE *ifp;
    671   1.97  perseant 	struct buf *bp;
    672   1.97  perseant 
    673   1.97  perseant 	LFS_IENTRY(ifp, fs, ino, bp);
    674   1.97  perseant 	ifp->if_nextfree = LFS_ORPHAN_NEXTFREE;
    675   1.97  perseant 	LFS_BWRITE_LOG(bp);
    676   1.97  perseant }
    677