Home | History | Annotate | Line # | Download | only in nilfs
nilfs_subr.c revision 1.12
      1 /* $NetBSD: nilfs_subr.c,v 1.12 2014/10/15 09:05:46 hannken Exp $ */
      2 
      3 /*
      4  * Copyright (c) 2008, 2009 Reinoud Zandijk
      5  * All rights reserved.
      6  *
      7  * Redistribution and use in source and binary forms, with or without
      8  * modification, are permitted provided that the following conditions
      9  * are met:
     10  * 1. Redistributions of source code must retain the above copyright
     11  *    notice, this list of conditions and the following disclaimer.
     12  * 2. Redistributions in binary form must reproduce the above copyright
     13  *    notice, this list of conditions and the following disclaimer in the
     14  *    documentation and/or other materials provided with the distribution.
     15  *
     16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     17  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     18  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     19  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     20  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     21  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     22  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     23  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     24  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     25  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     26  *
     27  */
     28 
     29 #include <sys/cdefs.h>
     30 #ifndef lint
     31 __KERNEL_RCSID(0, "$NetBSD: nilfs_subr.c,v 1.12 2014/10/15 09:05:46 hannken Exp $");
     32 #endif /* not lint */
     33 
     34 #include <sys/param.h>
     35 #include <sys/systm.h>
     36 #include <sys/namei.h>
     37 #include <sys/resourcevar.h>	/* defines plimit structure in proc struct */
     38 #include <sys/kernel.h>
     39 #include <sys/file.h>		/* define FWRITE ... */
     40 #include <sys/stat.h>
     41 #include <sys/buf.h>
     42 #include <sys/proc.h>
     43 #include <sys/mount.h>
     44 #include <sys/vnode.h>
     45 #include <sys/signalvar.h>
     46 #include <sys/malloc.h>
     47 #include <sys/dirent.h>
     48 #include <sys/lockf.h>
     49 #include <sys/kauth.h>
     50 #include <sys/dirhash.h>
     51 
     52 #include <miscfs/genfs/genfs.h>
     53 #include <uvm/uvm_extern.h>
     54 
     55 #include <fs/nilfs/nilfs_mount.h>
     56 #include "nilfs.h"
     57 #include "nilfs_subr.h"
     58 #include "nilfs_bswap.h"
     59 
     60 
/* Fetch the nilfs_node stored in the v_data field of a vnode. */
#define VTOI(vnode) ((struct nilfs_node *)(vnode)->v_data)
     62 
     63 /* forwards */
     64 static int nilfs_btree_lookup(struct nilfs_node *node, uint64_t lblocknr,
     65 	uint64_t *vblocknr);
     66 
     67 /* basic calculators */
     68 uint64_t nilfs_get_segnum_of_block(struct nilfs_device *nilfsdev,
     69 	uint64_t blocknr)
     70 {
     71 	return blocknr / nilfs_rw32(nilfsdev->super.s_blocks_per_segment);
     72 }
     73 
     74 
     75 void
     76 nilfs_get_segment_range(struct nilfs_device *nilfsdev, uint64_t segnum,
     77         uint64_t *seg_start, uint64_t *seg_end)
     78 {
     79         uint64_t blks_per_seg;
     80 
     81         blks_per_seg = nilfs_rw64(nilfsdev->super.s_blocks_per_segment);
     82         *seg_start = blks_per_seg * segnum;
     83         *seg_end   = *seg_start + blks_per_seg -1;
     84         if (segnum == 0)
     85                 *seg_start = nilfs_rw64(nilfsdev->super.s_first_data_block);
     86 }
     87 
     88 
     89 void nilfs_calc_mdt_consts(struct nilfs_device *nilfsdev,
     90 	struct nilfs_mdt *mdt, int entry_size)
     91 {
     92 	uint32_t blocksize = nilfsdev->blocksize;
     93 
     94 	mdt->entries_per_group = blocksize * 8;	   /* bits in sector */
     95 	mdt->entries_per_block = blocksize / entry_size;
     96 
     97 	mdt->blocks_per_group  =
     98 		(mdt->entries_per_group -1) / mdt->entries_per_block + 1 + 1;
     99 	mdt->groups_per_desc_block =
    100 		blocksize / sizeof(struct nilfs_block_group_desc);
    101 	mdt->blocks_per_desc_block =
    102 		mdt->groups_per_desc_block * mdt->blocks_per_group + 1;
    103 }
    104 
    105 
/*
 * Table driven CRC-32 update, two 4 bit steps per input byte, using the
 * 16 entry table of the reflected polynomial 0xedb88320.
 * From NetBSD's src/sys/net/if_ethersubr.c.
 *
 * `crc' is the running value (seed) and the updated value is returned.
 * No initial or final inversion is applied here; a zero length input
 * returns the seed unchanged.
 */
uint32_t
crc32_le(uint32_t crc, const uint8_t *buf, size_t len)
{
	static const uint32_t nibble_tab[] = {
		0x00000000, 0x1db71064, 0x3b6e20c8, 0x26d930ac,
		0x76dc4190, 0x6b6b51f4, 0x4db26158, 0x5005713c,
		0xedb88320, 0xf00f9344, 0xd6d6a3e8, 0xcb61b38c,
		0x9b64c2b0, 0x86d3d2d4, 0xa00ae278, 0xbdbdf21c
	};

	for (; len > 0; len--, buf++) {
		crc ^= *buf;
		/* low nibble first, then the high nibble */
		crc = (crc >> 4) ^ nibble_tab[crc & 0xf];
		crc = (crc >> 4) ^ nibble_tab[crc & 0xf];
	}

	return crc;
}
    126 
    127 
    128 /* dev reading */
    129 static int
    130 nilfs_dev_bread(struct nilfs_device *nilfsdev, uint64_t blocknr,
    131 	struct kauth_cred *cred, int flags, struct buf **bpp)
    132 {
    133 	int blk2dev = nilfsdev->blocksize / DEV_BSIZE;
    134 
    135 	return bread(nilfsdev->devvp, blocknr * blk2dev, nilfsdev->blocksize,
    136 		NOCRED, 0, bpp);
    137 }
    138 
    139 
    140 /* read on a node */
    141 int
    142 nilfs_bread(struct nilfs_node *node, uint64_t blocknr,
    143 	struct kauth_cred *cred, int flags, struct buf **bpp)
    144 {
    145 	struct nilfs_device *nilfsdev = node->nilfsdev;
    146 	uint64_t vblocknr, pblockno;
    147 	int error;
    148 
    149 	error = nilfs_btree_lookup(node, blocknr, &vblocknr);
    150 	if (error)
    151 		return error;
    152 
    153 	/* Read special files through devvp as they have no vnode attached. */
    154 	if (node->ino < NILFS_USER_INO && node->ino != NILFS_ROOT_INO) {
    155 		error = nilfs_nvtop(node, 1, &vblocknr, &pblockno);
    156 		if (error)
    157 			return error;
    158 		return nilfs_dev_bread(nilfsdev, pblockno, cred, flags, bpp);
    159 	}
    160 
    161 	return bread(node->vnode, vblocknr, node->nilfsdev->blocksize,
    162 		cred, flags, bpp);
    163 }
    164 
    165 
    166 /* segment-log reading */
    167 int
    168 nilfs_get_segment_log(struct nilfs_device *nilfsdev, uint64_t *blocknr,
    169 	uint64_t *offset, struct buf **bpp, int len, void *blob)
    170 {
    171 	int blocksize = nilfsdev->blocksize;
    172 	int error;
    173 
    174 	KASSERT(len <= blocksize);
    175 
    176 	if (*offset + len > blocksize) {
    177 		*blocknr = *blocknr + 1;
    178 		*offset = 0;
    179 	}
    180 	if (*offset == 0) {
    181 		if (*bpp)
    182 			brelse(*bpp, BC_AGE);
    183 		/* read in block */
    184 		error = nilfs_dev_bread(nilfsdev, *blocknr, NOCRED, 0, bpp);
    185 		if (error)
    186 			return error;
    187 	}
    188 	memcpy(blob, ((uint8_t *) (*bpp)->b_data) + *offset, len);
    189 	*offset += len;
    190 
    191 	return 0;
    192 }
    193 
    194 /* -------------------------------------------------------------------------- */
    195 
    196 /* btree operations */
    197 
    198 static int
    199 nilfs_btree_lookup_level(struct nilfs_node *node, uint64_t lblocknr,
    200 		uint64_t btree_vblknr, int level, uint64_t *vblocknr)
    201 {
    202 	struct nilfs_device *nilfsdev = node->nilfsdev;
    203 	struct nilfs_btree_node *btree_hdr;
    204 	struct buf *bp;
    205 	uint64_t btree_blknr;
    206 	uint64_t *dkeys, *dptrs, child_btree_blk;
    207 	uint8_t  *pos;
    208 	int i, error, selected;
    209 
    210 	DPRINTF(TRANSLATE, ("nilfs_btree_lookup_level ino %"PRIu64", "
    211 		"lblocknr %"PRIu64", btree_vblknr %"PRIu64", level %d\n",
    212 		node->ino, lblocknr, btree_vblknr, level));
    213 
    214 	/* translate btree_vblknr */
    215 	error = nilfs_nvtop(node, 1, &btree_vblknr, &btree_blknr);
    216 	if (error)
    217 		return error;
    218 
    219 	/* get our block */
    220 	error = nilfs_dev_bread(nilfsdev, btree_blknr, NOCRED, 0, &bp);
    221 	if (error) {
    222 		return error;
    223 	}
    224 
    225 	btree_hdr = (struct nilfs_btree_node *) bp->b_data;
    226 	pos =   (uint8_t *) bp->b_data +
    227 		sizeof(struct nilfs_btree_node) +
    228 		NILFS_BTREE_NODE_EXTRA_PAD_SIZE;
    229 	dkeys = (uint64_t *) pos;
    230 	dptrs = dkeys + NILFS_BTREE_NODE_NCHILDREN_MAX(nilfsdev->blocksize);
    231 
    232 	assert((btree_hdr->bn_flags & NILFS_BTREE_NODE_ROOT) == 0);
    233 
    234 	/* select matching child XXX could use binary search */
    235 	selected = 0;
    236 	for (i = 0; i < nilfs_rw16(btree_hdr->bn_nchildren); i++) {
    237 		if (dkeys[i] > lblocknr)
    238 			break;
    239 		selected = i;
    240 	}
    241 
    242 	if (level == 1) {
    243 		/* if found it mapped */
    244 		if (dkeys[selected] == lblocknr)
    245 			*vblocknr = dptrs[selected];
    246 		brelse(bp, BC_AGE);
    247 		return 0;
    248 	}
    249 
    250 	/* lookup in selected child */
    251 	assert(dkeys[selected] <= lblocknr);
    252 	child_btree_blk = dptrs[selected];
    253 	brelse(bp, BC_AGE);
    254 
    255 	return nilfs_btree_lookup_level(node, lblocknr,
    256 			child_btree_blk, btree_hdr->bn_level-1, vblocknr);
    257 }
    258 
    259 
    260 /* internal function */
    261 static int
    262 nilfs_btree_lookup(struct nilfs_node *node, uint64_t lblocknr,
    263 		uint64_t *vblocknr)
    264 {
    265 	struct nilfs_inode  *inode    = &node->inode;
    266 	struct nilfs_btree_node  *btree_hdr;
    267 	uint64_t *dkeys, *dptrs, *dtrans;
    268 	int i, selected;
    269 	int error;
    270 
    271 	DPRINTF(TRANSLATE, ("nilfs_btree_lookup ino %"PRIu64", "
    272 		"lblocknr %"PRIu64"\n", node->ino, lblocknr));
    273 
    274 	btree_hdr  = (struct nilfs_btree_node *) &inode->i_bmap[0];
    275 	dkeys  = &inode->i_bmap[1];
    276 	dptrs  = dkeys + NILFS_BTREE_ROOT_NCHILDREN_MAX;
    277 	dtrans = &inode->i_bmap[1];
    278 
    279 	/* SMALL, direct lookup */
    280 	*vblocknr = 0;
    281 	if ((btree_hdr->bn_flags & NILFS_BMAP_LARGE) == 0) {
    282 		if (lblocknr < NILFS_DIRECT_NBLOCKS) {
    283 			*vblocknr = dtrans[lblocknr];
    284 			return 0;
    285 		}
    286 		/* not mapped XXX could be considered error here */
    287 		return 0;
    288 	}
    289 
    290 	/* LARGE, select matching child; XXX could use binary search */
    291 	dtrans = NULL;
    292 	error = 0;
    293 	selected = 0;
    294 	for (i = 0; i < nilfs_rw16(btree_hdr->bn_nchildren); i++) {
    295 		if (dkeys[i] > lblocknr)
    296 			break;
    297 		selected = i;
    298 	}
    299 
    300 	/* if selected key > lblocknr, its not mapped */
    301 	if (dkeys[selected] > lblocknr)
    302 		return 0;
    303 
    304 	/* overshooting? then not mapped */
    305 	if (selected == nilfs_rw16(btree_hdr->bn_nchildren))
    306 		return 0;
    307 
    308 	/* level should be > 1 or otherwise it should be a direct one */
    309 	assert(btree_hdr->bn_level > 1);
    310 
    311 	/* lookup in selected child */
    312 	assert(dkeys[selected] <= lblocknr);
    313 	error = nilfs_btree_lookup_level(node, lblocknr,
    314 			dptrs[selected], btree_hdr->bn_level-1, vblocknr);
    315 
    316 	return error;
    317 }
    318 
    319 
    320 /* node should be locked on entry to prevent btree changes (unlikely) */
    321 int
    322 nilfs_btree_nlookup(struct nilfs_node *node, uint64_t from, uint64_t blks,
    323 		uint64_t *l2vmap)
    324 {
    325 	uint64_t lblocknr, *vblocknr;
    326 	int i, error;
    327 
    328 	/* TODO / OPTI multiple translations in one go possible */
    329 	error = EINVAL;
    330 	for (i = 0; i < blks; i++) {
    331 		lblocknr  = from + i;
    332 		vblocknr  = l2vmap + i;
    333 		error = nilfs_btree_lookup(node, lblocknr, vblocknr);
    334 
    335 		DPRINTF(TRANSLATE, ("btree_nlookup ino %"PRIu64", "
    336 			"lblocknr %"PRIu64" -> %"PRIu64"\n",
    337 			node->ino, lblocknr, *vblocknr));
    338 		if (error)
    339 			break;
    340 	}
    341 
    342 	return error;
    343 }
    344 
    345 /* --------------------------------------------------------------------- */
    346 
    347 /* vtop operations */
    348 
    349 /* translate index to a file block number and an entry */
    350 void
    351 nilfs_mdt_trans(struct nilfs_mdt *mdt, uint64_t index,
    352 	uint64_t *blocknr, uint32_t *entry_in_block)
    353 {
    354 	uint64_t blknr;
    355 	uint64_t group, group_offset, blocknr_in_group;
    356 	uint64_t desc_block, desc_offset;
    357 
    358 	/* calculate our offset in the file */
    359 	group             = index / mdt->entries_per_group;
    360 	group_offset      = index % mdt->entries_per_group;
    361 	desc_block        = group / mdt->groups_per_desc_block;
    362 	desc_offset       = group % mdt->groups_per_desc_block;
    363 	blocknr_in_group  = group_offset / mdt->entries_per_block;
    364 
    365 	/* to descgroup offset */
    366 	blknr = 1 + desc_block * mdt->blocks_per_desc_block;
    367 
    368 	/* to group offset */
    369 	blknr += desc_offset * mdt->blocks_per_group;
    370 
    371 	/* to actual file block */
    372 	blknr += 1 + blocknr_in_group;
    373 
    374 	*blocknr        = blknr;
    375 	*entry_in_block = group_offset % mdt->entries_per_block;
    376 }
    377 
    378 
    379 static int
    380 nilfs_vtop(struct nilfs_device *nilfsdev, uint64_t vblocknr, uint64_t *pblocknr)
    381 {
    382 	struct nilfs_dat_entry *entry;
    383 	struct buf *bp;
    384 	uint64_t  ldatblknr;
    385 	uint32_t  entry_in_block;
    386 	int error;
    387 
    388 	nilfs_mdt_trans(&nilfsdev->dat_mdt, vblocknr,
    389 		&ldatblknr, &entry_in_block);
    390 
    391 	error = nilfs_bread(nilfsdev->dat_node, ldatblknr, NOCRED, 0, &bp);
    392 	if (error) {
    393 		printf("vtop: can't read in DAT block %"PRIu64"!\n", ldatblknr);
    394 		return error;
    395 	}
    396 
    397 	/* get our translation */
    398 	entry = ((struct nilfs_dat_entry *) bp->b_data) + entry_in_block;
    399 #if 0
    400 	printf("\tvblk %4"PRIu64" -> %"PRIu64" for "
    401 		"checkpoint %"PRIu64" to %"PRIu64"\n",
    402 		vblocknr,
    403 		nilfs_rw64(entry->de_blocknr),
    404 		nilfs_rw64(entry->de_start),
    405 		nilfs_rw64(entry->de_end));
    406 #endif
    407 
    408 	*pblocknr = nilfs_rw64(entry->de_blocknr);
    409 	brelse(bp, BC_AGE);
    410 
    411 	return 0;
    412 }
    413 
    414 
    415 int
    416 nilfs_nvtop(struct nilfs_node *node, uint64_t blks, uint64_t *l2vmap,
    417 		uint64_t *v2pmap)
    418 {
    419 	uint64_t vblocknr, *pblocknr;
    420 	int i, error;
    421 
    422 	/* the DAT inode is the only one not mapped virtual */
    423 	if (node->ino == NILFS_DAT_INO) {
    424 		memcpy(v2pmap, l2vmap, blks * sizeof(uint64_t));
    425 		return 0;
    426 	}
    427 
    428 	/* TODO / OPTI more translations in one go */
    429 	error = 0;
    430 	for (i = 0; i < blks; i++) {
    431 		vblocknr  = l2vmap[i];
    432 		pblocknr  = v2pmap + i;
    433 		*pblocknr = 0;
    434 
    435 		/* only translate valid vblocknrs */
    436 		if (vblocknr == 0)
    437 			continue;
    438 		error = nilfs_vtop(node->nilfsdev, vblocknr, pblocknr);
    439 		if (error)
    440 			break;
    441 	}
    442 
    443 	return error;
    444 }
    445 
    446 /* --------------------------------------------------------------------- */
    447 
    448 struct nilfs_recover_info {
    449 	uint64_t segnum;
    450 	uint64_t pseg;
    451 
    452 	struct nilfs_segment_summary segsum;
    453 	struct nilfs_super_root      super_root;
    454 	STAILQ_ENTRY(nilfs_recover_info) next;
    455 };
    456 
    457 
    458 /*
    459  * Helper functions of nilfs_mount() that actually mounts the disc.
    460  */
    461 static int
    462 nilfs_load_segsum(struct nilfs_device *nilfsdev,
    463 	struct nilfs_recover_info *ri)
    464 {
    465 	struct buf *bp;
    466 	uint64_t blocknr, offset;
    467 	uint32_t segsum_struct_size;
    468 	uint32_t magic;
    469 	int error;
    470 
    471 	segsum_struct_size = sizeof(struct nilfs_segment_summary);
    472 
    473 	/* read in segsum structure */
    474 	bp      = NULL;
    475 	blocknr = ri->pseg;
    476 	offset  = 0;
    477 	error = nilfs_get_segment_log(nilfsdev,
    478 			&blocknr, &offset, &bp,
    479 			segsum_struct_size, (void *) &ri->segsum);
    480 	if (error)
    481 		goto out;
    482 
    483 	/* sanity checks */
    484 	magic = nilfs_rw32(ri->segsum.ss_magic);
    485 	if (magic != NILFS_SEGSUM_MAGIC) {
    486 		DPRINTF(VOLUMES, ("nilfs: bad magic in pseg %"PRIu64"\n",
    487 			ri->pseg));
    488 		error = EINVAL;
    489 		goto out;
    490 	}
    491 
    492 	/* TODO check segment summary checksum */
    493 	/* TODO check data checksum */
    494 
    495 out:
    496 	if (bp)
    497 		brelse(bp, BC_AGE);
    498 
    499 	return error;
    500 }
    501 
    502 
    503 static int
    504 nilfs_load_super_root(struct nilfs_device *nilfsdev,
    505 	struct nilfs_recover_info *ri)
    506 {
    507 	struct nilfs_segment_summary *segsum = &ri->segsum;
    508 	struct nilfs_super_root *super_root;
    509 	struct buf *bp;
    510 	uint64_t blocknr, offset;
    511 	uint32_t segsum_size, size;
    512 	uint32_t nsumblk, nfileblk;
    513 	uint32_t super_root_crc, comp_crc;
    514 	int off, error;
    515 
    516 	/* process segment summary */
    517 	segsum_size = nilfs_rw32(segsum->ss_sumbytes);
    518 	nsumblk     = (segsum_size - 1) / nilfsdev->blocksize + 1;
    519 	nfileblk    = nilfs_rw32(segsum->ss_nblocks) - nsumblk;
    520 
    521 	/* check if there is a superroot */
    522 	if ((nilfs_rw16(segsum->ss_flags) & NILFS_SS_SR) == 0) {
    523 		DPRINTF(VOLUMES, ("nilfs: no super root in pseg %"PRIu64"\n",
    524 			ri->pseg));
    525 		return ENOENT;
    526 	}
    527 
    528 	/* get our super root, located at the end of the pseg */
    529 	blocknr = ri->pseg + nsumblk + nfileblk - 1;
    530 	offset = 0;
    531 	size = sizeof(struct nilfs_super_root);
    532 	bp = NULL;
    533 	error = nilfs_get_segment_log(nilfsdev,
    534 			&blocknr, &offset, &bp,
    535 			size, (void *) &nilfsdev->super_root);
    536 	if (bp)
    537 		brelse(bp, BC_AGE);
    538 	if (error) {
    539 		printf("read in of superroot failed\n");
    540 		return EIO;
    541 	}
    542 
    543 	/* check super root crc */
    544 	super_root = &nilfsdev->super_root;
    545 	super_root_crc = nilfs_rw32(super_root->sr_sum);
    546 	off = sizeof(super_root->sr_sum);
    547 	comp_crc = crc32_le(nilfs_rw32(nilfsdev->super.s_crc_seed),
    548 		(uint8_t *) super_root + off,
    549 		NILFS_SR_BYTES - off);
    550 	if (super_root_crc != comp_crc) {
    551 		DPRINTF(VOLUMES, ("    invalid superroot, likely from old format\n"));
    552 		return EINVAL;
    553 	}
    554 
    555 	DPRINTF(VOLUMES, ("    got valid superroot\n"));
    556 
    557 	return 0;
    558 }
    559 
    560 /*
    561  * Search for the last super root recorded.
    562  */
    563 void
    564 nilfs_search_super_root(struct nilfs_device *nilfsdev)
    565 {
    566 	struct nilfs_super_block *super;
    567 	struct nilfs_segment_summary *segsum;
    568 	struct nilfs_recover_info *ri, *ori, *i_ri;
    569 	STAILQ_HEAD(,nilfs_recover_info) ri_list;
    570 	uint64_t seg_start, seg_end, cno;
    571 	uint32_t segsum_size;
    572 	uint32_t nsumblk, nfileblk;
    573 	int error;
    574 
    575 	STAILQ_INIT(&ri_list);
    576 
    577 	/* search for last super root */
    578 	ri = malloc(sizeof(struct nilfs_recover_info), M_NILFSTEMP, M_WAITOK);
    579 	memset(ri, 0, sizeof(struct nilfs_recover_info));
    580 
    581 	/* if enabled, start from the specified position */
    582 	if (0) {
    583 		/* start from set start */
    584 		nilfsdev->super.s_last_pseg = nilfsdev->super.s_first_data_block;
    585 		nilfsdev->super.s_last_cno  = nilfs_rw64(1);
    586 	}
    587 
    588 	ri->pseg   = nilfs_rw64(nilfsdev->super.s_last_pseg); /* blknr */
    589 	ri->segnum = nilfs_get_segnum_of_block(nilfsdev, ri->pseg);
    590 
    591 	error = 0;
    592 	cno = nilfs_rw64(nilfsdev->super.s_last_cno);
    593 	DPRINTF(VOLUMES, ("nilfs: seach_super_root start in pseg %"PRIu64"\n",
    594 			ri->pseg));
    595 	for (;;) {
    596 		DPRINTF(VOLUMES, (" at pseg %"PRIu64"\n", ri->pseg));
    597 		error = nilfs_load_segsum(nilfsdev, ri);
    598 		if (error)
    599 			break;
    600 
    601 		segsum = &ri->segsum;
    602 
    603 		/* try to load super root */
    604 		if (nilfs_rw16(segsum->ss_flags) & NILFS_SS_SR) {
    605 			DPRINTF(VOLUMES, (" try super root\n"));
    606 			error = nilfs_load_super_root(nilfsdev, ri);
    607 			if (error)
    608 				break;	/* confused */
    609 			/* wipe current list of ri */
    610 			while (!STAILQ_EMPTY(&ri_list)) {
    611 				i_ri = STAILQ_FIRST(&ri_list);
    612 				STAILQ_REMOVE_HEAD(&ri_list, next);
    613 				free(i_ri, M_NILFSTEMP);
    614 			}
    615 			super = &nilfsdev->super;
    616 
    617 			super->s_last_pseg = nilfs_rw64(ri->pseg);
    618 			super->s_last_cno  = cno++;
    619 			super->s_last_seq  = segsum->ss_seq;
    620 			super->s_state     = nilfs_rw16(NILFS_VALID_FS);
    621 		} else {
    622 			STAILQ_INSERT_TAIL(&ri_list, ri, next);
    623 			ori = ri;
    624 			ri = malloc(sizeof(struct nilfs_recover_info),
    625 				M_NILFSTEMP, M_WAITOK);
    626 			memset(ri, 0, sizeof(struct nilfs_recover_info));
    627 			ri->segnum = ori->segnum;
    628 			ri->pseg   = ori->pseg;
    629 			/* segsum keeps pointing to the `old' ri */
    630 		}
    631 
    632 		/* continue to the next pseg */
    633 		segsum_size = nilfs_rw32(segsum->ss_sumbytes);
    634 		nsumblk     = (segsum_size - 1) / nilfsdev->blocksize + 1;
    635 		nfileblk    = nilfs_rw32(segsum->ss_nblocks) - nsumblk;
    636 
    637 		/* calculate next partial segment location */
    638 		ri->pseg += nsumblk + nfileblk;
    639 
    640 		/* did we reach the end of the segment? if so, go to the next */
    641 		nilfs_get_segment_range(nilfsdev, ri->segnum, &seg_start, &seg_end);
    642 		if (ri->pseg >= seg_end)
    643 			ri->pseg = nilfs_rw64(segsum->ss_next);
    644 		ri->segnum = nilfs_get_segnum_of_block(nilfsdev, ri->pseg);
    645 	}
    646 
    647 	/*
    648 	 * XXX No roll-forward yet of the remaining partial segments.
    649 	 */
    650 
    651 	/* wipe current list of ri */
    652 	while (!STAILQ_EMPTY(&ri_list)) {
    653 		i_ri = STAILQ_FIRST(&ri_list);
    654 		STAILQ_REMOVE_HEAD(&ri_list, next);
    655 		printf("nilfs: ignoring pseg at %"PRIu64"\n", i_ri->pseg);
    656 		free(i_ri, M_NILFSTEMP);
    657 	}
    658 	free(ri, M_NILFSTEMP);
    659 }
    660 
    661 /* --------------------------------------------------------------------- */
    662 
    663 int
    664 nilfs_get_node_raw(struct nilfs_device *nilfsdev, struct nilfs_mount *ump,
    665 	uint64_t ino, struct nilfs_inode *inode, struct nilfs_node **nodep)
    666 {
    667 	struct nilfs_node *node;
    668 
    669 	*nodep = NULL;
    670 
    671 	node = pool_get(&nilfs_node_pool, PR_WAITOK);
    672 	memset(node, 0, sizeof(struct nilfs_node));
    673 
    674 	/* crosslink */
    675 	node->ump      = ump;
    676 	node->nilfsdev = nilfsdev;
    677 
    678 	/* initiase nilfs node */
    679 	node->ino   = ino;
    680 	node->inode = *inode;
    681 	node->lockf = NULL;
    682 
    683 	/* initialise locks */
    684 	mutex_init(&node->node_mutex, MUTEX_DEFAULT, IPL_NONE);
    685 	cv_init(&node->node_lock, "nilfsnlk");
    686 
    687 	/* fixup inode size for system nodes */
    688 	if ((ino < NILFS_USER_INO) && (ino != NILFS_ROOT_INO)) {
    689 		DPRINTF(VOLUMES, ("NEED TO GET my size for inode %"PRIu64"\n",
    690 			ino));
    691 		/* for now set it to maximum, -1 is illegal */
    692 		inode->i_size = nilfs_rw64(((uint64_t) -2));
    693 	}
    694 
    695 	/* return node */
    696 	*nodep = node;
    697 	return 0;
    698 }
    699 
    700 void
    701 nilfs_dispose_node(struct nilfs_node **nodep)
    702 {
    703 	struct nilfs_node *node;
    704 
    705 	/* protect against rogue values */
    706 	if (!*nodep)
    707 		return;
    708 
    709 	node = *nodep;
    710 
    711 	/* remove dirhash if present */
    712 	dirhash_purge(&node->dir_hash);
    713 
    714 	/* destroy our locks */
    715 	mutex_destroy(&node->node_mutex);
    716 	cv_destroy(&node->node_lock);
    717 
    718 	/* free our associated memory */
    719 	pool_put(&nilfs_node_pool, node);
    720 
    721 	*nodep = NULL;
    722 }
    723 
    724 
/*
 * Timestamp update hook.  Intentionally empty: none of the arguments is
 * read or modified.
 */
void
nilfs_itimes(struct nilfs_node *node, struct timespec *acc,
	struct timespec *mod, struct timespec *birth)
{
	/* nothing to do */
}
    730 
    731 
/*
 * Write back timestamps of a vnode.  Not supported: always fails with
 * EROFS without looking at its arguments.
 */
int
nilfs_update(struct vnode *node, struct timespec *acc, struct timespec *mod,
	struct timespec *birth, int updflags)
{
	return EROFS;
}
    738 
    739 
    740 int
    741 nilfs_chsize(struct vnode *vp, u_quad_t newsize, kauth_cred_t cred)
    742 {
    743 	return EROFS;
    744 }
    745 
    746 
    747 
/*
 * Grow a node to `new_size'.  Not supported: always fails with EROFS
 * without looking at its arguments.
 */
int
nilfs_grow_node(struct nilfs_node *node, uint64_t new_size)
{
	return EROFS;
}
    753 
    754 
/*
 * Shrink a node to `new_size'.  Not supported: always fails with EROFS
 * without looking at its arguments.
 */
int
nilfs_shrink_node(struct nilfs_node *node, uint64_t new_size)
{
	return EROFS;
}
    760 
    761 
    762 static int
    763 dirhash_fill(struct nilfs_node *dir_node)
    764 {
    765 	struct vnode *dvp = dir_node->vnode;
    766 	struct dirhash *dirh;
    767 	struct nilfs_dir_entry *ndirent;
    768 	struct dirent dirent;
    769 	struct buf *bp;
    770 	uint64_t file_size, diroffset, blkoff;
    771 	uint64_t blocknr;
    772 	uint32_t blocksize = dir_node->nilfsdev->blocksize;
    773 	uint8_t *pos, name_len;
    774 	int error;
    775 
    776 	DPRINTF(CALL, ("dirhash_fill called\n"));
    777 
    778 	if (dvp->v_type != VDIR)
    779 		return ENOTDIR;
    780 
    781 	/* make sure we have a dirhash to work on */
    782 	dirh = dir_node->dir_hash;
    783 	KASSERT(dirh);
    784 	KASSERT(dirh->refcnt > 0);
    785 
    786 	if (dirh->flags & DIRH_BROKEN)
    787 		return EIO;
    788 
    789 	if (dirh->flags & DIRH_COMPLETE)
    790 		return 0;
    791 
    792 	DPRINTF(DIRHASH, ("Filling directory hash\n"));
    793 
    794 	/* make sure we have a clean dirhash to add to */
    795 	dirhash_purge_entries(dirh);
    796 
    797 	/* get directory filesize */
    798 	file_size = nilfs_rw64(dir_node->inode.i_size);
    799 
    800 	/* walk the directory */
    801 	error = 0;
    802 	diroffset = 0;
    803 
    804 	blocknr = diroffset / blocksize;
    805 	blkoff  = diroffset % blocksize;
    806 	error = nilfs_bread(dir_node, blocknr, NOCRED, 0, &bp);
    807 	if (error) {
    808 		dirh->flags |= DIRH_BROKEN;
    809 		dirhash_purge_entries(dirh);
    810 		return EIO;
    811 	}
    812 	while (diroffset < file_size) {
    813 		DPRINTF(READDIR, ("filldir : offset = %"PRIu64"\n",
    814 			diroffset));
    815 		if (blkoff >= blocksize) {
    816 			blkoff = 0; blocknr++;
    817 			brelse(bp, BC_AGE);
    818 			error = nilfs_bread(dir_node, blocknr, NOCRED, 0,
    819 					&bp);
    820 			if (error) {
    821 				dirh->flags |= DIRH_BROKEN;
    822 				dirhash_purge_entries(dirh);
    823 				return EIO;
    824 			}
    825 		}
    826 
    827 		/* read in one dirent */
    828 		pos = (uint8_t *) bp->b_data + blkoff;
    829 		ndirent = (struct nilfs_dir_entry *) pos;
    830 		name_len = ndirent->name_len;
    831 
    832 		memset(&dirent, 0, sizeof(struct dirent));
    833 		dirent.d_fileno = nilfs_rw64(ndirent->inode);
    834 		dirent.d_type   = ndirent->file_type;	/* 1:1 ? */
    835 		dirent.d_namlen = name_len;
    836 		strncpy(dirent.d_name, ndirent->name, name_len);
    837 		dirent.d_reclen = _DIRENT_SIZE(&dirent);
    838 		DPRINTF(DIRHASH, ("copying `%*.*s`\n", name_len,
    839 			name_len, dirent.d_name));
    840 
    841 		/* XXX is it deleted? extra free space? */
    842 		dirhash_enter(dirh, &dirent, diroffset,
    843 			nilfs_rw16(ndirent->rec_len), 0);
    844 
    845 		/* advance */
    846 		diroffset += nilfs_rw16(ndirent->rec_len);
    847 		blkoff    += nilfs_rw16(ndirent->rec_len);
    848 	}
    849 	brelse(bp, BC_AGE);
    850 
    851 	dirh->flags |= DIRH_COMPLETE;
    852 
    853 	return 0;
    854 }
    855 
    856 
    857 int
    858 nilfs_lookup_name_in_dir(struct vnode *dvp, const char *name, int namelen,
    859 		uint64_t *ino, int *found)
    860 {
    861 	struct nilfs_node	*dir_node = VTOI(dvp);
    862 	struct nilfs_dir_entry *ndirent;
    863 	struct dirhash		*dirh;
    864 	struct dirhash_entry	*dirh_ep;
    865 	struct buf *bp;
    866 	uint64_t diroffset, blkoff;
    867 	uint64_t blocknr;
    868 	uint32_t blocksize = dir_node->nilfsdev->blocksize;
    869 	uint8_t *pos;
    870 	int hit, error;
    871 
    872 	/* set default return */
    873 	*found = 0;
    874 
    875 	/* get our dirhash and make sure its read in */
    876 	dirhash_get(&dir_node->dir_hash);
    877 	error = dirhash_fill(dir_node);
    878 	if (error) {
    879 		dirhash_put(dir_node->dir_hash);
    880 		return error;
    881 	}
    882 	dirh = dir_node->dir_hash;
    883 
    884 	/* allocate temporary space for fid */
    885 
    886 	DPRINTF(DIRHASH, ("dirhash_lookup looking for `%*.*s`\n",
    887 		namelen, namelen, name));
    888 
    889 	/* search our dirhash hits */
    890 	*ino = 0;
    891 	dirh_ep = NULL;
    892 	for (;;) {
    893 		hit = dirhash_lookup(dirh, name, namelen, &dirh_ep);
    894 		/* if no hit, abort the search */
    895 		if (!hit)
    896 			break;
    897 
    898 		/* check this hit */
    899 		diroffset = dirh_ep->offset;
    900 
    901 		blocknr = diroffset / blocksize;
    902 		blkoff  = diroffset % blocksize;
    903 		error = nilfs_bread(dir_node, blocknr, NOCRED, 0, &bp);
    904 		if (error)
    905 			return EIO;
    906 
    907 		/* read in one dirent */
    908 		pos = (uint8_t *) bp->b_data + blkoff;
    909 		ndirent = (struct nilfs_dir_entry *) pos;
    910 
    911 		DPRINTF(DIRHASH, ("dirhash_lookup\tchecking `%*.*s`\n",
    912 			ndirent->name_len, ndirent->name_len, ndirent->name));
    913 
    914 		/* see if its our entry */
    915 		KASSERT(ndirent->name_len == namelen);
    916 		if (strncmp(ndirent->name, name, namelen) == 0) {
    917 			*found = 1;
    918 			*ino = nilfs_rw64(ndirent->inode);
    919 			brelse(bp, BC_AGE);
    920 			break;
    921 		}
    922 		brelse(bp, BC_AGE);
    923 	}
    924 
    925 	dirhash_put(dir_node->dir_hash);
    926 
    927 	return error;
    928 }
    929 
    930 
/*
 * Remove the entry for `node' from directory `dir_node'.  Not
 * supported: always fails with EROFS without looking at its arguments.
 */
int
nilfs_dir_detach(struct nilfs_mount *ump, struct nilfs_node *dir_node,
	struct nilfs_node *node, struct componentname *cnp)
{
	return EROFS;
}
    936 
    937 
/*
 * Add an entry for `node' to directory `dir_node'.  Not supported:
 * always fails with EROFS without looking at its arguments.
 */
int
nilfs_dir_attach(struct nilfs_mount *ump, struct nilfs_node *dir_node,
	struct nilfs_node *node, struct vattr *vap,
	struct componentname *cnp)
{
	return EROFS;
}
    943 
    944 
/*
 * Create a new node in directory `dvp'.  Not supported: always fails
 * with EROFS; *vpp is not written.
 *
 * XXX return vnode?
 */
int
nilfs_create_node(struct vnode *dvp, struct vnode **vpp, struct vattr *vap,
	struct componentname *cnp)
{
	return EROFS;
}
    951 
    952 
/*
 * Delete a node.  Intentionally empty: the argument is neither read nor
 * modified.
 */
void
nilfs_delete_node(struct nilfs_node *node)
{
	/* nothing to do */
}
    957 
    958 
    959