Home | History | Annotate | Line # | Download | only in udf
udf_strat_sequential.c revision 1.10.4.1
      1  1.10.4.1    rmind /* $NetBSD: udf_strat_sequential.c,v 1.10.4.1 2011/03/05 20:55:10 rmind Exp $ */
      2       1.1  reinoud 
      3       1.1  reinoud /*
      4       1.1  reinoud  * Copyright (c) 2006, 2008 Reinoud Zandijk
      5       1.1  reinoud  * All rights reserved.
      6       1.1  reinoud  *
      7       1.1  reinoud  * Redistribution and use in source and binary forms, with or without
      8       1.1  reinoud  * modification, are permitted provided that the following conditions
      9       1.1  reinoud  * are met:
     10       1.1  reinoud  * 1. Redistributions of source code must retain the above copyright
     11       1.1  reinoud  *    notice, this list of conditions and the following disclaimer.
     12       1.1  reinoud  * 2. Redistributions in binary form must reproduce the above copyright
     13       1.1  reinoud  *    notice, this list of conditions and the following disclaimer in the
     14       1.1  reinoud  *    documentation and/or other materials provided with the distribution.
     15       1.1  reinoud  *
     16       1.1  reinoud  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     17       1.1  reinoud  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     18       1.1  reinoud  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     19       1.1  reinoud  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     20       1.1  reinoud  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     21       1.1  reinoud  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     22       1.1  reinoud  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     23       1.1  reinoud  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     24       1.1  reinoud  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     25       1.1  reinoud  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     26       1.1  reinoud  *
     27       1.1  reinoud  */
     28       1.1  reinoud 
     29       1.1  reinoud #include <sys/cdefs.h>
     30       1.1  reinoud #ifndef lint
     31  1.10.4.1    rmind __KERNEL_RCSID(0, "$NetBSD: udf_strat_sequential.c,v 1.10.4.1 2011/03/05 20:55:10 rmind Exp $");
     32       1.1  reinoud #endif /* not lint */
     33       1.1  reinoud 
     34       1.1  reinoud 
     35       1.1  reinoud #if defined(_KERNEL_OPT)
     36       1.1  reinoud #include "opt_compat_netbsd.h"
     37       1.1  reinoud #endif
     38       1.1  reinoud 
     39       1.1  reinoud #include <sys/param.h>
     40       1.1  reinoud #include <sys/systm.h>
     41       1.1  reinoud #include <sys/sysctl.h>
     42       1.1  reinoud #include <sys/namei.h>
     43       1.1  reinoud #include <sys/proc.h>
     44       1.1  reinoud #include <sys/kernel.h>
     45       1.1  reinoud #include <sys/vnode.h>
     46       1.1  reinoud #include <miscfs/genfs/genfs_node.h>
     47       1.1  reinoud #include <sys/mount.h>
     48       1.1  reinoud #include <sys/buf.h>
     49       1.1  reinoud #include <sys/file.h>
     50       1.1  reinoud #include <sys/device.h>
     51       1.1  reinoud #include <sys/disklabel.h>
     52       1.1  reinoud #include <sys/ioctl.h>
     53       1.1  reinoud #include <sys/malloc.h>
     54       1.1  reinoud #include <sys/dirent.h>
     55       1.1  reinoud #include <sys/stat.h>
     56       1.1  reinoud #include <sys/conf.h>
     57       1.1  reinoud #include <sys/kauth.h>
     58       1.1  reinoud #include <sys/kthread.h>
     59       1.1  reinoud #include <dev/clock_subr.h>
     60       1.1  reinoud 
     61       1.1  reinoud #include <fs/udf/ecma167-udf.h>
     62       1.1  reinoud #include <fs/udf/udf_mount.h>
     63       1.1  reinoud 
     64       1.1  reinoud #include "udf.h"
     65       1.1  reinoud #include "udf_subr.h"
     66       1.1  reinoud #include "udf_bswap.h"
     67       1.1  reinoud 
     68       1.1  reinoud 
     69       1.1  reinoud #define VTOI(vnode) ((struct udf_node *) vnode->v_data)
     70       1.1  reinoud #define PRIV(ump) ((struct strat_private *) ump->strategy_private)
     71       1.1  reinoud 
     72       1.1  reinoud /* --------------------------------------------------------------------- */
     73       1.1  reinoud 
     74       1.1  reinoud /* BUFQ's */
     75       1.1  reinoud #define UDF_SHED_MAX 3
     76       1.1  reinoud 
     77       1.1  reinoud #define UDF_SHED_READING	0
     78       1.1  reinoud #define UDF_SHED_WRITING	1
     79       1.1  reinoud #define UDF_SHED_SEQWRITING	2
     80       1.1  reinoud 
     81       1.1  reinoud struct strat_private {
     82       1.1  reinoud 	struct pool		 desc_pool;	 	/* node descriptors */
     83       1.1  reinoud 
     84       1.1  reinoud 	lwp_t			*queue_lwp;
     85       1.1  reinoud 	kcondvar_t		 discstrat_cv;		/* to wait on       */
     86       1.1  reinoud 	kmutex_t		 discstrat_mutex;	/* disc strategy    */
     87       1.1  reinoud 
     88       1.1  reinoud 	int			 run_thread;		/* thread control */
     89       1.1  reinoud 	int			 cur_queue;
     90       1.1  reinoud 
     91       1.1  reinoud 	struct disk_strategy	 old_strategy_setting;
     92       1.1  reinoud 	struct bufq_state	*queues[UDF_SHED_MAX];
     93       1.1  reinoud 	struct timespec		 last_queued[UDF_SHED_MAX];
     94       1.1  reinoud };
     95       1.1  reinoud 
     96       1.1  reinoud 
     97       1.1  reinoud /* --------------------------------------------------------------------- */
     98       1.1  reinoud 
     99       1.1  reinoud static void
    100       1.1  reinoud udf_wr_nodedscr_callback(struct buf *buf)
    101       1.1  reinoud {
    102       1.1  reinoud 	struct udf_node *udf_node;
    103       1.1  reinoud 
    104       1.1  reinoud 	KASSERT(buf);
    105       1.1  reinoud 	KASSERT(buf->b_data);
    106       1.1  reinoud 
    107       1.1  reinoud 	/* called when write action is done */
    108       1.1  reinoud 	DPRINTF(WRITE, ("udf_wr_nodedscr_callback(): node written out\n"));
    109       1.1  reinoud 
    110       1.1  reinoud 	udf_node = VTOI(buf->b_vp);
    111       1.1  reinoud 	if (udf_node == NULL) {
    112       1.1  reinoud 		putiobuf(buf);
    113       1.1  reinoud 		printf("udf_wr_node_callback: NULL node?\n");
    114       1.1  reinoud 		return;
    115       1.1  reinoud 	}
    116       1.1  reinoud 
    117       1.1  reinoud 	/* XXX right flags to mark dirty again on error? */
    118       1.1  reinoud 	if (buf->b_error) {
    119       1.1  reinoud 		udf_node->i_flags |= IN_MODIFIED | IN_ACCESSED;
    120       1.1  reinoud 		/* XXX TODO reshedule on error */
    121       1.1  reinoud 	}
    122       1.1  reinoud 
    123       1.2  reinoud 	/* decrement outstanding_nodedscr */
    124       1.2  reinoud 	KASSERT(udf_node->outstanding_nodedscr >= 1);
    125       1.2  reinoud 	udf_node->outstanding_nodedscr--;
    126       1.2  reinoud 	if (udf_node->outstanding_nodedscr == 0) {
    127       1.2  reinoud 		/* first unlock the node */
    128      1.10  reinoud 		UDF_UNLOCK_NODE(udf_node, 0);
    129       1.2  reinoud 		wakeup(&udf_node->outstanding_nodedscr);
    130       1.2  reinoud 	}
    131       1.1  reinoud 
    132       1.1  reinoud 	/* unreference the vnode so it can be recycled */
    133       1.1  reinoud 	holdrele(udf_node->vnode);
    134       1.1  reinoud 
    135       1.1  reinoud 	putiobuf(buf);
    136       1.1  reinoud }
    137       1.1  reinoud 
    138       1.1  reinoud /* --------------------------------------------------------------------- */
    139       1.1  reinoud 
    140       1.1  reinoud static int
    141       1.1  reinoud udf_create_logvol_dscr_seq(struct udf_strat_args *args)
    142       1.1  reinoud {
    143       1.1  reinoud 	union dscrptr   **dscrptr = &args->dscr;
    144       1.1  reinoud 	struct udf_mount *ump = args->ump;
    145       1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    146       1.1  reinoud 	uint32_t lb_size;
    147       1.1  reinoud 
    148       1.1  reinoud 	lb_size = udf_rw32(ump->logical_vol->lb_size);
    149       1.1  reinoud 	*dscrptr = pool_get(&priv->desc_pool, PR_WAITOK);
    150       1.1  reinoud 	memset(*dscrptr, 0, lb_size);
    151       1.1  reinoud 
    152       1.1  reinoud 	return 0;
    153       1.1  reinoud }
    154       1.1  reinoud 
    155       1.1  reinoud 
    156       1.1  reinoud static void
    157       1.1  reinoud udf_free_logvol_dscr_seq(struct udf_strat_args *args)
    158       1.1  reinoud {
    159       1.1  reinoud 	union dscrptr    *dscr = args->dscr;
    160       1.1  reinoud 	struct udf_mount *ump  = args->ump;
    161       1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    162       1.1  reinoud 
    163       1.1  reinoud 	pool_put(&priv->desc_pool, dscr);
    164       1.1  reinoud }
    165       1.1  reinoud 
    166       1.1  reinoud 
    167       1.1  reinoud static int
    168       1.1  reinoud udf_read_logvol_dscr_seq(struct udf_strat_args *args)
    169       1.1  reinoud {
    170       1.1  reinoud 	union dscrptr   **dscrptr = &args->dscr;
    171       1.1  reinoud 	union dscrptr    *tmpdscr;
    172       1.1  reinoud 	struct udf_mount *ump = args->ump;
    173       1.1  reinoud 	struct long_ad   *icb = args->icb;
    174       1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    175       1.1  reinoud 	uint32_t lb_size;
    176       1.1  reinoud 	uint32_t sector, dummy;
    177       1.1  reinoud 	int error;
    178       1.1  reinoud 
    179       1.1  reinoud 	lb_size = udf_rw32(ump->logical_vol->lb_size);
    180       1.1  reinoud 
    181       1.1  reinoud 	error = udf_translate_vtop(ump, icb, &sector, &dummy);
    182       1.1  reinoud 	if (error)
    183       1.1  reinoud 		return error;
    184       1.1  reinoud 
    185       1.1  reinoud 	/* try to read in fe/efe */
    186       1.1  reinoud 	error = udf_read_phys_dscr(ump, sector, M_UDFTEMP, &tmpdscr);
    187       1.1  reinoud 	if (error)
    188       1.1  reinoud 		return error;
    189       1.1  reinoud 
    190       1.1  reinoud 	*dscrptr = pool_get(&priv->desc_pool, PR_WAITOK);
    191       1.1  reinoud 	memcpy(*dscrptr, tmpdscr, lb_size);
    192       1.1  reinoud 	free(tmpdscr, M_UDFTEMP);
    193       1.1  reinoud 
    194       1.1  reinoud 	return 0;
    195       1.1  reinoud }
    196       1.1  reinoud 
    197       1.1  reinoud 
    198       1.1  reinoud static int
    199       1.1  reinoud udf_write_logvol_dscr_seq(struct udf_strat_args *args)
    200       1.1  reinoud {
    201       1.1  reinoud 	union dscrptr    *dscr     = args->dscr;
    202       1.1  reinoud 	struct udf_mount *ump      = args->ump;
    203       1.1  reinoud 	struct udf_node  *udf_node = args->udf_node;
    204       1.1  reinoud 	struct long_ad   *icb      = args->icb;
    205       1.1  reinoud 	int               waitfor  = args->waitfor;
    206       1.1  reinoud 	uint32_t logsectornr, sectornr, dummy;
    207       1.1  reinoud 	int error, vpart;
    208       1.1  reinoud 
    209       1.1  reinoud 	/*
    210       1.1  reinoud 	 * we have to decide if we write it out sequential or at its fixed
    211       1.1  reinoud 	 * position by examining the partition its (to be) written on.
    212       1.1  reinoud 	 */
    213       1.1  reinoud 	vpart       = udf_rw16(udf_node->loc.loc.part_num);
    214       1.1  reinoud 	logsectornr = udf_rw32(icb->loc.lb_num);
    215       1.1  reinoud 	sectornr    = 0;
    216       1.1  reinoud 	if (ump->vtop_tp[vpart] != UDF_VTOP_TYPE_VIRT) {
    217       1.1  reinoud 		error = udf_translate_vtop(ump, icb, &sectornr, &dummy);
    218       1.1  reinoud 		if (error)
    219       1.2  reinoud 			goto out;
    220       1.1  reinoud 	}
    221       1.1  reinoud 
    222       1.2  reinoud 	/* add reference to the vnode to prevent recycling */
    223       1.2  reinoud 	vhold(udf_node->vnode);
    224       1.1  reinoud 
    225       1.1  reinoud 	if (waitfor) {
    226       1.1  reinoud 		DPRINTF(WRITE, ("udf_write_logvol_dscr: sync write\n"));
    227       1.1  reinoud 
    228       1.1  reinoud 		error = udf_write_phys_dscr_sync(ump, udf_node, UDF_C_NODE,
    229       1.1  reinoud 			dscr, sectornr, logsectornr);
    230       1.1  reinoud 	} else {
    231       1.1  reinoud 		DPRINTF(WRITE, ("udf_write_logvol_dscr: no wait, async write\n"));
    232       1.1  reinoud 
    233       1.1  reinoud 		error = udf_write_phys_dscr_async(ump, udf_node, UDF_C_NODE,
    234       1.1  reinoud 			dscr, sectornr, logsectornr, udf_wr_nodedscr_callback);
    235       1.1  reinoud 		/* will be UNLOCKED in call back */
    236       1.2  reinoud 		return error;
    237       1.2  reinoud 	}
    238       1.2  reinoud 
    239       1.2  reinoud 	holdrele(udf_node->vnode);
    240       1.2  reinoud out:
    241       1.2  reinoud 	udf_node->outstanding_nodedscr--;
    242       1.2  reinoud 	if (udf_node->outstanding_nodedscr == 0) {
    243       1.2  reinoud 		UDF_UNLOCK_NODE(udf_node, 0);
    244       1.2  reinoud 		wakeup(&udf_node->outstanding_nodedscr);
    245       1.1  reinoud 	}
    246       1.1  reinoud 
    247       1.1  reinoud 	return error;
    248       1.1  reinoud }
    249       1.1  reinoud 
    250       1.1  reinoud /* --------------------------------------------------------------------- */
    251       1.1  reinoud 
    252       1.1  reinoud /*
    253       1.1  reinoud  * Main file-system specific sheduler. Due to the nature of optical media
    254       1.1  reinoud  * sheduling can't be performed in the traditional way. Most OS
    255       1.1  reinoud  * implementations i've seen thus read or write a file atomically giving all
    256       1.1  reinoud  * kinds of side effects.
    257       1.1  reinoud  *
    258       1.1  reinoud  * This implementation uses a kernel thread to shedule the queued requests in
    259       1.1  reinoud  * such a way that is semi-optimal for optical media; this means aproximately
    260       1.1  reinoud  * (R*|(Wr*|Ws*))* since switching between reading and writing is expensive in
    261       1.1  reinoud  * time.
    262       1.1  reinoud  */
    263       1.1  reinoud 
    264       1.1  reinoud static void
    265       1.1  reinoud udf_queuebuf_seq(struct udf_strat_args *args)
    266       1.1  reinoud {
    267       1.1  reinoud 	struct udf_mount *ump = args->ump;
    268       1.1  reinoud 	struct buf *nestbuf = args->nestbuf;
    269       1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    270       1.1  reinoud 	int queue;
    271       1.1  reinoud 	int what;
    272       1.1  reinoud 
    273       1.1  reinoud 	KASSERT(ump);
    274       1.1  reinoud 	KASSERT(nestbuf);
    275       1.1  reinoud 	KASSERT(nestbuf->b_iodone == nestiobuf_iodone);
    276       1.1  reinoud 
    277       1.1  reinoud 	what = nestbuf->b_udf_c_type;
    278       1.1  reinoud 	queue = UDF_SHED_READING;
    279       1.1  reinoud 	if ((nestbuf->b_flags & B_READ) == 0) {
    280       1.1  reinoud 		/* writing */
    281       1.1  reinoud 		queue = UDF_SHED_SEQWRITING;
    282       1.8  reinoud 		if (what == UDF_C_ABSOLUTE)
    283       1.1  reinoud 			queue = UDF_SHED_WRITING;
    284       1.1  reinoud 	}
    285       1.1  reinoud 
    286       1.1  reinoud 	/* use our own sheduler lists for more complex sheduling */
    287       1.1  reinoud 	mutex_enter(&priv->discstrat_mutex);
    288       1.7     yamt 		bufq_put(priv->queues[queue], nestbuf);
    289       1.1  reinoud 		vfs_timestamp(&priv->last_queued[queue]);
    290       1.1  reinoud 	mutex_exit(&priv->discstrat_mutex);
    291       1.1  reinoud 
    292       1.1  reinoud 	/* signal our thread that there might be something to do */
    293       1.1  reinoud 	cv_signal(&priv->discstrat_cv);
    294       1.1  reinoud }
    295       1.1  reinoud 
    296       1.1  reinoud /* --------------------------------------------------------------------- */
    297       1.1  reinoud 
    298       1.1  reinoud /* TODO convert to lb_size */
    299       1.1  reinoud static void
    300       1.3  reinoud udf_VAT_mapping_update(struct udf_mount *ump, struct buf *buf, uint32_t lb_map)
    301       1.1  reinoud {
    302       1.1  reinoud 	union dscrptr    *fdscr = (union dscrptr *) buf->b_data;
    303       1.1  reinoud 	struct vnode     *vp = buf->b_vp;
    304       1.1  reinoud 	struct udf_node  *udf_node = VTOI(vp);
    305       1.1  reinoud 	uint32_t lb_size, blks;
    306       1.3  reinoud 	uint32_t lb_num;
    307       1.1  reinoud 	uint32_t udf_rw32_lbmap;
    308       1.1  reinoud 	int c_type = buf->b_udf_c_type;
    309       1.1  reinoud 	int error;
    310       1.1  reinoud 
    311       1.1  reinoud 	/* only interested when we're using a VAT */
    312       1.1  reinoud 	KASSERT(ump->vat_node);
    313       1.4  reinoud 	KASSERT(ump->vtop_alloc[ump->node_part] == UDF_ALLOC_VAT);
    314       1.1  reinoud 
    315       1.1  reinoud 	/* only nodes are recorded in the VAT */
    316       1.1  reinoud 	/* NOTE: and the fileset descriptor (FIXME ?) */
    317       1.1  reinoud 	if (c_type != UDF_C_NODE)
    318       1.1  reinoud 		return;
    319       1.1  reinoud 
    320       1.1  reinoud 	/* we now have an UDF FE/EFE node on media with VAT (or VAT itself) */
    321       1.1  reinoud 	lb_size = udf_rw32(ump->logical_vol->lb_size);
    322       1.1  reinoud 	blks = lb_size / DEV_BSIZE;
    323       1.1  reinoud 
    324       1.1  reinoud 	udf_rw32_lbmap = udf_rw32(lb_map);
    325       1.1  reinoud 
    326       1.1  reinoud 	/* if we're the VAT itself, only update our assigned sector number */
    327       1.1  reinoud 	if (udf_node == ump->vat_node) {
    328       1.1  reinoud 		fdscr->tag.tag_loc = udf_rw32_lbmap;
    329       1.1  reinoud 		udf_validate_tag_sum(fdscr);
    330       1.1  reinoud 		DPRINTF(TRANSLATE, ("VAT assigned to sector %u\n",
    331       1.1  reinoud 			udf_rw32(udf_rw32_lbmap)));
    332       1.1  reinoud 		/* no use mapping the VAT node in the VAT */
    333       1.1  reinoud 		return;
    334       1.1  reinoud 	}
    335       1.1  reinoud 
    336       1.2  reinoud 	/* record new position in VAT file */
    337       1.2  reinoud 	lb_num = udf_rw32(fdscr->tag.tag_loc);
    338       1.1  reinoud 
    339       1.2  reinoud 	/* lb_num = udf_rw32(udf_node->write_loc.loc.lb_num); */
    340       1.1  reinoud 
    341       1.1  reinoud 	DPRINTF(TRANSLATE, ("VAT entry change (log %u -> phys %u)\n",
    342       1.1  reinoud 			lb_num, lb_map));
    343       1.1  reinoud 
    344       1.1  reinoud 	/* VAT should be the longer than this write, can't go wrong */
    345       1.1  reinoud 	KASSERT(lb_num <= ump->vat_entries);
    346       1.1  reinoud 
    347       1.1  reinoud 	mutex_enter(&ump->allocate_mutex);
    348       1.1  reinoud 	error = udf_vat_write(ump->vat_node,
    349       1.1  reinoud 			(uint8_t *) &udf_rw32_lbmap, 4,
    350       1.1  reinoud 			ump->vat_offset + lb_num * 4);
    351       1.1  reinoud 	mutex_exit(&ump->allocate_mutex);
    352       1.1  reinoud 
    353       1.1  reinoud 	if (error)
    354       1.1  reinoud 		panic( "udf_VAT_mapping_update: HELP! i couldn't "
    355       1.1  reinoud 			"write in the VAT file ?\n");
    356       1.1  reinoud }
    357       1.1  reinoud 
    358       1.1  reinoud 
    359       1.1  reinoud static void
    360       1.1  reinoud udf_issue_buf(struct udf_mount *ump, int queue, struct buf *buf)
    361       1.1  reinoud {
    362       1.8  reinoud 	union dscrptr *dscr;
    363       1.1  reinoud 	struct long_ad *node_ad_cpy;
    364       1.3  reinoud 	struct part_desc *pdesc;
    365       1.3  reinoud 	uint64_t *lmapping, *lmappos, blknr;
    366       1.1  reinoud 	uint32_t our_sectornr, sectornr, bpos;
    367       1.3  reinoud 	uint32_t ptov;
    368       1.3  reinoud 	uint16_t vpart_num;
    369       1.1  reinoud 	uint8_t *fidblk;
    370       1.1  reinoud 	int sector_size = ump->discinfo.sector_size;
    371       1.1  reinoud 	int blks = sector_size / DEV_BSIZE;
    372       1.1  reinoud 	int len, buf_len;
    373       1.1  reinoud 
    374       1.1  reinoud 	/* if reading, just pass to the device's STRATEGY */
    375       1.1  reinoud 	if (queue == UDF_SHED_READING) {
    376       1.1  reinoud 		DPRINTF(SHEDULE, ("\nudf_issue_buf READ %p : sector %d type %d,"
    377       1.1  reinoud 			"b_resid %d, b_bcount %d, b_bufsize %d\n",
    378       1.1  reinoud 			buf, (uint32_t) buf->b_blkno / blks, buf->b_udf_c_type,
    379       1.1  reinoud 			buf->b_resid, buf->b_bcount, buf->b_bufsize));
    380       1.1  reinoud 		VOP_STRATEGY(ump->devvp, buf);
    381       1.1  reinoud 		return;
    382       1.1  reinoud 	}
    383       1.1  reinoud 
    384       1.1  reinoud 	blknr        = buf->b_blkno;
    385       1.1  reinoud 	our_sectornr = blknr / blks;
    386       1.1  reinoud 
    387       1.1  reinoud 	if (queue == UDF_SHED_WRITING) {
    388       1.1  reinoud 		DPRINTF(SHEDULE, ("\nudf_issue_buf WRITE %p : sector %d "
    389       1.1  reinoud 			"type %d, b_resid %d, b_bcount %d, b_bufsize %d\n",
    390       1.1  reinoud 			buf, (uint32_t) buf->b_blkno / blks, buf->b_udf_c_type,
    391       1.1  reinoud 			buf->b_resid, buf->b_bcount, buf->b_bufsize));
    392       1.8  reinoud 		KASSERT(buf->b_udf_c_type == UDF_C_ABSOLUTE);
    393       1.8  reinoud 
    394       1.8  reinoud 		// udf_fixup_node_internals(ump, buf->b_data, buf->b_udf_c_type);
    395       1.1  reinoud 		VOP_STRATEGY(ump->devvp, buf);
    396       1.1  reinoud 		return;
    397       1.1  reinoud 	}
    398       1.1  reinoud 
    399       1.1  reinoud 	KASSERT(queue == UDF_SHED_SEQWRITING);
    400       1.1  reinoud 	DPRINTF(SHEDULE, ("\nudf_issue_buf SEQWRITE %p : sector XXXX "
    401       1.1  reinoud 		"type %d, b_resid %d, b_bcount %d, b_bufsize %d\n",
    402       1.1  reinoud 		buf, buf->b_udf_c_type, buf->b_resid, buf->b_bcount,
    403       1.1  reinoud 		buf->b_bufsize));
    404       1.1  reinoud 
    405       1.1  reinoud 	/*
    406       1.1  reinoud 	 * Buffers should not have been allocated to disc addresses yet on
    407       1.1  reinoud 	 * this queue. Note that a buffer can get multiple extents allocated.
    408       1.1  reinoud 	 *
    409       1.1  reinoud 	 * lmapping contains lb_num relative to base partition.
    410       1.1  reinoud 	 */
    411       1.1  reinoud 	lmapping    = ump->la_lmapping;
    412       1.1  reinoud 	node_ad_cpy = ump->la_node_ad_cpy;
    413       1.1  reinoud 
    414       1.3  reinoud 	/* logically allocate buf and map it in the file */
    415       1.3  reinoud 	udf_late_allocate_buf(ump, buf, lmapping, node_ad_cpy, &vpart_num);
    416       1.3  reinoud 
    417       1.3  reinoud 	/*
    418       1.3  reinoud 	 * NOTE We are using the knowledge here that sequential media will
    419       1.3  reinoud 	 * always be mapped linearly. Thus no use to explicitly translate the
    420       1.3  reinoud 	 * lmapping list.
    421       1.3  reinoud 	 */
    422       1.3  reinoud 
    423       1.3  reinoud 	/* calculate offset from physical base partition */
    424       1.3  reinoud 	pdesc = ump->partitions[ump->vtop[vpart_num]];
    425       1.3  reinoud 	ptov  = udf_rw32(pdesc->start_loc);
    426       1.3  reinoud 
    427       1.3  reinoud 	/* set buffers blkno to the physical block number */
    428       1.3  reinoud 	buf->b_blkno = (*lmapping + ptov) * blks;
    429       1.1  reinoud 
    430       1.8  reinoud 	/* fixate floating descriptors */
    431       1.8  reinoud 	if (buf->b_udf_c_type == UDF_C_FLOAT_DSCR) {
    432       1.8  reinoud 		/* set our tag location to the absolute position */
    433       1.8  reinoud 		dscr = (union dscrptr *) buf->b_data;
    434       1.8  reinoud 		dscr->tag.tag_loc = udf_rw32(*lmapping + ptov);
    435       1.8  reinoud 		udf_validate_tag_and_crc_sums(dscr);
    436       1.8  reinoud 	}
    437       1.8  reinoud 
    438       1.8  reinoud 	/* update mapping in the VAT */
    439       1.8  reinoud 	if (buf->b_udf_c_type == UDF_C_NODE) {
    440       1.8  reinoud 		udf_VAT_mapping_update(ump, buf, *lmapping);
    441       1.8  reinoud 		udf_fixup_node_internals(ump, buf->b_data, buf->b_udf_c_type);
    442       1.8  reinoud 	}
    443       1.8  reinoud 
    444       1.1  reinoud 	/* if we have FIDs, fixup using the new allocation table */
    445       1.1  reinoud 	if (buf->b_udf_c_type == UDF_C_FIDS) {
    446       1.1  reinoud 		buf_len = buf->b_bcount;
    447       1.1  reinoud 		bpos = 0;
    448       1.1  reinoud 		lmappos = lmapping;
    449       1.1  reinoud 		while (buf_len) {
    450       1.1  reinoud 			sectornr = *lmappos++;
    451       1.1  reinoud 			len = MIN(buf_len, sector_size);
    452       1.1  reinoud 			fidblk = (uint8_t *) buf->b_data + bpos;
    453       1.1  reinoud 			udf_fixup_fid_block(fidblk, sector_size,
    454       1.1  reinoud 				0, len, sectornr);
    455       1.1  reinoud 			bpos += len;
    456       1.1  reinoud 			buf_len -= len;
    457       1.1  reinoud 		}
    458       1.1  reinoud 	}
    459       1.4  reinoud 
    460       1.1  reinoud 	VOP_STRATEGY(ump->devvp, buf);
    461       1.1  reinoud }
    462       1.1  reinoud 
    463       1.1  reinoud 
    464       1.1  reinoud static void
    465       1.1  reinoud udf_doshedule(struct udf_mount *ump)
    466       1.1  reinoud {
    467       1.1  reinoud 	struct buf *buf;
    468       1.1  reinoud 	struct timespec now, *last;
    469       1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    470       1.1  reinoud 	void (*b_callback)(struct buf *);
    471       1.1  reinoud 	int new_queue;
    472       1.1  reinoud 	int error;
    473       1.1  reinoud 
    474       1.7     yamt 	buf = bufq_get(priv->queues[priv->cur_queue]);
    475       1.1  reinoud 	if (buf) {
    476       1.1  reinoud 		/* transfer from the current queue to the device queue */
    477       1.1  reinoud 		mutex_exit(&priv->discstrat_mutex);
    478       1.1  reinoud 
    479       1.1  reinoud 		/* transform buffer to synchronous; XXX needed? */
    480       1.1  reinoud 		b_callback = buf->b_iodone;
    481       1.1  reinoud 		buf->b_iodone = NULL;
    482       1.1  reinoud 		CLR(buf->b_flags, B_ASYNC);
    483       1.1  reinoud 
    484       1.1  reinoud 		/* issue and wait on completion */
    485       1.1  reinoud 		udf_issue_buf(ump, priv->cur_queue, buf);
    486       1.1  reinoud 		biowait(buf);
    487       1.1  reinoud 
    488       1.1  reinoud 		mutex_enter(&priv->discstrat_mutex);
    489       1.1  reinoud 
    490       1.1  reinoud 		/* if there is an error, repair this error, otherwise propagate */
    491       1.1  reinoud 		if (buf->b_error && ((buf->b_flags & B_READ) == 0)) {
    492       1.1  reinoud 			/* check what we need to do */
    493       1.1  reinoud 			panic("UDF write error, can't handle yet!\n");
    494       1.1  reinoud 		}
    495       1.1  reinoud 
    496       1.1  reinoud 		/* propagate result to higher layers */
    497       1.1  reinoud 		if (b_callback) {
    498       1.1  reinoud 			buf->b_iodone = b_callback;
    499       1.1  reinoud 			(*buf->b_iodone)(buf);
    500       1.1  reinoud 		}
    501       1.1  reinoud 
    502       1.1  reinoud 		return;
    503       1.1  reinoud 	}
    504       1.1  reinoud 
    505       1.1  reinoud 	/* Check if we're idling in this state */
    506       1.1  reinoud 	vfs_timestamp(&now);
    507       1.1  reinoud 	last = &priv->last_queued[priv->cur_queue];
    508       1.1  reinoud 	if (ump->discinfo.mmc_class == MMC_CLASS_CD) {
    509       1.1  reinoud 		/* dont switch too fast for CD media; its expensive in time */
    510       1.1  reinoud 		if (now.tv_sec - last->tv_sec < 3)
    511       1.1  reinoud 			return;
    512       1.1  reinoud 	}
    513       1.1  reinoud 
    514       1.1  reinoud 	/* check if we can/should switch */
    515       1.1  reinoud 	new_queue = priv->cur_queue;
    516       1.1  reinoud 
    517       1.7     yamt 	if (bufq_peek(priv->queues[UDF_SHED_READING]))
    518       1.1  reinoud 		new_queue = UDF_SHED_READING;
    519       1.9  reinoud 	if (bufq_peek(priv->queues[UDF_SHED_WRITING]))		/* only for unmount */
    520       1.9  reinoud 		new_queue = UDF_SHED_WRITING;
    521       1.7     yamt 	if (bufq_peek(priv->queues[UDF_SHED_SEQWRITING]))
    522       1.1  reinoud 		new_queue = UDF_SHED_SEQWRITING;
    523       1.1  reinoud 	if (priv->cur_queue == UDF_SHED_READING) {
    524       1.1  reinoud 		if (new_queue == UDF_SHED_SEQWRITING) {
    525       1.1  reinoud 			/* TODO use flag to signal if this is needed */
    526       1.1  reinoud 			mutex_exit(&priv->discstrat_mutex);
    527       1.1  reinoud 
    528       1.1  reinoud 			/* update trackinfo for data and metadata */
    529       1.1  reinoud 			error = udf_update_trackinfo(ump,
    530       1.1  reinoud 					&ump->data_track);
    531       1.1  reinoud 			assert(error == 0);
    532       1.1  reinoud 			error = udf_update_trackinfo(ump,
    533       1.1  reinoud 					&ump->metadata_track);
    534       1.1  reinoud 			assert(error == 0);
    535       1.1  reinoud 			mutex_enter(&priv->discstrat_mutex);
    536       1.1  reinoud 		}
    537       1.1  reinoud 	}
    538       1.1  reinoud 
    539       1.1  reinoud 	if (new_queue != priv->cur_queue) {
    540       1.1  reinoud 		DPRINTF(SHEDULE, ("switching from %d to %d\n",
    541       1.1  reinoud 			priv->cur_queue, new_queue));
    542       1.1  reinoud 	}
    543       1.1  reinoud 
    544       1.1  reinoud 	priv->cur_queue = new_queue;
    545       1.1  reinoud }
    546       1.1  reinoud 
    547       1.1  reinoud 
    548       1.1  reinoud static void
    549       1.1  reinoud udf_discstrat_thread(void *arg)
    550       1.1  reinoud {
    551       1.1  reinoud 	struct udf_mount *ump = (struct udf_mount *) arg;
    552       1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    553       1.1  reinoud 	int empty;
    554       1.1  reinoud 
    555       1.1  reinoud 	empty = 1;
    556       1.1  reinoud 	mutex_enter(&priv->discstrat_mutex);
    557       1.1  reinoud 	while (priv->run_thread || !empty) {
    558       1.1  reinoud 		/* process the current selected queue */
    559       1.1  reinoud 		udf_doshedule(ump);
    560       1.7     yamt 		empty  = (bufq_peek(priv->queues[UDF_SHED_READING]) == NULL);
    561       1.7     yamt 		empty &= (bufq_peek(priv->queues[UDF_SHED_WRITING]) == NULL);
    562       1.7     yamt 		empty &= (bufq_peek(priv->queues[UDF_SHED_SEQWRITING]) == NULL);
    563       1.1  reinoud 
    564       1.1  reinoud 		/* wait for more if needed */
    565       1.1  reinoud 		if (empty)
    566       1.1  reinoud 			cv_timedwait(&priv->discstrat_cv,
    567       1.1  reinoud 				&priv->discstrat_mutex, hz/8);
    568       1.1  reinoud 	}
    569       1.1  reinoud 	mutex_exit(&priv->discstrat_mutex);
    570       1.1  reinoud 
    571       1.1  reinoud 	wakeup(&priv->run_thread);
    572       1.1  reinoud 	kthread_exit(0);
    573       1.1  reinoud 	/* not reached */
    574       1.1  reinoud }
    575       1.1  reinoud 
    576       1.1  reinoud /* --------------------------------------------------------------------- */
    577       1.1  reinoud 
    578       1.1  reinoud static void
    579       1.1  reinoud udf_discstrat_init_seq(struct udf_strat_args *args)
    580       1.1  reinoud {
    581       1.1  reinoud 	struct udf_mount *ump = args->ump;
    582       1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    583       1.1  reinoud 	struct disk_strategy dkstrat;
    584       1.1  reinoud 	uint32_t lb_size;
    585       1.1  reinoud 
    586       1.1  reinoud 	KASSERT(ump);
    587       1.1  reinoud 	KASSERT(ump->logical_vol);
    588       1.1  reinoud 	KASSERT(priv == NULL);
    589       1.1  reinoud 
    590       1.1  reinoud 	lb_size = udf_rw32(ump->logical_vol->lb_size);
    591       1.1  reinoud 	KASSERT(lb_size > 0);
    592       1.1  reinoud 
    593       1.1  reinoud 	/* initialise our memory space */
    594       1.1  reinoud 	ump->strategy_private = malloc(sizeof(struct strat_private),
    595       1.1  reinoud 		M_UDFTEMP, M_WAITOK);
    596       1.1  reinoud 	priv = ump->strategy_private;
    597       1.1  reinoud 	memset(priv, 0 , sizeof(struct strat_private));
    598       1.1  reinoud 
    599       1.1  reinoud 	/* initialise locks */
    600       1.1  reinoud 	cv_init(&priv->discstrat_cv, "udfstrat");
    601       1.1  reinoud 	mutex_init(&priv->discstrat_mutex, MUTEX_DEFAULT, IPL_NONE);
    602       1.1  reinoud 
    603       1.1  reinoud 	/*
    604       1.1  reinoud 	 * Initialise pool for descriptors associated with nodes. This is done
    605       1.1  reinoud 	 * in lb_size units though currently lb_size is dictated to be
    606       1.1  reinoud 	 * sector_size.
    607       1.1  reinoud 	 */
    608       1.1  reinoud 	pool_init(&priv->desc_pool, lb_size, 0, 0, 0, "udf_desc_pool", NULL,
    609       1.1  reinoud 	    IPL_NONE);
    610       1.1  reinoud 
    611       1.1  reinoud 	/*
    612       1.1  reinoud 	 * remember old device strategy method and explicit set method
    613       1.1  reinoud 	 * `discsort' since we have our own more complex strategy that is not
    614       1.1  reinoud 	 * implementable on the CD device and other strategies will get in the
    615       1.1  reinoud 	 * way.
    616       1.1  reinoud 	 */
    617       1.1  reinoud 	memset(&priv->old_strategy_setting, 0,
    618       1.1  reinoud 		sizeof(struct disk_strategy));
    619       1.1  reinoud 	VOP_IOCTL(ump->devvp, DIOCGSTRATEGY, &priv->old_strategy_setting,
    620       1.1  reinoud 		FREAD | FKIOCTL, NOCRED);
    621       1.1  reinoud 	memset(&dkstrat, 0, sizeof(struct disk_strategy));
    622       1.1  reinoud 	strcpy(dkstrat.dks_name, "discsort");
    623       1.1  reinoud 	VOP_IOCTL(ump->devvp, DIOCSSTRATEGY, &dkstrat, FWRITE | FKIOCTL,
    624       1.1  reinoud 		NOCRED);
    625       1.1  reinoud 
    626       1.1  reinoud 	/* initialise our internal sheduler */
    627       1.1  reinoud 	priv->cur_queue = UDF_SHED_READING;
    628       1.1  reinoud 	bufq_alloc(&priv->queues[UDF_SHED_READING], "disksort",
    629       1.1  reinoud 		BUFQ_SORT_RAWBLOCK);
    630       1.1  reinoud 	bufq_alloc(&priv->queues[UDF_SHED_WRITING], "disksort",
    631       1.1  reinoud 		BUFQ_SORT_RAWBLOCK);
    632       1.1  reinoud 	bufq_alloc(&priv->queues[UDF_SHED_SEQWRITING], "fcfs", 0);
    633       1.1  reinoud 	vfs_timestamp(&priv->last_queued[UDF_SHED_READING]);
    634       1.1  reinoud 	vfs_timestamp(&priv->last_queued[UDF_SHED_WRITING]);
    635       1.1  reinoud 	vfs_timestamp(&priv->last_queued[UDF_SHED_SEQWRITING]);
    636       1.1  reinoud 
    637       1.1  reinoud 	/* create our disk strategy thread */
    638       1.1  reinoud 	priv->run_thread = 1;
    639       1.1  reinoud 	if (kthread_create(PRI_NONE, 0 /* KTHREAD_MPSAFE*/, NULL /* cpu_info*/,
    640       1.1  reinoud 		udf_discstrat_thread, ump, &priv->queue_lwp,
    641       1.1  reinoud 		"%s", "udf_rw")) {
    642       1.1  reinoud 		panic("fork udf_rw");
    643       1.1  reinoud 	}
    644       1.1  reinoud }
    645       1.1  reinoud 
    646       1.1  reinoud 
    647       1.1  reinoud static void
    648       1.1  reinoud udf_discstrat_finish_seq(struct udf_strat_args *args)
    649       1.1  reinoud {
    650       1.1  reinoud 	struct udf_mount *ump = args->ump;
    651       1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    652       1.1  reinoud 	int error;
    653       1.1  reinoud 
    654       1.1  reinoud 	if (ump == NULL)
    655       1.1  reinoud 		return;
    656       1.1  reinoud 
    657       1.1  reinoud 	/* stop our sheduling thread */
    658       1.1  reinoud 	KASSERT(priv->run_thread == 1);
    659       1.1  reinoud 	priv->run_thread = 0;
    660       1.1  reinoud 	wakeup(priv->queue_lwp);
    661       1.1  reinoud 	do {
    662       1.1  reinoud 		error = tsleep(&priv->run_thread, PRIBIO+1,
    663       1.1  reinoud 			"udfshedfin", hz);
    664       1.1  reinoud 	} while (error);
    665       1.1  reinoud 	/* kthread should be finished now */
    666       1.1  reinoud 
    667       1.1  reinoud 	/* set back old device strategy method */
    668       1.1  reinoud 	VOP_IOCTL(ump->devvp, DIOCSSTRATEGY, &priv->old_strategy_setting,
    669       1.1  reinoud 			FWRITE, NOCRED);
    670       1.1  reinoud 
    671       1.1  reinoud 	/* destroy our pool */
    672       1.1  reinoud 	pool_destroy(&priv->desc_pool);
    673       1.1  reinoud 
    674  1.10.4.1    rmind 	mutex_destroy(&priv->discstrat_mutex);
    675  1.10.4.1    rmind 	cv_destroy(&priv->discstrat_cv);
    676  1.10.4.1    rmind 
    677       1.1  reinoud 	/* free our private space */
    678       1.1  reinoud 	free(ump->strategy_private, M_UDFTEMP);
    679       1.1  reinoud 	ump->strategy_private = NULL;
    680       1.1  reinoud }
    681       1.1  reinoud 
    682       1.1  reinoud /* --------------------------------------------------------------------- */
    683       1.1  reinoud 
    684       1.1  reinoud struct udf_strategy udf_strat_sequential =
    685       1.1  reinoud {
    686       1.1  reinoud 	udf_create_logvol_dscr_seq,
    687       1.1  reinoud 	udf_free_logvol_dscr_seq,
    688       1.1  reinoud 	udf_read_logvol_dscr_seq,
    689       1.1  reinoud 	udf_write_logvol_dscr_seq,
    690       1.1  reinoud 	udf_queuebuf_seq,
    691       1.1  reinoud 	udf_discstrat_init_seq,
    692       1.1  reinoud 	udf_discstrat_finish_seq
    693       1.1  reinoud };
    694       1.1  reinoud 
    695       1.1  reinoud 
    696