Home | History | Annotate | Line # | Download | only in udf
udf_strat_rmw.c revision 1.9.4.7
      1  1.9.4.7      snj /* $NetBSD: udf_strat_rmw.c,v 1.9.4.7 2009/02/18 00:51:27 snj Exp $ */
      2      1.1  reinoud 
      3      1.1  reinoud /*
      4      1.1  reinoud  * Copyright (c) 2006, 2008 Reinoud Zandijk
      5      1.1  reinoud  * All rights reserved.
      6      1.1  reinoud  *
      7      1.1  reinoud  * Redistribution and use in source and binary forms, with or without
      8      1.1  reinoud  * modification, are permitted provided that the following conditions
      9      1.1  reinoud  * are met:
     10      1.1  reinoud  * 1. Redistributions of source code must retain the above copyright
     11      1.1  reinoud  *    notice, this list of conditions and the following disclaimer.
     12      1.1  reinoud  * 2. Redistributions in binary form must reproduce the above copyright
     13      1.1  reinoud  *    notice, this list of conditions and the following disclaimer in the
     14      1.1  reinoud  *    documentation and/or other materials provided with the distribution.
     15      1.1  reinoud  *
     16      1.1  reinoud  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     17      1.1  reinoud  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     18      1.1  reinoud  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     19      1.1  reinoud  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     20      1.1  reinoud  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     21      1.1  reinoud  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     22      1.1  reinoud  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     23      1.1  reinoud  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     24      1.1  reinoud  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     25      1.1  reinoud  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     26      1.1  reinoud  *
     27      1.1  reinoud  */
     28      1.1  reinoud 
     29      1.1  reinoud #include <sys/cdefs.h>
     30      1.1  reinoud #ifndef lint
     31  1.9.4.7      snj __KERNEL_RCSID(0, "$NetBSD: udf_strat_rmw.c,v 1.9.4.7 2009/02/18 00:51:27 snj Exp $");
     32      1.1  reinoud #endif /* not lint */
     33      1.1  reinoud 
     34      1.1  reinoud 
     35      1.1  reinoud #if defined(_KERNEL_OPT)
     36      1.1  reinoud #include "opt_quota.h"
     37      1.1  reinoud #include "opt_compat_netbsd.h"
     38      1.1  reinoud #endif
     39      1.1  reinoud 
     40      1.1  reinoud #include <sys/param.h>
     41      1.1  reinoud #include <sys/systm.h>
     42      1.1  reinoud #include <sys/sysctl.h>
     43      1.1  reinoud #include <sys/namei.h>
     44      1.1  reinoud #include <sys/proc.h>
     45      1.1  reinoud #include <sys/kernel.h>
     46      1.1  reinoud #include <sys/vnode.h>
     47      1.1  reinoud #include <miscfs/genfs/genfs_node.h>
     48      1.1  reinoud #include <sys/mount.h>
     49      1.1  reinoud #include <sys/buf.h>
     50      1.1  reinoud #include <sys/file.h>
     51      1.1  reinoud #include <sys/device.h>
     52      1.1  reinoud #include <sys/disklabel.h>
     53      1.1  reinoud #include <sys/ioctl.h>
     54      1.1  reinoud #include <sys/malloc.h>
     55      1.1  reinoud #include <sys/dirent.h>
     56      1.1  reinoud #include <sys/stat.h>
     57      1.1  reinoud #include <sys/conf.h>
     58      1.1  reinoud #include <sys/kauth.h>
     59      1.1  reinoud #include <sys/kthread.h>
     60      1.1  reinoud #include <dev/clock_subr.h>
     61      1.1  reinoud 
     62      1.1  reinoud #include <fs/udf/ecma167-udf.h>
     63      1.1  reinoud #include <fs/udf/udf_mount.h>
     64      1.1  reinoud 
     65      1.1  reinoud #include "udf.h"
     66      1.1  reinoud #include "udf_subr.h"
     67      1.1  reinoud #include "udf_bswap.h"
     68      1.1  reinoud 
     69      1.1  reinoud 
/* Convert a vnode pointer into the UDF node stored in its v_data field. */
#define VTOI(vnode) ((struct udf_node *) (vnode)->v_data)
/* Fetch this strategy's private state from the mount's strategy_private. */
#define PRIV(ump) ((struct strat_private *) (ump)->strategy_private)
/* Recover the eccline that a buffer's b_private field points back to. */
#define BTOE(buf) ((struct udf_eccline *) ((buf)->b_private))
     73      1.1  reinoud 
     74      1.1  reinoud /* --------------------------------------------------------------------- */
     75      1.1  reinoud 
/*
 * Upper bound on the number of sectors in one packet.  The per-sector
 * bitmaps in struct udf_eccline are uint64_t, one bit per sector.
 */
#define UDF_MAX_PACKET_SIZE	64			/* DONT change this */

/*
 * Scheduler states.  Each value doubles as an index into the per-queue
 * arrays of struct strat_private; a queued_on value of 0 means the
 * eccline is not on any queue.
 */
#define UDF_SHED_WAITING	1			/* waiting on timeout */
#define UDF_SHED_READING	2
#define UDF_SHED_WRITING	3
#define UDF_SHED_SEQWRITING	4
#define UDF_SHED_IDLE		5			/* resting */
#define UDF_SHED_FREE		6			/* recycleable */
/* parenthesised so the macro is safe inside larger expressions */
#define UDF_SHED_MAX		(UDF_SHED_FREE + 1)

/* eccline flags */
#define ECC_LOCKED		0x01			/* prevent access   */
#define ECC_WANTED		0x02			/* trying access    */
#define ECC_SEQWRITING		0x04			/* sequential queue */
#define ECC_FLOATING		0x08			/* not queued yet   */

/* seconds added to an eccline's wait_time when it is put back */
#define ECC_WAITTIME		10

     94  1.9.4.2      snj 
     95      1.1  reinoud 
     96      1.1  reinoud TAILQ_HEAD(ecclineq, udf_eccline);
     97      1.1  reinoud struct udf_eccline {
     98      1.1  reinoud 	struct udf_mount	 *ump;
     99      1.1  reinoud 	uint64_t		  present;		/* preserve these */
    100      1.1  reinoud 	uint64_t		  readin;		/* bitmap */
    101      1.1  reinoud 	uint64_t		  dirty;		/* bitmap */
    102      1.1  reinoud 	uint64_t		  error;		/* bitmap */
    103      1.1  reinoud 	uint32_t		  refcnt;
    104      1.1  reinoud 
    105  1.9.4.2      snj 	struct timespec		  wait_time;
    106      1.1  reinoud 	uint32_t		  flags;
    107      1.1  reinoud 	uint32_t		  start_sector;		/* physical */
    108      1.1  reinoud 
    109      1.1  reinoud 	struct buf		 *buf;
    110      1.1  reinoud 	void			 *blob;
    111      1.1  reinoud 
    112      1.1  reinoud 	struct buf		 *bufs[UDF_MAX_PACKET_SIZE];
    113      1.1  reinoud 	uint32_t		  bufs_bpos[UDF_MAX_PACKET_SIZE];
    114      1.1  reinoud 	int			  bufs_len[UDF_MAX_PACKET_SIZE];
    115      1.1  reinoud 
    116      1.1  reinoud 	int			  queued_on;		/* on which BUFQ list */
    117      1.1  reinoud 	LIST_ENTRY(udf_eccline)   hashchain;		/* on sector lookup  */
    118      1.1  reinoud };
    119      1.1  reinoud 
    120      1.1  reinoud 
    121      1.1  reinoud struct strat_private {
    122      1.1  reinoud 	lwp_t			 *queue_lwp;
    123      1.1  reinoud 	kcondvar_t		  discstrat_cv;		/* to wait on       */
    124      1.1  reinoud 	kmutex_t		  discstrat_mutex;	/* disc strategy    */
    125      1.1  reinoud 	kmutex_t		  seqwrite_mutex;	/* protect mappings */
    126      1.1  reinoud 
    127  1.9.4.4      snj 	int			  thread_running;	/* thread control */
    128      1.1  reinoud 	int			  run_thread;		/* thread control */
    129      1.1  reinoud 	int			  thread_finished;	/* thread control */
    130      1.1  reinoud 	int			  cur_queue;
    131      1.1  reinoud 
    132      1.1  reinoud 	int			  num_floating;
    133      1.1  reinoud 	int			  num_queued[UDF_SHED_MAX];
    134      1.1  reinoud 	struct bufq_state	 *queues[UDF_SHED_MAX];
    135      1.1  reinoud 	struct timespec		  last_queued[UDF_SHED_MAX];
    136      1.1  reinoud 	struct disk_strategy	  old_strategy_setting;
    137      1.1  reinoud 
    138      1.1  reinoud 	struct pool		  eccline_pool;
    139      1.1  reinoud 	struct pool		  ecclineblob_pool;
    140      1.1  reinoud 	LIST_HEAD(, udf_eccline)  eccline_hash[UDF_ECCBUF_HASHSIZE];
    141      1.1  reinoud };
    142      1.1  reinoud 
    143      1.1  reinoud /* --------------------------------------------------------------------- */
    144      1.1  reinoud 
/* thin wrappers around the eccline lock/unlock functions */
#define UDF_LOCK_ECCLINE(eccline) udf_lock_eccline(eccline)
#define UDF_UNLOCK_ECCLINE(eccline) udf_unlock_eccline(eccline)
    147      1.1  reinoud 
    148      1.1  reinoud /* can be called with or without discstrat lock */
    149      1.1  reinoud static void
    150      1.1  reinoud udf_lock_eccline(struct udf_eccline *eccline)
    151      1.1  reinoud {
    152      1.1  reinoud 	struct strat_private *priv = PRIV(eccline->ump);
    153      1.1  reinoud 	int waslocked, ret;
    154      1.1  reinoud 
    155      1.1  reinoud 	waslocked = mutex_owned(&priv->discstrat_mutex);
    156      1.1  reinoud 	if (!waslocked)
    157      1.1  reinoud 		mutex_enter(&priv->discstrat_mutex);
    158      1.1  reinoud 
    159      1.1  reinoud 	/* wait until its unlocked first */
    160      1.1  reinoud 	while (eccline->flags & ECC_LOCKED) {
    161      1.1  reinoud 		eccline->flags |= ECC_WANTED;
    162      1.1  reinoud 		ret = cv_timedwait(&priv->discstrat_cv, &priv->discstrat_mutex,
    163      1.1  reinoud 			hz/8);
    164      1.1  reinoud 		if (ret == EWOULDBLOCK)
    165      1.1  reinoud 			DPRINTF(LOCKING, ("eccline lock helt, waiting for "
    166      1.1  reinoud 				"release"));
    167      1.1  reinoud 	}
    168      1.1  reinoud 	eccline->flags |= ECC_LOCKED;
    169      1.1  reinoud 	eccline->flags &= ~ECC_WANTED;
    170      1.1  reinoud 
    171      1.1  reinoud 	if (!waslocked)
    172      1.1  reinoud 		mutex_exit(&priv->discstrat_mutex);
    173      1.1  reinoud }
    174      1.1  reinoud 
    175      1.1  reinoud 
    176      1.1  reinoud /* can be called with or without discstrat lock */
    177      1.1  reinoud static void
    178      1.1  reinoud udf_unlock_eccline(struct udf_eccline *eccline)
    179      1.1  reinoud {
    180      1.1  reinoud 	struct strat_private *priv = PRIV(eccline->ump);
    181      1.1  reinoud 	int waslocked;
    182      1.1  reinoud 
    183      1.1  reinoud 	waslocked = mutex_owned(&priv->discstrat_mutex);
    184      1.1  reinoud 	if (!waslocked)
    185      1.1  reinoud 		mutex_enter(&priv->discstrat_mutex);
    186      1.1  reinoud 
    187      1.1  reinoud 	eccline->flags &= ~ECC_LOCKED;
    188      1.1  reinoud 	cv_broadcast(&priv->discstrat_cv);
    189      1.1  reinoud 
    190      1.1  reinoud 	if (!waslocked)
    191      1.1  reinoud 		mutex_exit(&priv->discstrat_mutex);
    192      1.1  reinoud }
    193      1.1  reinoud 
    194      1.1  reinoud 
    195      1.1  reinoud /* NOTE discstrat_mutex should be held! */
    196      1.1  reinoud static void
    197      1.1  reinoud udf_dispose_eccline(struct udf_eccline *eccline)
    198      1.1  reinoud {
    199      1.1  reinoud 	struct strat_private *priv = PRIV(eccline->ump);
    200      1.1  reinoud 	struct buf *ret;
    201      1.1  reinoud 
    202      1.1  reinoud 	KASSERT(mutex_owned(&priv->discstrat_mutex));
    203      1.1  reinoud 
    204      1.1  reinoud 	KASSERT(eccline->refcnt == 0);
    205      1.1  reinoud 	KASSERT(eccline->dirty  == 0);
    206      1.1  reinoud 
    207      1.3  reinoud 	DPRINTF(ECCLINE, ("dispose eccline with start sector %d, "
    208      1.1  reinoud 		"present %0"PRIx64"\n", eccline->start_sector,
    209      1.1  reinoud 		eccline->present));
    210      1.1  reinoud 
    211      1.1  reinoud 	if (eccline->queued_on) {
    212      1.1  reinoud 		ret = BUFQ_CANCEL(priv->queues[eccline->queued_on], eccline->buf);
    213      1.1  reinoud 		KASSERT(ret == eccline->buf);
    214      1.1  reinoud 		priv->num_queued[eccline->queued_on]--;
    215      1.1  reinoud 	}
    216      1.1  reinoud 	LIST_REMOVE(eccline, hashchain);
    217      1.1  reinoud 
    218      1.1  reinoud 	if (eccline->flags & ECC_FLOATING) {
    219      1.1  reinoud 		eccline->flags &= ~ECC_FLOATING;
    220      1.1  reinoud 		priv->num_floating--;
    221      1.1  reinoud 	}
    222      1.1  reinoud 
    223      1.1  reinoud 	putiobuf(eccline->buf);
    224      1.1  reinoud 	pool_put(&priv->ecclineblob_pool, eccline->blob);
    225      1.1  reinoud 	pool_put(&priv->eccline_pool, eccline);
    226      1.1  reinoud }
    227      1.1  reinoud 
    228      1.1  reinoud 
    229      1.1  reinoud /* NOTE discstrat_mutex should be held! */
    230      1.1  reinoud static void
    231      1.1  reinoud udf_push_eccline(struct udf_eccline *eccline, int newqueue)
    232      1.1  reinoud {
    233      1.1  reinoud 	struct strat_private *priv = PRIV(eccline->ump);
    234      1.1  reinoud 	struct buf *ret;
    235      1.1  reinoud 	int curqueue;
    236      1.1  reinoud 
    237      1.1  reinoud 	KASSERT(mutex_owned(&priv->discstrat_mutex));
    238      1.1  reinoud 
    239      1.1  reinoud 	DPRINTF(PARANOIA, ("DEBUG: buf %p pushed on queue %d\n", eccline->buf, newqueue));
    240      1.1  reinoud 
    241      1.1  reinoud 	/* requeue */
    242      1.1  reinoud 	curqueue = eccline->queued_on;
    243      1.1  reinoud 	if (curqueue) {
    244      1.1  reinoud 		ret = BUFQ_CANCEL(priv->queues[curqueue], eccline->buf);
    245      1.1  reinoud 
    246      1.1  reinoud 		DPRINTF(PARANOIA, ("push_eccline BUFQ_CANCEL returned %p when "
    247      1.1  reinoud 			"requested to remove %p from queue %d\n", ret,
    248      1.1  reinoud 			eccline->buf, curqueue));
    249      1.1  reinoud #ifdef DIAGNOSTIC
    250      1.1  reinoud 		if (ret == NULL) {
    251      1.1  reinoud 			int i;
    252      1.1  reinoud 
    253      1.1  reinoud 			printf("udf_push_eccline: bufq_cancel can't find "
    254      1.1  reinoud 				"buffer; dumping queues\n");
    255      1.1  reinoud 			for (i = 1; i < UDF_SHED_MAX; i++) {
    256      1.1  reinoud 				printf("queue %d\n\t", i);
    257      1.1  reinoud 				ret = BUFQ_GET(priv->queues[i]);
    258      1.1  reinoud 				while (ret) {
    259      1.1  reinoud 					printf("%p ", ret);
    260      1.1  reinoud 					if (ret == eccline->buf)
    261      1.1  reinoud 						printf("[<-] ");
    262      1.1  reinoud 					ret = BUFQ_GET(priv->queues[i]);
    263      1.1  reinoud 				}
    264      1.1  reinoud 				printf("\n");
    265      1.1  reinoud 			}
    266      1.1  reinoud 			panic("fatal queue bug; exit");
    267      1.1  reinoud 		}
    268      1.1  reinoud #endif
    269      1.1  reinoud 
    270      1.1  reinoud 		KASSERT(ret == eccline->buf);
    271      1.1  reinoud 		priv->num_queued[curqueue]--;
    272      1.1  reinoud 	}
    273      1.1  reinoud 
    274  1.9.4.1      snj 	/* set buffer block numbers to make sure its queued correctly */
    275  1.9.4.1      snj 	eccline->buf->b_lblkno   = eccline->start_sector;
    276  1.9.4.1      snj 	eccline->buf->b_blkno    = eccline->start_sector;
    277  1.9.4.1      snj 	eccline->buf->b_rawblkno = eccline->start_sector;
    278  1.9.4.1      snj 
    279      1.1  reinoud 	BUFQ_PUT(priv->queues[newqueue], eccline->buf);
    280      1.1  reinoud 	eccline->queued_on = newqueue;
    281      1.1  reinoud 	priv->num_queued[newqueue]++;
    282      1.1  reinoud 	vfs_timestamp(&priv->last_queued[newqueue]);
    283      1.1  reinoud 
    284      1.1  reinoud 	if (eccline->flags & ECC_FLOATING) {
    285      1.1  reinoud 		eccline->flags &= ~ECC_FLOATING;
    286      1.1  reinoud 		priv->num_floating--;
    287      1.1  reinoud 	}
    288      1.1  reinoud 
    289  1.9.4.5      snj 	/* tickle disc strategy statemachine */
    290  1.9.4.5      snj 	if (newqueue != UDF_SHED_IDLE)
    291      1.1  reinoud 		cv_signal(&priv->discstrat_cv);
    292      1.1  reinoud }
    293      1.1  reinoud 
    294      1.1  reinoud 
    295      1.1  reinoud static struct udf_eccline *
    296      1.1  reinoud udf_pop_eccline(struct strat_private *priv, int queued_on)
    297      1.1  reinoud {
    298      1.1  reinoud 	struct udf_eccline *eccline;
    299      1.1  reinoud 	struct buf *buf;
    300      1.1  reinoud 
    301      1.1  reinoud 	KASSERT(mutex_owned(&priv->discstrat_mutex));
    302      1.1  reinoud 
    303      1.1  reinoud 	buf = BUFQ_GET(priv->queues[queued_on]);
    304      1.1  reinoud 	if (!buf) {
    305      1.1  reinoud 		KASSERT(priv->num_queued[queued_on] == 0);
    306      1.1  reinoud 		return NULL;
    307      1.1  reinoud 	}
    308      1.1  reinoud 
    309      1.1  reinoud 	eccline = BTOE(buf);
    310      1.1  reinoud 	KASSERT(eccline->queued_on == queued_on);
    311      1.1  reinoud 	eccline->queued_on = 0;
    312      1.1  reinoud 	priv->num_queued[queued_on]--;
    313      1.1  reinoud 
    314      1.1  reinoud 	if (eccline->flags & ECC_FLOATING)
    315      1.1  reinoud 		panic("popping already marked floating eccline");
    316      1.1  reinoud 	eccline->flags |= ECC_FLOATING;
    317      1.1  reinoud 	priv->num_floating++;
    318      1.1  reinoud 
    319      1.1  reinoud 	DPRINTF(PARANOIA, ("DEBUG: buf %p popped from queue %d\n",
    320      1.1  reinoud 		eccline->buf, queued_on));
    321      1.1  reinoud 
    322      1.1  reinoud 	return eccline;
    323      1.1  reinoud }
    324      1.1  reinoud 
    325      1.1  reinoud 
    326      1.1  reinoud static struct udf_eccline *
    327      1.1  reinoud udf_geteccline(struct udf_mount *ump, uint32_t sector, int flags)
    328      1.1  reinoud {
    329      1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    330      1.1  reinoud 	struct udf_eccline *eccline;
    331      1.1  reinoud 	uint32_t start_sector, lb_size, blobsize;
    332      1.1  reinoud 	uint8_t *eccline_blob;
    333      1.1  reinoud 	int line, line_offset;
    334      1.1  reinoud 	int num_busy, ret;
    335      1.1  reinoud 
    336      1.1  reinoud 	line_offset  = sector % ump->packet_size;
    337      1.1  reinoud 	start_sector = sector - line_offset;
    338      1.1  reinoud 	line = (start_sector/ump->packet_size) & UDF_ECCBUF_HASHMASK;
    339      1.1  reinoud 
    340      1.1  reinoud 	mutex_enter(&priv->discstrat_mutex);
    341  1.9.4.4      snj 	KASSERT(priv->thread_running);
    342      1.1  reinoud 
    343      1.1  reinoud retry:
    344      1.3  reinoud 	DPRINTF(ECCLINE, ("get line sector %d, line %d\n", sector, line));
    345      1.1  reinoud 	LIST_FOREACH(eccline, &priv->eccline_hash[line], hashchain) {
    346      1.1  reinoud 		if (eccline->start_sector == start_sector) {
    347      1.3  reinoud 			DPRINTF(ECCLINE, ("\tfound eccline, start_sector %d\n",
    348      1.1  reinoud 				eccline->start_sector));
    349      1.1  reinoud 
    350      1.1  reinoud 			UDF_LOCK_ECCLINE(eccline);
    351      1.1  reinoud 			/* move from freelist (!) */
    352      1.1  reinoud 			if (eccline->queued_on == UDF_SHED_FREE) {
    353      1.3  reinoud 				DPRINTF(ECCLINE, ("was on freelist\n"));
    354      1.1  reinoud 				KASSERT(eccline->refcnt == 0);
    355      1.1  reinoud 				udf_push_eccline(eccline, UDF_SHED_IDLE);
    356      1.1  reinoud 			}
    357      1.1  reinoud 			eccline->refcnt++;
    358      1.1  reinoud 			mutex_exit(&priv->discstrat_mutex);
    359      1.1  reinoud 			return eccline;
    360      1.1  reinoud 		}
    361      1.1  reinoud 	}
    362      1.1  reinoud 
    363      1.3  reinoud 	DPRINTF(ECCLINE, ("\tnot found in eccline cache\n"));
    364      1.1  reinoud 	/* not found in eccline cache */
    365      1.1  reinoud 
    366      1.1  reinoud 	lb_size  = udf_rw32(ump->logical_vol->lb_size);
    367      1.1  reinoud 	blobsize = ump->packet_size * lb_size;
    368      1.1  reinoud 
    369      1.1  reinoud 	/* dont allow too many pending requests */
    370      1.3  reinoud 	DPRINTF(ECCLINE, ("\tallocating new eccline\n"));
    371      1.1  reinoud 	num_busy = (priv->num_queued[UDF_SHED_SEQWRITING] + priv->num_floating);
    372      1.1  reinoud 	if ((flags & ECC_SEQWRITING) && (num_busy > UDF_ECCLINE_MAXBUSY)) {
    373      1.1  reinoud 		ret = cv_timedwait(&priv->discstrat_cv,
    374      1.1  reinoud 			&priv->discstrat_mutex, hz/8);
    375      1.1  reinoud 		goto retry;
    376      1.1  reinoud 	}
    377      1.1  reinoud 
    378      1.1  reinoud 	eccline_blob = pool_get(&priv->ecclineblob_pool, PR_NOWAIT);
    379      1.1  reinoud 	eccline = pool_get(&priv->eccline_pool, PR_NOWAIT);
    380      1.1  reinoud 	if ((eccline_blob == NULL) || (eccline == NULL)) {
    381      1.1  reinoud 		if (eccline_blob)
    382      1.1  reinoud 			pool_put(&priv->ecclineblob_pool, eccline_blob);
    383      1.1  reinoud 		if (eccline)
    384      1.1  reinoud 			pool_put(&priv->eccline_pool, eccline);
    385      1.1  reinoud 
    386      1.1  reinoud 		/* out of memory for now; canibalise freelist */
    387      1.1  reinoud 		eccline = udf_pop_eccline(priv, UDF_SHED_FREE);
    388      1.1  reinoud 		if (eccline == NULL) {
    389      1.1  reinoud 			/* serious trouble; wait and retry */
    390      1.1  reinoud 			cv_timedwait(&priv->discstrat_cv,
    391      1.1  reinoud 				&priv->discstrat_mutex, hz/8);
    392      1.1  reinoud 			goto retry;
    393      1.1  reinoud 		}
    394      1.1  reinoud 		/* push back line if we're waiting for it */
    395      1.1  reinoud 		if (eccline->flags & ECC_WANTED) {
    396      1.1  reinoud 			udf_push_eccline(eccline, UDF_SHED_IDLE);
    397      1.1  reinoud 			goto retry;
    398      1.1  reinoud 		}
    399      1.1  reinoud 
    400      1.1  reinoud 		/* unlink this entry */
    401      1.1  reinoud 		LIST_REMOVE(eccline, hashchain);
    402      1.1  reinoud 
    403      1.1  reinoud 		KASSERT(eccline->flags & ECC_FLOATING);
    404      1.1  reinoud 
    405      1.1  reinoud 		eccline_blob = eccline->blob;
    406      1.1  reinoud 		memset(eccline, 0, sizeof(struct udf_eccline));
    407      1.1  reinoud 		eccline->flags = ECC_FLOATING;
    408      1.1  reinoud 	} else {
    409      1.1  reinoud 		memset(eccline, 0, sizeof(struct udf_eccline));
    410      1.1  reinoud 		eccline->flags = ECC_FLOATING;
    411      1.1  reinoud 		priv->num_floating++;
    412      1.1  reinoud 	}
    413      1.1  reinoud 
    414      1.1  reinoud 	eccline->queued_on = 0;
    415      1.1  reinoud 	eccline->blob = eccline_blob;
    416      1.1  reinoud 	eccline->buf  = getiobuf(NULL, true);
    417      1.1  reinoud 	eccline->buf->b_private = eccline;	/* IMPORTANT */
    418      1.1  reinoud 
    419      1.1  reinoud 	/* initialise eccline blob */
    420      1.1  reinoud 	memset(eccline->blob, 0, blobsize);
    421      1.1  reinoud 
    422      1.1  reinoud 	eccline->ump = ump;
    423      1.1  reinoud 	eccline->present = eccline->readin = eccline->dirty = 0;
    424      1.1  reinoud 	eccline->error = 0;
    425      1.1  reinoud 	eccline->refcnt = 0;
    426  1.9.4.1      snj 
    427  1.9.4.1      snj 	eccline->start_sector    = start_sector;
    428  1.9.4.1      snj 	eccline->buf->b_lblkno   = start_sector;
    429  1.9.4.1      snj 	eccline->buf->b_blkno    = start_sector;
    430  1.9.4.1      snj 	eccline->buf->b_rawblkno = start_sector;
    431      1.1  reinoud 
    432      1.1  reinoud 	LIST_INSERT_HEAD(&priv->eccline_hash[line], eccline, hashchain);
    433      1.1  reinoud 
    434      1.1  reinoud 	/*
    435      1.1  reinoud 	 * TODO possible optimalisation for checking overlap with partitions
    436      1.1  reinoud 	 * to get a clue on future eccline usage
    437      1.1  reinoud 	 */
    438      1.1  reinoud 	eccline->refcnt++;
    439      1.1  reinoud 	UDF_LOCK_ECCLINE(eccline);
    440      1.1  reinoud 
    441      1.1  reinoud 	mutex_exit(&priv->discstrat_mutex);
    442      1.1  reinoud 
    443      1.1  reinoud 	return eccline;
    444      1.1  reinoud }
    445      1.1  reinoud 
    446      1.1  reinoud 
    447      1.1  reinoud static void
    448      1.1  reinoud udf_puteccline(struct udf_eccline *eccline)
    449      1.1  reinoud {
    450      1.1  reinoud 	struct strat_private *priv = PRIV(eccline->ump);
    451      1.1  reinoud 	struct udf_mount *ump = eccline->ump;
    452      1.1  reinoud 	uint64_t allbits = ((uint64_t) 1 << ump->packet_size)-1;
    453      1.1  reinoud 
    454      1.1  reinoud 	mutex_enter(&priv->discstrat_mutex);
    455      1.1  reinoud 
    456      1.1  reinoud 	/* clear directly all readin requests from present ones */
    457      1.1  reinoud 	if (eccline->readin & eccline->present) {
    458      1.1  reinoud 		/* clear all read bits that are already read in */
    459      1.1  reinoud 		eccline->readin &= (~eccline->present) & allbits;
    460      1.1  reinoud 		wakeup(eccline);
    461      1.1  reinoud 	}
    462      1.1  reinoud 
    463      1.3  reinoud 	DPRINTF(ECCLINE, ("put eccline start sector %d, refcnt %d\n",
    464      1.1  reinoud 		eccline->start_sector, eccline->refcnt));
    465      1.1  reinoud 
    466  1.9.4.2      snj 	/* if we have active nodes we dont set it on seqwriting */
    467      1.1  reinoud 	if (eccline->refcnt > 1)
    468      1.1  reinoud 		eccline->flags &= ~ECC_SEQWRITING;
    469      1.1  reinoud 
    470  1.9.4.2      snj 	vfs_timestamp(&eccline->wait_time);
    471  1.9.4.2      snj 	eccline->wait_time.tv_sec += ECC_WAITTIME;
    472  1.9.4.2      snj 	udf_push_eccline(eccline, UDF_SHED_WAITING);
    473      1.1  reinoud 
    474      1.1  reinoud 	KASSERT(eccline->refcnt >= 1);
    475      1.1  reinoud 	eccline->refcnt--;
    476      1.1  reinoud 	UDF_UNLOCK_ECCLINE(eccline);
    477      1.1  reinoud 
    478  1.9.4.4      snj 	wakeup(eccline);
    479      1.1  reinoud 	mutex_exit(&priv->discstrat_mutex);
    480      1.1  reinoud }
    481      1.1  reinoud 
    482      1.1  reinoud /* --------------------------------------------------------------------- */
    483      1.1  reinoud 
    484      1.1  reinoud static int
    485      1.5  reinoud udf_create_nodedscr_rmw(struct udf_strat_args *args)
    486      1.1  reinoud {
    487      1.1  reinoud 	union dscrptr   **dscrptr  = &args->dscr;
    488      1.1  reinoud 	struct udf_mount *ump      = args->ump;
    489      1.1  reinoud 	struct long_ad   *icb      = args->icb;
    490      1.1  reinoud 	struct udf_eccline *eccline;
    491      1.1  reinoud 	uint64_t bit;
    492      1.1  reinoud 	uint32_t sectornr, lb_size, dummy;
    493      1.1  reinoud 	uint8_t *mem;
    494      1.1  reinoud 	int error, eccsect;
    495      1.1  reinoud 
    496      1.1  reinoud 	error = udf_translate_vtop(ump, icb, &sectornr, &dummy);
    497      1.1  reinoud 	if (error)
    498      1.1  reinoud 		return error;
    499      1.1  reinoud 
    500      1.1  reinoud 	lb_size  = udf_rw32(ump->logical_vol->lb_size);
    501      1.1  reinoud 
    502      1.1  reinoud 	/* get our eccline */
    503      1.1  reinoud 	eccline = udf_geteccline(ump, sectornr, 0);
    504      1.1  reinoud 	eccsect = sectornr - eccline->start_sector;
    505      1.1  reinoud 
    506      1.1  reinoud 	bit = (uint64_t) 1 << eccsect;
    507      1.1  reinoud 	eccline->readin  &= ~bit;	/* just in case */
    508      1.1  reinoud 	eccline->present |=  bit;
    509      1.1  reinoud 	eccline->dirty   &= ~bit;	/* Err... euhm... clean? */
    510      1.1  reinoud 
    511      1.1  reinoud 	eccline->refcnt++;
    512      1.1  reinoud 
    513      1.1  reinoud 	/* clear space */
    514      1.1  reinoud 	mem = ((uint8_t *) eccline->blob) + eccsect * lb_size;
    515      1.1  reinoud 	memset(mem, 0, lb_size);
    516      1.1  reinoud 
    517      1.1  reinoud 	udf_puteccline(eccline);
    518      1.1  reinoud 
    519      1.1  reinoud 	*dscrptr = (union dscrptr *) mem;
    520      1.1  reinoud 	return 0;
    521      1.1  reinoud }
    522      1.1  reinoud 
    523      1.1  reinoud 
    524      1.1  reinoud static void
    525      1.5  reinoud udf_free_nodedscr_rmw(struct udf_strat_args *args)
    526      1.1  reinoud {
    527      1.1  reinoud 	struct udf_mount *ump  = args->ump;
    528      1.1  reinoud 	struct long_ad   *icb  = args->icb;
    529      1.1  reinoud 	struct udf_eccline *eccline;
    530      1.1  reinoud 	uint64_t bit;
    531      1.1  reinoud 	uint32_t sectornr, dummy;
    532      1.1  reinoud 	int error, eccsect;
    533      1.1  reinoud 
    534      1.1  reinoud 	error = udf_translate_vtop(ump, icb, &sectornr, &dummy);
    535      1.1  reinoud 	if (error)
    536      1.1  reinoud 		return;
    537      1.1  reinoud 
    538      1.1  reinoud 	/* get our eccline */
    539      1.1  reinoud 	eccline = udf_geteccline(ump, sectornr, 0);
    540      1.1  reinoud 	eccsect = sectornr - eccline->start_sector;
    541      1.1  reinoud 
    542      1.1  reinoud 	bit = (uint64_t) 1 << eccsect;
    543      1.1  reinoud 	eccline->readin &= ~bit;	/* just in case */
    544      1.1  reinoud 
    545      1.1  reinoud 	KASSERT(eccline->refcnt >= 1);
    546      1.1  reinoud 	eccline->refcnt--;
    547      1.1  reinoud 
    548      1.1  reinoud 	udf_puteccline(eccline);
    549      1.1  reinoud }
    550      1.1  reinoud 
    551      1.1  reinoud 
    552      1.1  reinoud static int
    553      1.5  reinoud udf_read_nodedscr_rmw(struct udf_strat_args *args)
    554      1.1  reinoud {
    555      1.1  reinoud 	union dscrptr   **dscrptr = &args->dscr;
    556      1.1  reinoud 	struct udf_mount *ump = args->ump;
    557      1.1  reinoud 	struct long_ad   *icb = args->icb;
    558      1.1  reinoud 	struct udf_eccline *eccline;
    559      1.1  reinoud 	uint64_t bit;
    560      1.1  reinoud 	uint32_t sectornr, dummy;
    561      1.1  reinoud 	uint8_t *pos;
    562      1.1  reinoud 	int sector_size = ump->discinfo.sector_size;
    563      1.1  reinoud 	int lb_size = udf_rw32(ump->logical_vol->lb_size);
    564      1.1  reinoud 	int i, error, dscrlen, eccsect;
    565      1.1  reinoud 
    566      1.1  reinoud 	lb_size = lb_size;
    567      1.1  reinoud 	KASSERT(sector_size == lb_size);
    568      1.1  reinoud 	error = udf_translate_vtop(ump, icb, &sectornr, &dummy);
    569      1.1  reinoud 	if (error)
    570      1.1  reinoud 		return error;
    571      1.1  reinoud 
    572      1.1  reinoud 	/* get our eccline */
    573      1.1  reinoud 	eccline = udf_geteccline(ump, sectornr, 0);
    574      1.1  reinoud 	eccsect = sectornr - eccline->start_sector;
    575      1.1  reinoud 
    576      1.1  reinoud 	bit = (uint64_t) 1 << eccsect;
    577      1.1  reinoud 	if ((eccline->present & bit) == 0) {
    578      1.1  reinoud 		/* mark bit for readin */
    579      1.1  reinoud 		eccline->readin |= bit;
    580      1.1  reinoud 		eccline->refcnt++;	/* prevent recycling */
    581      1.1  reinoud 		KASSERT(eccline->bufs[eccsect] == NULL);
    582      1.1  reinoud 		udf_puteccline(eccline);
    583      1.1  reinoud 
    584      1.1  reinoud 		/* wait for completion; XXX remodel to lock bit code */
    585      1.1  reinoud 		error = 0;
    586      1.1  reinoud 		while ((eccline->present & bit) == 0) {
    587      1.1  reinoud 			tsleep(eccline, PRIBIO+1, "udflvdrd", hz/8);
    588      1.1  reinoud 			if (eccline->error & bit) {
    589      1.1  reinoud 				KASSERT(eccline->refcnt >= 1);
    590      1.1  reinoud 				eccline->refcnt--;	/* undo temp refcnt */
    591      1.1  reinoud 				*dscrptr = NULL;
    592      1.1  reinoud 				return EIO;		/* XXX error code */
    593      1.1  reinoud 			}
    594      1.1  reinoud 		}
    595      1.1  reinoud 
    596      1.1  reinoud 		/* reget our line */
    597      1.1  reinoud 		eccline = udf_geteccline(ump, sectornr, 0);
    598      1.1  reinoud 		KASSERT(eccline->refcnt >= 1);
    599      1.1  reinoud 		eccline->refcnt--;	/* undo refcnt */
    600      1.1  reinoud 	}
    601      1.1  reinoud 
    602      1.1  reinoud 	*dscrptr = (union dscrptr *)
    603      1.1  reinoud 		(((uint8_t *) eccline->blob) + eccsect * sector_size);
    604      1.1  reinoud 
    605      1.1  reinoud 	/* code from read_phys_descr */
    606      1.1  reinoud 	/* check if its a valid tag */
    607      1.1  reinoud 	error = udf_check_tag(*dscrptr);
    608      1.1  reinoud 	if (error) {
    609      1.1  reinoud 		/* check if its an empty block */
    610      1.1  reinoud 		pos = (uint8_t *) *dscrptr;
    611      1.1  reinoud 		for (i = 0; i < sector_size; i++, pos++) {
    612      1.1  reinoud 			if (*pos) break;
    613      1.1  reinoud 		}
    614      1.1  reinoud 		if (i == sector_size) {
    615      1.1  reinoud 			/* return no error but with no dscrptr */
    616      1.1  reinoud 			error = 0;
    617      1.1  reinoud 		}
    618      1.1  reinoud 		*dscrptr = NULL;
    619      1.1  reinoud 		udf_puteccline(eccline);
    620      1.1  reinoud 		return error;
    621      1.1  reinoud 	}
    622      1.1  reinoud 
    623      1.1  reinoud 	/* calculate descriptor size */
    624      1.1  reinoud 	dscrlen = udf_tagsize(*dscrptr, sector_size);
    625      1.1  reinoud 	error = udf_check_tag_payload(*dscrptr, dscrlen);
    626      1.1  reinoud 	if (error) {
    627      1.1  reinoud 		*dscrptr = NULL;
    628      1.1  reinoud 		udf_puteccline(eccline);
    629      1.1  reinoud 		return error;
    630      1.1  reinoud 	}
    631      1.1  reinoud 
    632      1.1  reinoud 	eccline->refcnt++;
    633      1.1  reinoud 	udf_puteccline(eccline);
    634      1.1  reinoud 
    635      1.1  reinoud 	return 0;
    636      1.1  reinoud }
    637      1.1  reinoud 
    638      1.1  reinoud 
    639      1.1  reinoud static int
    640      1.5  reinoud udf_write_nodedscr_rmw(struct udf_strat_args *args)
    641      1.1  reinoud {
                          	/*
                          	 * Strategy hook for writing a node descriptor. The descriptor is
                          	 * stamped with its logical sector number, its tag and CRC sums are
                          	 * recalculated and its sector is flagged dirty in the eccline that
                          	 * holds it; the eccline is then handed back with udf_puteccline().
                          	 *
                          	 * args->ump, args->icb, args->dscr and args->udf_node are used.
                          	 *
                          	 * Returns the error from udf_translate_vtop() when the icb cannot
                          	 * be translated, otherwise 0.
                          	 */
    642      1.1  reinoud 	union dscrptr    *dscrptr = args->dscr;
    643      1.1  reinoud 	struct udf_mount *ump = args->ump;
    644      1.1  reinoud 	struct long_ad   *icb = args->icb;
    645      1.1  reinoud 	struct udf_node *udf_node = args->udf_node;
    646      1.1  reinoud 	struct udf_eccline *eccline;
    647      1.1  reinoud 	uint64_t bit;
    648      1.1  reinoud 	uint32_t sectornr, logsectornr, dummy;
    649      1.1  reinoud 	// int waitfor  = args->waitfor;
    650      1.1  reinoud 	int sector_size = ump->discinfo.sector_size;
    651      1.1  reinoud 	int lb_size = udf_rw32(ump->logical_vol->lb_size);
    652      1.1  reinoud 	int error, eccsect;
    653      1.1  reinoud 
                          	/*
                          	 * Self-assignment; presumably only there to keep lb_size referenced
                          	 * when KASSERT() compiles to nothing -- confirm.
                          	 */
    654      1.1  reinoud 	lb_size = lb_size;
    655      1.1  reinoud 	KASSERT(sector_size == lb_size);
    656      1.1  reinoud 	sectornr    = 0;
                          	/* translate the descriptor's icb into a sector number */
    657      1.1  reinoud 	error = udf_translate_vtop(ump, icb, &sectornr, &dummy);
    658      1.1  reinoud 	if (error)
    659      1.1  reinoud 		return error;
    660      1.1  reinoud 
    661      1.5  reinoud 	/* add reference to the vnode to prevent recycling */
    662      1.5  reinoud 	vhold(udf_node->vnode);
    663      1.5  reinoud 
    664      1.1  reinoud 	/* get our eccline */
    665      1.1  reinoud 	eccline = udf_geteccline(ump, sectornr, 0);
                          	/* index of our sector within the eccline */
    666      1.1  reinoud 	eccsect = sectornr - eccline->start_sector;
    667      1.1  reinoud 
    668      1.1  reinoud 	bit = (uint64_t) 1 << eccsect;
    669      1.1  reinoud 
    670      1.1  reinoud 	/* old callback still pending? */
    671      1.1  reinoud 	if (eccline->bufs[eccsect]) {
    672      1.5  reinoud 		DPRINTF(WRITE, ("udf_write_nodedscr_rmw: writing descriptor"
    673      1.1  reinoud 					" over buffer?\n"));
                          		/* complete the waiting buf without error and free the slot */
    674      1.1  reinoud 		nestiobuf_done(eccline->bufs[eccsect],
    675      1.1  reinoud 				eccline->bufs_len[eccsect],
    676      1.1  reinoud 				0);
    677      1.1  reinoud 		eccline->bufs[eccsect] = NULL;
    678      1.1  reinoud 	}
    679      1.1  reinoud 
    680      1.1  reinoud 	/* set sector number in the descriptor and validate */
                          	/*
                          	 * The descriptor is expected to live inside the eccline blob
                          	 * already: the address is recomputed from the blob and asserted to
                          	 * be the very pointer passed in args->dscr.
                          	 */
    681      1.1  reinoud 	dscrptr = (union dscrptr *)
    682      1.1  reinoud 		(((uint8_t *) eccline->blob) + eccsect * sector_size);
    683      1.1  reinoud 	KASSERT(dscrptr == args->dscr);
    684      1.1  reinoud 
    685      1.1  reinoud 	logsectornr = udf_rw32(icb->loc.lb_num);
    686      1.1  reinoud 	dscrptr->tag.tag_loc = udf_rw32(logsectornr);
    687      1.1  reinoud 	udf_validate_tag_and_crc_sums(dscrptr);
    688      1.1  reinoud 
    689      1.1  reinoud 	udf_fixup_node_internals(ump, (uint8_t *) dscrptr, UDF_C_NODE);
    690      1.1  reinoud 
    691      1.1  reinoud 	/* set our flags */
    692      1.1  reinoud 	KASSERT(eccline->present & bit);
    693      1.1  reinoud 	eccline->dirty |= bit;
    694      1.1  reinoud 
    695      1.1  reinoud 	KASSERT(udf_tagsize(dscrptr, sector_size) <= sector_size);
    696      1.1  reinoud 
    697      1.1  reinoud 	udf_puteccline(eccline);
    698      1.1  reinoud 
                          	/*
                          	 * Drop the hold taken above and account for this descriptor. When
                          	 * no descriptor writes remain outstanding the node is unlocked and
                          	 * sleepers on the counter are woken.
                          	 */
    699      1.5  reinoud 	holdrele(udf_node->vnode);
    700      1.5  reinoud 	udf_node->outstanding_nodedscr--;
    701      1.5  reinoud 	if (udf_node->outstanding_nodedscr == 0) {
    702      1.5  reinoud 		UDF_UNLOCK_NODE(udf_node, udf_node->i_flags & IN_CALLBACK_ULK);
    703      1.5  reinoud 		wakeup(&udf_node->outstanding_nodedscr);
    704      1.5  reinoud 	}
    705      1.5  reinoud 
    706      1.1  reinoud 	/* XXX waitfor not used */
    707      1.1  reinoud 	return 0;
    708      1.1  reinoud }
    709      1.1  reinoud 
    710      1.1  reinoud 
    711      1.1  reinoud static void
    712      1.1  reinoud udf_queuebuf_rmw(struct udf_strat_args *args)
    713      1.1  reinoud {
                          	/*
                          	 * Queue the nested buffer args->nestbuf on the read-modify-write
                          	 * strategy. One of three paths is taken, chosen from B_READ and
                          	 * buf->b_udf_c_type:
                          	 *
                          	 *  - reading: sectors already present in their eccline are copied
                          	 *    out and completed at once; for the others the `readin' bit is
                          	 *    set and the buf is parked in the eccline's per-sector slot.
                          	 *  - writing (UDF_C_ABSOLUTE, UDF_C_DSCR, UDF_C_NODE): the data is
                          	 *    copied into the ecclines at the buffer's own block number.
                          	 *  - sequential writing (every other write): the buffer is first
                          	 *    allocated with udf_late_allocate_buf(), its mappings are
                          	 *    translated with udf_translate_vtop_list() and the data is
                          	 *    then copied into the ecclines, all under seqwrite_mutex.
                          	 *
                          	 * On both write paths the sectors are flagged present and dirty
                          	 * and the buf is completed with nestiobuf_done() right after the
                          	 * copy.
                          	 */
    714      1.1  reinoud 	struct udf_mount *ump = args->ump;
    715      1.1  reinoud 	struct buf *buf = args->nestbuf;
    716      1.6  reinoud 	struct desc_tag *tag;
    717      1.1  reinoud 	struct strat_private *priv = PRIV(ump);
    718      1.1  reinoud 	struct udf_eccline *eccline;
    719      1.1  reinoud 	struct long_ad *node_ad_cpy;
    720      1.1  reinoud 	uint64_t bit, *lmapping, *pmapping, *lmappos, *pmappos, blknr;
    721      1.6  reinoud 	uint32_t buf_len, len, sectors, sectornr, our_sectornr;
    722      1.1  reinoud 	uint32_t bpos;
    723      1.6  reinoud 	uint16_t vpart_num;
    724      1.1  reinoud 	uint8_t *fidblk, *src, *dst;
    725      1.1  reinoud 	int sector_size = ump->discinfo.sector_size;
    726      1.1  reinoud 	int blks = sector_size / DEV_BSIZE;
    727      1.1  reinoud 	int eccsect, what, queue, error;
    728      1.1  reinoud 
    729      1.1  reinoud 	KASSERT(ump);
    730      1.1  reinoud 	KASSERT(buf);
    731      1.1  reinoud 	KASSERT(buf->b_iodone == nestiobuf_iodone);
    732      1.1  reinoud 
                          	/* b_blkno counts DEV_BSIZE blocks; convert to a sector number */
    733      1.1  reinoud 	blknr        = buf->b_blkno;
    734      1.1  reinoud 	our_sectornr = blknr / blks;
    735      1.1  reinoud 
                          	/* pick the queue: reads, in-place writes or sequential writes */
    736      1.1  reinoud 	what = buf->b_udf_c_type;
    737      1.1  reinoud 	queue = UDF_SHED_READING;
    738      1.1  reinoud 	if ((buf->b_flags & B_READ) == 0) {
    739      1.1  reinoud 		/* writing */
    740      1.1  reinoud 		queue = UDF_SHED_SEQWRITING;
    741  1.9.4.7      snj 		if (what == UDF_C_ABSOLUTE)
    742  1.9.4.7      snj 			queue = UDF_SHED_WRITING;
    743      1.1  reinoud 		if (what == UDF_C_DSCR)
    744      1.1  reinoud 			queue = UDF_SHED_WRITING;
    745      1.1  reinoud 		if (what == UDF_C_NODE)
    746      1.1  reinoud 			queue = UDF_SHED_WRITING;
    747      1.1  reinoud 	}
    748      1.1  reinoud 
    749      1.1  reinoud 	if (queue == UDF_SHED_READING) {
    750      1.3  reinoud 		DPRINTF(SHEDULE, ("\nudf_queuebuf_rmw READ %p : sector %d type %d,"
    751      1.1  reinoud 			"b_resid %d, b_bcount %d, b_bufsize %d\n",
    752      1.1  reinoud 			buf, (uint32_t) buf->b_blkno / blks, buf->b_udf_c_type,
    753      1.1  reinoud 			buf->b_resid, buf->b_bcount, buf->b_bufsize));
    754      1.1  reinoud 
    755      1.1  reinoud 		/* mark bits for reading */
    756      1.1  reinoud 		buf_len = buf->b_bcount;
    757      1.1  reinoud 		sectornr = our_sectornr;
    758      1.1  reinoud 		eccline = udf_geteccline(ump, sectornr, 0);
    759      1.1  reinoud 		eccsect = sectornr - eccline->start_sector;
    760      1.1  reinoud 		bpos = 0;
                          		/* walk the buffer one sector at a time */
    761      1.1  reinoud 		while (buf_len) {
    762      1.1  reinoud 			len = MIN(buf_len, sector_size);
                          			/* ran off the end of this eccline; move to the next */
    763      1.1  reinoud 			if (eccsect == ump->packet_size) {
    764      1.1  reinoud 				udf_puteccline(eccline);
    765      1.1  reinoud 				eccline = udf_geteccline(ump, sectornr, 0);
    766      1.1  reinoud 				eccsect = sectornr - eccline->start_sector;
    767      1.1  reinoud 			}
    768      1.1  reinoud 			bit = (uint64_t) 1 << eccsect;
    769      1.1  reinoud 			error = eccline->error & bit ? EIO : 0;
    770      1.1  reinoud 			if (eccline->present & bit) {
                          				/* cached: copy out (unless flagged bad) and finish */
    771      1.1  reinoud 				src = (uint8_t *) eccline->blob +
    772      1.1  reinoud 					eccsect * sector_size;
    773      1.1  reinoud 				dst = (uint8_t *) buf->b_data + bpos;
    774      1.1  reinoud 				if (!error)
    775      1.1  reinoud 					memcpy(dst, src, len);
    776      1.1  reinoud 				nestiobuf_done(buf, len, error);
    777      1.1  reinoud 			} else {
                          				/*
                          				 * not cached: request a read-in and remember where
                          				 * in the buf this sector's data has to go
                          				 */
    778      1.1  reinoud 				eccline->readin |= bit;
    779      1.1  reinoud 				KASSERT(eccline->bufs[eccsect] == NULL);
    780      1.1  reinoud 				eccline->bufs[eccsect] = buf;
    781      1.1  reinoud 				eccline->bufs_bpos[eccsect] = bpos;
    782      1.1  reinoud 				eccline->bufs_len[eccsect] = len;
    783      1.1  reinoud 			}
    784      1.1  reinoud 			bpos += sector_size;
    785      1.1  reinoud 			eccsect++;
    786      1.1  reinoud 			sectornr++;
    787      1.1  reinoud 			buf_len -= len;
    788      1.1  reinoud 		}
    789      1.1  reinoud 		udf_puteccline(eccline);
    790      1.1  reinoud 		return;
    791      1.1  reinoud 	}
    792      1.1  reinoud 
    793      1.1  reinoud 	if (queue == UDF_SHED_WRITING) {
    794      1.3  reinoud 		DPRINTF(SHEDULE, ("\nudf_queuebuf_rmw WRITE %p : sector %d "
    795      1.1  reinoud 			"type %d, b_resid %d, b_bcount %d, b_bufsize %d\n",
    796      1.1  reinoud 			buf, (uint32_t) buf->b_blkno / blks, buf->b_udf_c_type,
    797      1.1  reinoud 			buf->b_resid, buf->b_bcount, buf->b_bufsize));
    798      1.1  reinoud 		/* if we have FIDs fixup using buffer's sector number(s) */
                          		/*
                          		 * UDF_C_FIDS is never routed to this queue by the selection
                          		 * above, hence the panic; the fixup code is disabled.
                          		 */
    799      1.1  reinoud 		if (buf->b_udf_c_type == UDF_C_FIDS) {
    800      1.1  reinoud 			panic("UDF_C_FIDS in SHED_WRITING!\n");
    801      1.1  reinoud #if 0
    802      1.1  reinoud 			buf_len = buf->b_bcount;
    803      1.1  reinoud 			sectornr = our_sectornr;
    804      1.1  reinoud 			bpos = 0;
    805      1.1  reinoud 			while (buf_len) {
    806      1.1  reinoud 				len = MIN(buf_len, sector_size);
    807      1.1  reinoud 				fidblk = (uint8_t *) buf->b_data + bpos;
    808      1.1  reinoud 				udf_fixup_fid_block(fidblk, sector_size,
    809      1.1  reinoud 					0, len, sectornr);
    810      1.1  reinoud 				sectornr++;
    811      1.1  reinoud 				bpos += len;
    812      1.1  reinoud 				buf_len -= len;
    813      1.1  reinoud 			}
    814      1.1  reinoud #endif
    815      1.1  reinoud 		}
    816      1.1  reinoud 		udf_fixup_node_internals(ump, buf->b_data, buf->b_udf_c_type);
    817      1.1  reinoud 
    818      1.1  reinoud 		/* copy parts into the bufs and set for writing */
    819      1.1  reinoud 		buf_len = buf->b_bcount;
    820      1.1  reinoud 		sectornr = our_sectornr;
    821      1.1  reinoud 		eccline = udf_geteccline(ump, sectornr, 0);
    822      1.1  reinoud 		eccsect = sectornr - eccline->start_sector;
    823      1.1  reinoud 		bpos = 0;
    824      1.1  reinoud 		while (buf_len) {
    825      1.1  reinoud 			len = MIN(buf_len, sector_size);
                          			/* ran off the end of this eccline; move to the next */
    826      1.1  reinoud 			if (eccsect == ump->packet_size) {
    827      1.1  reinoud 				udf_puteccline(eccline);
    828      1.1  reinoud 				eccline = udf_geteccline(ump, sectornr, 0);
    829      1.1  reinoud 				eccsect = sectornr - eccline->start_sector;
    830      1.1  reinoud 			}
    831      1.1  reinoud 			bit = (uint64_t) 1 << eccsect;
    832      1.1  reinoud 			KASSERT((eccline->readin & bit) == 0);
    833      1.1  reinoud 			eccline->present |= bit;
    834      1.1  reinoud 			eccline->dirty   |= bit;
    835      1.1  reinoud 			if (eccline->bufs[eccsect]) {
    836      1.1  reinoud 				/* old callback still pending */
    837      1.1  reinoud 				nestiobuf_done(eccline->bufs[eccsect],
    838      1.1  reinoud 						eccline->bufs_len[eccsect],
    839      1.1  reinoud 						0);
    840      1.1  reinoud 				eccline->bufs[eccsect] = NULL;
    841      1.1  reinoud 			}
    842      1.1  reinoud 
                          			/* a short last piece is zero padded to a full sector */
    843      1.2  reinoud 			src = (uint8_t *) buf->b_data + bpos;
    844      1.2  reinoud 			dst = (uint8_t *) eccline->blob + eccsect * sector_size;
    845      1.2  reinoud 			if (len != sector_size)
    846      1.2  reinoud 				memset(dst, 0, sector_size);
    847      1.2  reinoud 			memcpy(dst, src, len);
    848      1.2  reinoud 
    849      1.1  reinoud 			/* note that it's finished for this extent */
    850      1.1  reinoud 			eccline->bufs[eccsect] = NULL;
    851      1.1  reinoud 			nestiobuf_done(buf, len, 0);
    852      1.1  reinoud 
    853      1.1  reinoud 			bpos += sector_size;
    854      1.1  reinoud 			eccsect++;
    855      1.1  reinoud 			sectornr++;
    856      1.1  reinoud 			buf_len -= len;
    857      1.1  reinoud 		}
    858      1.1  reinoud 		udf_puteccline(eccline);
    859      1.1  reinoud 		return;
    860      1.1  reinoud 
    861      1.1  reinoud 	}
    862      1.1  reinoud 
    863      1.1  reinoud 	/* sequential writing */
    864      1.1  reinoud 	KASSERT(queue == UDF_SHED_SEQWRITING);
    865      1.3  reinoud 	DPRINTF(SHEDULE, ("\nudf_queuebuf_rmw SEQWRITE %p : sector XXXX "
    866      1.1  reinoud 		"type %d, b_resid %d, b_bcount %d, b_bufsize %d\n",
    867      1.1  reinoud 		buf, buf->b_udf_c_type, buf->b_resid, buf->b_bcount,
    868      1.1  reinoud 		buf->b_bufsize));
    869      1.1  reinoud 	/*
    870      1.1  reinoud 	 * Buffers should not have been allocated to disc addresses yet on
    871      1.1  reinoud 	 * this queue. Note that a buffer can get multiple extents allocated.
    872      1.1  reinoud 	 * Note that it *looks* like the normal writing but it's different in
    873      1.1  reinoud 	 * the details.
    874      1.1  reinoud 	 *
    875      1.6  reinoud 	 * lmapping contains lb_num relative to base partition.
    876      1.6  reinoud 	 *
    877      1.6  reinoud 	 * XXX should we try to claim/organize the allocated memory to
    878      1.6  reinoud 	 * block-aligned pieces?
    879      1.1  reinoud 	 */
    880      1.1  reinoud 	mutex_enter(&priv->seqwrite_mutex);
    881      1.1  reinoud 
                          	/* scratch arrays kept in the mount structure */
    882      1.1  reinoud 	lmapping    = ump->la_lmapping;
    883      1.1  reinoud 	node_ad_cpy = ump->la_node_ad_cpy;
    884      1.1  reinoud 
    885      1.6  reinoud 	/* logically allocate buf and map it in the file */
    886      1.6  reinoud 	udf_late_allocate_buf(ump, buf, lmapping, node_ad_cpy, &vpart_num);
    887      1.1  reinoud 
    888      1.1  reinoud 	/* if we have FIDs, fixup using the new allocation table */
    889      1.1  reinoud 	if (buf->b_udf_c_type == UDF_C_FIDS) {
    890      1.1  reinoud 		buf_len = buf->b_bcount;
    891      1.1  reinoud 		bpos = 0;
    892      1.1  reinoud 		lmappos = lmapping;
    893      1.1  reinoud 		while (buf_len) {
                          			/* one lmapping entry per sector; stored into a 32 bit var */
    894      1.1  reinoud 			sectornr = *lmappos++;
    895      1.1  reinoud 			len = MIN(buf_len, sector_size);
    896      1.1  reinoud 			fidblk = (uint8_t *) buf->b_data + bpos;
    897      1.1  reinoud 			udf_fixup_fid_block(fidblk, sector_size,
    898      1.1  reinoud 				0, len, sectornr);
    899      1.1  reinoud 			bpos += len;
    900      1.1  reinoud 			buf_len -= len;
    901      1.1  reinoud 		}
    902      1.1  reinoud 	}
    903      1.6  reinoud 	if (buf->b_udf_c_type == UDF_C_METADATA_SBM) {
    904      1.6  reinoud 		if (buf->b_lblkno == 0) {
    905      1.6  reinoud 			/* update the tag location inside */
    906      1.6  reinoud 			tag = (struct desc_tag *) buf->b_data;
    907      1.7  reinoud 			tag->tag_loc = udf_rw32(*lmapping);
    908      1.6  reinoud 			udf_validate_tag_and_crc_sums(buf->b_data);
    909      1.6  reinoud 		}
    910      1.6  reinoud 	}
    911      1.1  reinoud 	udf_fixup_node_internals(ump, buf->b_data, buf->b_udf_c_type);
    912      1.1  reinoud 
    913      1.6  reinoud 	/*
    914      1.6  reinoud 	 * Translate new mappings in lmapping to pmappings.
    915      1.6  reinoud 	 * pmapping to contain lb_nums as used for disc addressing.
    916      1.6  reinoud 	 */
    917      1.6  reinoud 	pmapping = ump->la_pmapping;
                          	/* number of sectors covered by the buf, rounded up */
    918      1.6  reinoud 	sectors  = (buf->b_bcount + sector_size -1) / sector_size;
    919      1.6  reinoud 	udf_translate_vtop_list(ump, sectors, vpart_num, lmapping, pmapping);
    920      1.6  reinoud 
    921      1.1  reinoud 	/* copy parts into the bufs and set for writing */
    922      1.1  reinoud 	pmappos = pmapping;
    923      1.1  reinoud 	buf_len = buf->b_bcount;
    924      1.1  reinoud 	sectornr = *pmappos++;
    925      1.1  reinoud 	eccline = udf_geteccline(ump, sectornr, ECC_SEQWRITING);
    926      1.1  reinoud 	eccsect = sectornr - eccline->start_sector;
    927      1.1  reinoud 	bpos = 0;
    928      1.1  reinoud 	while (buf_len) {
    929      1.1  reinoud 		len = MIN(buf_len, sector_size);
                          		/*
                          		 * sectornr comes from pmapping, so the offset is recomputed
                          		 * every round and the eccline is swapped whenever the sector
                          		 * lies outside the current one
                          		 */
    930      1.1  reinoud 		eccsect = sectornr - eccline->start_sector;
    931      1.1  reinoud 		if ((eccsect < 0) || (eccsect >= ump->packet_size)) {
    932      1.1  reinoud 			eccline->flags |= ECC_SEQWRITING;
    933      1.1  reinoud 			udf_puteccline(eccline);
    934      1.1  reinoud 			eccline = udf_geteccline(ump, sectornr, ECC_SEQWRITING);
    935      1.1  reinoud 			eccsect = sectornr - eccline->start_sector;
    936      1.1  reinoud 		}
    937      1.1  reinoud 		bit = (uint64_t) 1 << eccsect;
    938      1.1  reinoud 		KASSERT((eccline->readin & bit) == 0);
    939      1.1  reinoud 		eccline->present |= bit;
    940      1.1  reinoud 		eccline->dirty   |= bit;
    941      1.1  reinoud 		eccline->bufs[eccsect] = NULL;
    942      1.1  reinoud 
                          		/* a short last piece is zero padded to a full sector */
    943      1.1  reinoud 		src = (uint8_t *) buf->b_data + bpos;
    944      1.1  reinoud 		dst = (uint8_t *)
    945      1.1  reinoud 			eccline->blob + eccsect * sector_size;
    946      1.1  reinoud 		if (len != sector_size)
    947      1.1  reinoud 			memset(dst, 0, sector_size);
    948      1.1  reinoud 		memcpy(dst, src, len);
    949      1.1  reinoud 
    950      1.1  reinoud 		/* note that it's finished for this extent */
    951      1.1  reinoud 		nestiobuf_done(buf, len, 0);
    952      1.1  reinoud 
    953      1.1  reinoud 		bpos += sector_size;
                          		/*
                          		 * NOTE(review): on the last round this also fetches the entry
                          		 * following the final mapped sector. The value is not used, but
                          		 * confirm that la_pmapping has room for that extra read.
                          		 */
    954      1.1  reinoud 		sectornr = *pmappos++;
    955      1.1  reinoud 		buf_len -= len;
    956      1.1  reinoud 	}
    957      1.1  reinoud 	eccline->flags |= ECC_SEQWRITING;
    958      1.1  reinoud 	udf_puteccline(eccline);
    959      1.1  reinoud 	mutex_exit(&priv->seqwrite_mutex);
    960      1.1  reinoud }
    961      1.1  reinoud 
    962      1.1  reinoud /* --------------------------------------------------------------------- */
    963      1.1  reinoud 
    964      1.1  reinoud static void
    965      1.1  reinoud udf_shedule_read_callback(struct buf *buf)
    966      1.1  reinoud {
                          	/*
                          	 * Completion handler for an eccline read; udf_issue_eccline()
                          	 * installs it as the buf's b_iodone. Every sector that was not yet
                          	 * present is flagged present (and flagged in `error' when the read
                          	 * failed). A buf parked in that sector's slot receives the data
                          	 * and is completed with the read's error status. The eccline is
                          	 * then handed back with udf_puteccline().
                          	 */
    967      1.1  reinoud 	struct udf_eccline *eccline = BTOE(buf);
    968      1.1  reinoud 	struct udf_mount *ump = eccline->ump;
    969      1.1  reinoud 	uint64_t bit;
    970      1.1  reinoud 	uint8_t *src, *dst;
    971      1.1  reinoud 	int sector_size = ump->discinfo.sector_size;
    972      1.1  reinoud 	int error, i, len;
    973      1.1  reinoud 
    974      1.3  reinoud 	DPRINTF(ECCLINE, ("read callback called\n"));
    975      1.1  reinoud 	/* post process read action */
    976      1.1  reinoud 	error = buf->b_error;
    977      1.1  reinoud 	for (i = 0; i < ump->packet_size; i++) {
    978      1.1  reinoud 		bit = (uint64_t) 1 << i;
    979      1.1  reinoud 		src = (uint8_t *) buf->b_data +   i * sector_size;
                          		/* this value of dst is replaced before its only use below */
    980      1.1  reinoud 		dst = (uint8_t *) eccline->blob + i * sector_size;
                          		/* sectors that were already present are left untouched */
    981      1.1  reinoud 		if (eccline->present & bit)
    982      1.1  reinoud 			continue;
                          		/* flagged present even on failure; `error' records the failure */
    983      1.8  reinoud 		eccline->present |= bit;
    984      1.8  reinoud 		if (error)
    985      1.1  reinoud 			eccline->error |= bit;
    986      1.1  reinoud 		if (eccline->bufs[i]) {
                          			/* hand the sector to the waiting buf and complete it */
    987      1.1  reinoud 			dst = (uint8_t *) eccline->bufs[i]->b_data +
    988      1.1  reinoud 				eccline->bufs_bpos[i];
    989      1.1  reinoud 			len = eccline->bufs_len[i];
    990      1.1  reinoud 			if (!error)
    991      1.1  reinoud 				memcpy(dst, src, len);
    992      1.1  reinoud 			nestiobuf_done(eccline->bufs[i], len, error);
    993      1.1  reinoud 			eccline->bufs[i] = NULL;
    994      1.1  reinoud 		}
    995      1.1  reinoud 
    996      1.1  reinoud 	}
                          	/* the read went straight into the blob and the line is now complete */
    997      1.1  reinoud 	KASSERT(buf->b_data == eccline->blob);
    998      1.1  reinoud 	KASSERT(eccline->present == ((uint64_t) 1 << ump->packet_size)-1);
    999      1.1  reinoud 
   1000      1.1  reinoud 	/*
   1001      1.1  reinoud 	 * XXX TODO what to do on read errors? read in all sectors
   1002      1.1  reinoud 	 * synchronously and allocate a sparable entry?
   1003      1.1  reinoud 	 */
   1004      1.1  reinoud 
   1005      1.1  reinoud 	udf_puteccline(eccline);
   1006      1.3  reinoud 	DPRINTF(ECCLINE, ("read callback finished\n"));
   1007      1.1  reinoud }
   1008      1.1  reinoud 
   1009      1.1  reinoud 
   1010      1.1  reinoud static void
   1011      1.1  reinoud udf_shedule_write_callback(struct buf *buf)
   1012      1.1  reinoud {
                          	/*
                          	 * Completion handler for an eccline write; udf_issue_eccline()
                          	 * installs it as the buf's b_iodone. For every dirty sector the
                          	 * dirty bit is cleared on success, or the error bit is set on
                          	 * failure, and any buf parked in that sector's slot is completed
                          	 * with the write's error status. The eccline is then handed back
                          	 * with udf_puteccline().
                          	 */
   1013      1.1  reinoud 	struct udf_eccline *eccline = BTOE(buf);
   1014      1.1  reinoud 	struct udf_mount *ump = eccline->ump;
   1015      1.1  reinoud 	uint64_t bit;
   1016      1.1  reinoud 	int error, i, len;
   1017      1.1  reinoud 
   1018      1.3  reinoud 	DPRINTF(ECCLINE, ("write callback called\n"));
   1019      1.1  reinoud 	/* post process write action */
   1020      1.1  reinoud 	error = buf->b_error;
   1021      1.1  reinoud 	for (i = 0; i < ump->packet_size; i++) {
   1022      1.1  reinoud 		bit = (uint64_t) 1 << i;
                          		/* only sectors that were dirty need post processing */
   1023      1.1  reinoud 		if ((eccline->dirty & bit) == 0)
   1024      1.1  reinoud 			continue;
   1025      1.1  reinoud 		if (error) {
                          			/* the sector stays dirty when the write failed */
   1026      1.1  reinoud 			eccline->error |= bit;
   1027      1.1  reinoud 		} else {
   1028      1.1  reinoud 			eccline->dirty &= ~bit;
   1029      1.1  reinoud 		}
   1030      1.1  reinoud 		if (eccline->bufs[i]) {
   1031      1.1  reinoud 			len = eccline->bufs_len[i];
   1032      1.1  reinoud 			nestiobuf_done(eccline->bufs[i], len, error);
   1033      1.1  reinoud 			eccline->bufs[i] = NULL;
   1034      1.1  reinoud 		}
   1035      1.1  reinoud 	}
                          	/*
                          	 * Write errors are not handled yet (see the TODO below). A failed
                          	 * write leaves its dirty bits set, so in that case the first
                          	 * assertion fires before the explicit check on error.
                          	 */
   1036      1.1  reinoud 	KASSERT(eccline->dirty == 0);
   1037      1.1  reinoud 
   1038      1.1  reinoud 	KASSERT(error == 0);
   1039      1.1  reinoud 	/*
   1040  1.9.4.4      snj 	 * XXX TODO on write errors allocate a sparable entry and reissue
   1041      1.1  reinoud 	 */
   1042      1.1  reinoud 
   1043      1.1  reinoud 	udf_puteccline(eccline);
   1044      1.1  reinoud }
   1045      1.1  reinoud 
   1046      1.1  reinoud 
   1047      1.1  reinoud static void
   1048      1.1  reinoud udf_issue_eccline(struct udf_eccline *eccline, int queued_on)
   1049      1.1  reinoud {
                          	/*
                          	 * Start device I/O for an eccline that was taken from the queue
                          	 * `queued_on'.
                          	 *
                          	 *  - UDF_SHED_READING: read every sector that is not yet present.
                          	 *    If nothing is present the whole line is read with one buf;
                          	 *    otherwise one nested buf is issued per missing sector.
                          	 *  - any other queue (write or seqwrite): an incomplete line is
                          	 *    pushed onto the reading queue instead; a complete line is
                          	 *    written out as a whole.
                          	 *
                          	 * udf_discstrat_thread() calls this with priv->discstrat_mutex
                          	 * held; the mutex is dropped around the whole-line VOP_STRATEGY()
                          	 * call at the bottom.
                          	 */
   1050      1.1  reinoud 	struct udf_mount *ump = eccline->ump;
   1051      1.1  reinoud 	struct strat_private *priv = PRIV(ump);
   1052      1.1  reinoud 	struct buf *buf, *nestbuf;
                          	/* allbits: one bit set for each sector of the eccline */
   1053      1.1  reinoud 	uint64_t bit, allbits = ((uint64_t) 1 << ump->packet_size)-1;
   1054      1.1  reinoud 	uint32_t start;
   1055      1.1  reinoud 	int sector_size = ump->discinfo.sector_size;
   1056      1.1  reinoud 	int blks = sector_size / DEV_BSIZE;
   1057      1.1  reinoud 	int i;
   1058      1.1  reinoud 
   1059      1.1  reinoud 	if (queued_on == UDF_SHED_READING) {
   1060      1.3  reinoud 		DPRINTF(SHEDULE, ("udf_issue_eccline reading : "));
   1061      1.1  reinoud 		/* read all bits that are not yet present */
   1062      1.1  reinoud 		eccline->readin = (~eccline->present) & allbits;
   1063      1.1  reinoud 		KASSERT(eccline->readin);
   1064      1.1  reinoud 		start = eccline->start_sector;
                          		/* set up the eccline's own buf to cover the whole line */
   1065      1.1  reinoud 		buf = eccline->buf;
   1066      1.1  reinoud 		buf->b_flags    = B_READ | B_ASYNC;
   1067      1.4  reinoud 		SET(buf->b_cflags, BC_BUSY);	/* mark buffer busy */
   1068      1.1  reinoud 		buf->b_oflags   = 0;
   1069      1.1  reinoud 		buf->b_iodone   = udf_shedule_read_callback;
   1070      1.1  reinoud 		buf->b_data     = eccline->blob;
   1071      1.1  reinoud 		buf->b_bcount   = ump->packet_size * sector_size;
   1072      1.1  reinoud 		buf->b_resid    = buf->b_bcount;
   1073      1.1  reinoud 		buf->b_bufsize  = buf->b_bcount;
   1074      1.1  reinoud 		buf->b_private  = eccline;
   1075      1.1  reinoud 		BIO_SETPRIO(buf, BPRIO_DEFAULT);
   1076      1.1  reinoud 		buf->b_lblkno   = buf->b_blkno = buf->b_rawblkno = start * blks;
   1077      1.1  reinoud 		buf->b_proc     = NULL;
   1078      1.1  reinoud 
                          		/*
                          		 * Part of the line is already present: account present
                          		 * sectors as done on the master buf and read each missing
                          		 * sector through its own nested buf.
                          		 */
   1079      1.1  reinoud 		if (eccline->present != 0) {
   1080      1.1  reinoud 			for (i = 0; i < ump->packet_size; i++) {
   1081      1.1  reinoud 				bit = (uint64_t) 1 << i;
   1082      1.1  reinoud 				if (eccline->present & bit) {
   1083      1.1  reinoud 					nestiobuf_done(buf, sector_size, 0);
   1084      1.1  reinoud 					continue;
   1085      1.1  reinoud 				}
   1086      1.1  reinoud 				nestbuf = getiobuf(NULL, true);
   1087      1.1  reinoud 				nestiobuf_setup(buf, nestbuf, i * sector_size,
   1088      1.1  reinoud 					sector_size);
   1089      1.1  reinoud 				/* adjust blocknumber to read */
   1090      1.1  reinoud 				nestbuf->b_blkno = buf->b_blkno + i*blks;
   1091      1.1  reinoud 				nestbuf->b_rawblkno = buf->b_rawblkno + i*blks;
   1092      1.1  reinoud 
   1093      1.3  reinoud 				DPRINTF(SHEDULE, ("sector %d ",
   1094      1.3  reinoud 					start + i));
   1095      1.1  reinoud 				/* call asynchronous */
   1096      1.1  reinoud 				VOP_STRATEGY(ump->devvp, nestbuf);
   1097      1.1  reinoud 			}
   1098      1.3  reinoud 			DPRINTF(SHEDULE, ("\n"));
                          			/*
                          			 * NOTE(review): this path returns here, so its
                          			 * VOP_STRATEGY() calls are made without the
                          			 * mutex_exit()/mutex_enter() pair used below -- confirm
                          			 * that is intended.
                          			 */
   1099      1.1  reinoud 			return;
   1100      1.1  reinoud 		}
   1101      1.1  reinoud 	} else {
   1102      1.1  reinoud 		/* write or seqwrite */
   1103      1.3  reinoud 		DPRINTF(SHEDULE, ("udf_issue_eccline writing or seqwriting : "));
   1104  1.9.4.4      snj 		DPRINTF(SHEDULE, ("\n\tpresent %"PRIx64", readin %"PRIx64", "
   1105  1.9.4.4      snj 			"dirty %"PRIx64"\n\t", eccline->present, eccline->readin,
   1106  1.9.4.4      snj 			eccline->dirty));
   1107      1.1  reinoud 		if (eccline->present != allbits) {
   1108      1.1  reinoud 			/* requeue to read-only */
   1109      1.3  reinoud 			DPRINTF(SHEDULE, ("\n\t-> not complete, requeue to "
   1110      1.3  reinoud 				"reading\n"));
   1111      1.1  reinoud 			udf_push_eccline(eccline, UDF_SHED_READING);
   1112      1.1  reinoud 			return;
   1113      1.1  reinoud 		}
   1114      1.1  reinoud 		start = eccline->start_sector;
                          		/* set up the eccline's own buf to write the whole line */
   1115      1.1  reinoud 		buf = eccline->buf;
   1116      1.1  reinoud 		buf->b_flags    = B_WRITE | B_ASYNC;
   1117      1.4  reinoud 		SET(buf->b_cflags, BC_BUSY);	/* mark buffer busy */
   1118      1.1  reinoud 		buf->b_oflags   = 0;
   1119      1.1  reinoud 		buf->b_iodone   = udf_shedule_write_callback;
   1120      1.1  reinoud 		buf->b_data     = eccline->blob;
   1121      1.1  reinoud 		buf->b_bcount   = ump->packet_size * sector_size;
   1122      1.1  reinoud 		buf->b_resid    = buf->b_bcount;
   1123      1.1  reinoud 		buf->b_bufsize  = buf->b_bcount;
   1124      1.1  reinoud 		buf->b_private  = eccline;
   1125      1.1  reinoud 		BIO_SETPRIO(buf, BPRIO_DEFAULT);
   1126      1.1  reinoud 		buf->b_lblkno   = buf->b_blkno = buf->b_rawblkno = start * blks;
   1127      1.1  reinoud 		buf->b_proc     = NULL;
   1128      1.1  reinoud 	}
   1129      1.1  reinoud 
                          	/* whole-line read or write: issue it with the mutex released */
   1130      1.1  reinoud 	mutex_exit(&priv->discstrat_mutex);
   1131      1.1  reinoud 		/* call asynchronous */
   1132      1.3  reinoud 		DPRINTF(SHEDULE, ("sector %d for %d\n",
   1133      1.3  reinoud 			start, ump->packet_size));
   1134      1.1  reinoud 		VOP_STRATEGY(ump->devvp, buf);
   1135      1.1  reinoud 	mutex_enter(&priv->discstrat_mutex);
   1136      1.1  reinoud }
   1137      1.1  reinoud 
   1138      1.1  reinoud 
   1139      1.1  reinoud static void
   1140      1.1  reinoud udf_discstrat_thread(void *arg)
   1141      1.1  reinoud {
   1142      1.1  reinoud 	struct udf_mount *ump = (struct udf_mount *) arg;
   1143      1.1  reinoud 	struct strat_private *priv = PRIV(ump);
   1144      1.1  reinoud 	struct udf_eccline *eccline;
   1145      1.1  reinoud 	struct timespec now, *last;
   1146  1.9.4.2      snj 	uint64_t allbits = ((uint64_t) 1 << ump->packet_size)-1;
   1147  1.9.4.2      snj 	int new_queue, wait, work, num, cnt;
   1148      1.1  reinoud 
   1149      1.1  reinoud 	work = 1;
   1150  1.9.4.4      snj 	priv->thread_running = 1;
   1151      1.1  reinoud 	mutex_enter(&priv->discstrat_mutex);
   1152      1.1  reinoud 	priv->num_floating = 0;
   1153      1.1  reinoud 	while (priv->run_thread || work || priv->num_floating) {
   1154  1.9.4.2      snj 		/* get our time */
   1155  1.9.4.2      snj 		vfs_timestamp(&now);
   1156  1.9.4.2      snj 
   1157  1.9.4.2      snj 		/* maintenance: handle eccline state machine */
   1158  1.9.4.2      snj 		num = priv->num_queued[UDF_SHED_WAITING];
   1159  1.9.4.2      snj 		cnt = 0;
   1160  1.9.4.2      snj 		while (cnt < num) {
   1161  1.9.4.2      snj 			eccline = udf_pop_eccline(priv, UDF_SHED_WAITING);
   1162  1.9.4.2      snj 			/* requeue */
   1163  1.9.4.2      snj 			new_queue = UDF_SHED_FREE;
   1164  1.9.4.2      snj 			if (eccline->refcnt > 0)
   1165  1.9.4.2      snj 				new_queue = UDF_SHED_IDLE;
   1166  1.9.4.2      snj 			if (eccline->flags & ECC_WANTED)
   1167  1.9.4.2      snj 				new_queue = UDF_SHED_IDLE;
   1168  1.9.4.2      snj 			if (eccline->readin)
   1169  1.9.4.2      snj 				new_queue = UDF_SHED_READING;
   1170  1.9.4.2      snj 			if (eccline->dirty) {
   1171  1.9.4.2      snj 				new_queue = UDF_SHED_WAITING;
   1172  1.9.4.4      snj 				if ((eccline->wait_time.tv_sec - now.tv_sec <= 0) ||
   1173  1.9.4.4      snj 				   ((eccline->present == allbits) &&
   1174  1.9.4.4      snj 				    (eccline->flags & ECC_SEQWRITING)))
   1175  1.9.4.4      snj 				{
   1176  1.9.4.2      snj 					new_queue = UDF_SHED_WRITING;
   1177  1.9.4.2      snj 					if (eccline->flags & ECC_SEQWRITING)
   1178  1.9.4.2      snj 						new_queue = UDF_SHED_SEQWRITING;
   1179  1.9.4.2      snj 					if (eccline->present != allbits)
   1180  1.9.4.2      snj 						new_queue = UDF_SHED_READING;
   1181  1.9.4.2      snj 				}
   1182  1.9.4.2      snj 			}
   1183  1.9.4.2      snj 			udf_push_eccline(eccline, new_queue);
   1184  1.9.4.2      snj 			cnt++;
   1185  1.9.4.2      snj 		}
   1186  1.9.4.2      snj 
   1187      1.1  reinoud 		/* maintenance: free excess ecclines */
   1188      1.1  reinoud 		while (priv->num_queued[UDF_SHED_FREE] > UDF_ECCLINE_MAXFREE) {
   1189      1.1  reinoud 			eccline = udf_pop_eccline(priv, UDF_SHED_FREE);
   1190      1.1  reinoud 			KASSERT(eccline);
   1191      1.1  reinoud 			KASSERT(eccline->refcnt == 0);
   1192  1.9.4.2      snj 			if (eccline->flags & ECC_WANTED) {
   1193  1.9.4.2      snj 				udf_push_eccline(eccline, UDF_SHED_IDLE);
   1194  1.9.4.2      snj 				DPRINTF(ECCLINE, ("Tried removing, pushed back to free list\n"));
   1195  1.9.4.2      snj 			} else {
   1196  1.9.4.2      snj 				DPRINTF(ECCLINE, ("Removing entry from free list\n"));
   1197  1.9.4.2      snj 				udf_dispose_eccline(eccline);
   1198  1.9.4.2      snj 			}
   1199      1.1  reinoud 		}
   1200      1.1  reinoud 
   1201  1.9.4.2      snj 		/* process the current selected queue */
   1202      1.1  reinoud 		/* get our time */
   1203      1.1  reinoud 		vfs_timestamp(&now);
   1204      1.1  reinoud 		last = &priv->last_queued[priv->cur_queue];
   1205      1.1  reinoud 
   1206      1.1  reinoud 		/* get our line */
   1207      1.1  reinoud 		eccline = udf_pop_eccline(priv, priv->cur_queue);
   1208      1.1  reinoud 		if (eccline) {
   1209      1.1  reinoud 			wait = 0;
   1210      1.1  reinoud 			new_queue = priv->cur_queue;
   1211      1.3  reinoud 			DPRINTF(ECCLINE, ("UDF_ISSUE_ECCLINE\n"));
   1212      1.1  reinoud 
   1213      1.1  reinoud 			/* complete the `get' by locking and refcounting it */
   1214      1.1  reinoud 			UDF_LOCK_ECCLINE(eccline);
   1215      1.1  reinoud 			eccline->refcnt++;
   1216      1.1  reinoud 
   1217      1.1  reinoud 			udf_issue_eccline(eccline, priv->cur_queue);
   1218      1.1  reinoud 		} else {
   1219  1.9.4.4      snj 			/* don't switch too quickly */
   1220  1.9.4.4      snj 			if (now.tv_sec - last->tv_sec < 2) {
   1221  1.9.4.4      snj 				/* wait some time */
   1222  1.9.4.4      snj 				cv_timedwait(&priv->discstrat_cv,
   1223  1.9.4.4      snj 					&priv->discstrat_mutex, hz);
   1224  1.9.4.4      snj 				/* we assume there is work to be done */
   1225  1.9.4.4      snj 				work = 1;
   1226  1.9.4.4      snj 				continue;
   1227  1.9.4.4      snj 			}
   1228  1.9.4.4      snj 
   1229  1.9.4.4      snj 			/* XXX select on queue lengths ? */
   1230      1.1  reinoud 			wait = 1;
   1231      1.1  reinoud 			/* check if we can/should switch */
   1232      1.1  reinoud 			new_queue = priv->cur_queue;
   1233      1.1  reinoud 			if (BUFQ_PEEK(priv->queues[UDF_SHED_READING]))
   1234      1.1  reinoud 				new_queue = UDF_SHED_READING;
   1235      1.1  reinoud 			if (BUFQ_PEEK(priv->queues[UDF_SHED_WRITING]))
   1236      1.1  reinoud 				new_queue = UDF_SHED_WRITING;
   1237      1.1  reinoud 			if (BUFQ_PEEK(priv->queues[UDF_SHED_SEQWRITING]))
   1238      1.1  reinoud 				new_queue = UDF_SHED_SEQWRITING;
   1239      1.1  reinoud 		}
   1240      1.1  reinoud 
   1241      1.1  reinoud 		/* give room */
   1242      1.1  reinoud 		mutex_exit(&priv->discstrat_mutex);
   1243      1.1  reinoud 
   1244      1.1  reinoud 		if (new_queue != priv->cur_queue) {
   1245      1.1  reinoud 			wait = 0;
   1246      1.1  reinoud 			DPRINTF(SHEDULE, ("switching from %d to %d\n",
   1247      1.1  reinoud 				priv->cur_queue, new_queue));
   1248      1.1  reinoud 			priv->cur_queue = new_queue;
   1249      1.1  reinoud 		}
   1250      1.1  reinoud 		mutex_enter(&priv->discstrat_mutex);
   1251      1.1  reinoud 
   1252      1.1  reinoud 		/* wait for more if needed */
   1253      1.1  reinoud 		if (wait)
   1254      1.1  reinoud 			cv_timedwait(&priv->discstrat_cv,
   1255  1.9.4.4      snj 				&priv->discstrat_mutex, hz/4);	/* /8 */
   1256      1.1  reinoud 
   1257  1.9.4.2      snj 		work  = (BUFQ_PEEK(priv->queues[UDF_SHED_WAITING]) != NULL);
   1258  1.9.4.2      snj 		work |= (BUFQ_PEEK(priv->queues[UDF_SHED_READING]) != NULL);
   1259      1.1  reinoud 		work |= (BUFQ_PEEK(priv->queues[UDF_SHED_WRITING]) != NULL);
   1260      1.1  reinoud 		work |= (BUFQ_PEEK(priv->queues[UDF_SHED_SEQWRITING]) != NULL);
   1261      1.1  reinoud 
   1262      1.1  reinoud 		DPRINTF(PARANOIA, ("work : (%d, %d, %d) -> work %d, float %d\n",
   1263      1.1  reinoud 			(BUFQ_PEEK(priv->queues[UDF_SHED_READING]) != NULL),
   1264      1.1  reinoud 			(BUFQ_PEEK(priv->queues[UDF_SHED_WRITING]) != NULL),
   1265      1.1  reinoud 			(BUFQ_PEEK(priv->queues[UDF_SHED_SEQWRITING]) != NULL),
   1266      1.1  reinoud 			work, priv->num_floating));
   1267      1.1  reinoud 	}
   1268      1.1  reinoud 
   1269      1.1  reinoud 	mutex_exit(&priv->discstrat_mutex);
   1270      1.1  reinoud 
   1271      1.1  reinoud 	/* tear down remaining ecclines */
   1272      1.1  reinoud 	mutex_enter(&priv->discstrat_mutex);
   1273  1.9.4.2      snj 	KASSERT(priv->num_queued[UDF_SHED_WAITING] == 0);
   1274      1.1  reinoud 	KASSERT(priv->num_queued[UDF_SHED_IDLE] == 0);
   1275      1.1  reinoud 	KASSERT(priv->num_queued[UDF_SHED_READING] == 0);
   1276      1.1  reinoud 	KASSERT(priv->num_queued[UDF_SHED_WRITING] == 0);
   1277      1.1  reinoud 	KASSERT(priv->num_queued[UDF_SHED_SEQWRITING] == 0);
   1278      1.1  reinoud 
   1279  1.9.4.2      snj 	KASSERT(BUFQ_PEEK(priv->queues[UDF_SHED_WAITING]) == NULL);
   1280      1.1  reinoud 	KASSERT(BUFQ_PEEK(priv->queues[UDF_SHED_IDLE]) == NULL);
   1281      1.1  reinoud 	KASSERT(BUFQ_PEEK(priv->queues[UDF_SHED_READING]) == NULL);
   1282      1.1  reinoud 	KASSERT(BUFQ_PEEK(priv->queues[UDF_SHED_WRITING]) == NULL);
   1283      1.1  reinoud 	KASSERT(BUFQ_PEEK(priv->queues[UDF_SHED_SEQWRITING]) == NULL);
   1284      1.1  reinoud 	eccline = udf_pop_eccline(priv, UDF_SHED_FREE);
   1285      1.1  reinoud 	while (eccline) {
   1286      1.1  reinoud 		udf_dispose_eccline(eccline);
   1287      1.1  reinoud 		eccline = udf_pop_eccline(priv, UDF_SHED_FREE);
   1288      1.1  reinoud 	}
   1289      1.1  reinoud 	KASSERT(priv->num_queued[UDF_SHED_FREE] == 0);
   1290      1.1  reinoud 	mutex_exit(&priv->discstrat_mutex);
   1291      1.1  reinoud 
   1292  1.9.4.4      snj 	priv->thread_running  = 0;
   1293      1.1  reinoud 	priv->thread_finished = 1;
   1294      1.1  reinoud 	wakeup(&priv->run_thread);
   1295      1.1  reinoud 	kthread_exit(0);
   1296      1.1  reinoud 	/* not reached */
   1297      1.1  reinoud }
   1298      1.1  reinoud 
   1299      1.1  reinoud /* --------------------------------------------------------------------- */
   1300      1.1  reinoud 
   1301      1.1  reinoud /*
   1302      1.1  reinoud  * Buffer memory pool allocator.
   1303      1.1  reinoud  */
   1304      1.1  reinoud 
   1305      1.1  reinoud static void *
   1306      1.1  reinoud ecclinepool_page_alloc(struct pool *pp, int flags)
   1307      1.1  reinoud {
   1308      1.1  reinoud         return (void *)uvm_km_alloc(kernel_map,
   1309      1.1  reinoud             MAXBSIZE, MAXBSIZE,
   1310      1.1  reinoud             ((flags & PR_WAITOK) ? 0 : UVM_KMF_NOWAIT | UVM_KMF_TRYLOCK)
   1311      1.1  reinoud 	    	| UVM_KMF_WIRED /* UVM_KMF_PAGABLE? */);
   1312      1.1  reinoud }
   1313      1.1  reinoud 
   1314      1.1  reinoud static void
   1315      1.1  reinoud ecclinepool_page_free(struct pool *pp, void *v)
   1316      1.1  reinoud {
   1317      1.1  reinoud         uvm_km_free(kernel_map, (vaddr_t)v, MAXBSIZE, UVM_KMF_WIRED);
   1318      1.1  reinoud }
   1319      1.1  reinoud 
   1320      1.1  reinoud static struct pool_allocator ecclinepool_allocator = {
   1321      1.1  reinoud         .pa_alloc = ecclinepool_page_alloc,
   1322      1.1  reinoud         .pa_free  = ecclinepool_page_free,
   1323      1.1  reinoud         .pa_pagesz = MAXBSIZE,
   1324      1.1  reinoud };
   1325      1.1  reinoud 
   1326      1.1  reinoud 
   1327      1.1  reinoud static void
   1328      1.1  reinoud udf_discstrat_init_rmw(struct udf_strat_args *args)
   1329      1.1  reinoud {
   1330      1.1  reinoud 	struct udf_mount *ump = args->ump;
   1331      1.1  reinoud 	struct strat_private *priv = PRIV(ump);
   1332      1.1  reinoud 	uint32_t lb_size, blobsize, hashline;
   1333      1.1  reinoud 	int i;
   1334      1.1  reinoud 
   1335      1.1  reinoud 	KASSERT(ump);
   1336      1.1  reinoud 	KASSERT(ump->logical_vol);
   1337      1.1  reinoud 	KASSERT(priv == NULL);
   1338      1.1  reinoud 
   1339      1.1  reinoud 	lb_size = udf_rw32(ump->logical_vol->lb_size);
   1340      1.1  reinoud 	blobsize = ump->packet_size * lb_size;
   1341      1.1  reinoud 	KASSERT(lb_size > 0);
   1342      1.1  reinoud 	KASSERT(ump->packet_size <= 64);
   1343      1.1  reinoud 
   1344      1.1  reinoud 	/* initialise our memory space */
   1345      1.1  reinoud 	ump->strategy_private = malloc(sizeof(struct strat_private),
   1346      1.1  reinoud 		M_UDFTEMP, M_WAITOK);
   1347      1.1  reinoud 	priv = ump->strategy_private;
   1348      1.1  reinoud 	memset(priv, 0 , sizeof(struct strat_private));
   1349      1.1  reinoud 
   1350      1.1  reinoud 	/* initialise locks */
   1351      1.1  reinoud 	cv_init(&priv->discstrat_cv, "udfstrat");
   1352  1.9.4.6      snj 	mutex_init(&priv->discstrat_mutex, MUTEX_DEFAULT, IPL_NONE);
   1353      1.1  reinoud 	mutex_init(&priv->seqwrite_mutex, MUTEX_DEFAULT, IPL_NONE);
   1354      1.1  reinoud 
   1355      1.1  reinoud 	/* initialise struct eccline pool */
   1356      1.1  reinoud 	pool_init(&priv->eccline_pool, sizeof(struct udf_eccline),
   1357      1.1  reinoud 		0, 0, 0, "udf_eccline_pool", NULL, IPL_NONE);
   1358      1.1  reinoud 
   1359      1.1  reinoud 	/* initialise eccline blob pool */
   1360  1.9.4.3      snj         ecclinepool_allocator.pa_pagesz = blobsize;
   1361      1.1  reinoud 	pool_init(&priv->ecclineblob_pool, blobsize,
   1362  1.9.4.3      snj 		0, 0, 0, "udf_eccline_blob", &ecclinepool_allocator, IPL_NONE);
   1363      1.1  reinoud 
   1364      1.1  reinoud 	/* initialise main queues */
   1365      1.1  reinoud 	for (i = 0; i < UDF_SHED_MAX; i++) {
   1366      1.1  reinoud 		priv->num_queued[i] = 0;
   1367      1.1  reinoud 		vfs_timestamp(&priv->last_queued[i]);
   1368      1.1  reinoud 	}
   1369  1.9.4.2      snj 	bufq_alloc(&priv->queues[UDF_SHED_WAITING], "fcfs",
   1370  1.9.4.2      snj 		BUFQ_SORT_RAWBLOCK);
   1371      1.1  reinoud 	bufq_alloc(&priv->queues[UDF_SHED_READING], "disksort",
   1372      1.1  reinoud 		BUFQ_SORT_RAWBLOCK);
   1373      1.1  reinoud 	bufq_alloc(&priv->queues[UDF_SHED_WRITING], "disksort",
   1374      1.1  reinoud 		BUFQ_SORT_RAWBLOCK);
   1375      1.1  reinoud 	bufq_alloc(&priv->queues[UDF_SHED_SEQWRITING], "disksort", 0);
   1376      1.1  reinoud 
   1377      1.1  reinoud 	/* initialise administrative queues */
   1378      1.1  reinoud 	bufq_alloc(&priv->queues[UDF_SHED_IDLE], "fcfs", 0);
   1379      1.1  reinoud 	bufq_alloc(&priv->queues[UDF_SHED_FREE], "fcfs", 0);
   1380      1.1  reinoud 
   1381      1.1  reinoud 	for (hashline = 0; hashline < UDF_ECCBUF_HASHSIZE; hashline++) {
   1382      1.1  reinoud 		LIST_INIT(&priv->eccline_hash[hashline]);
   1383      1.1  reinoud 	}
   1384      1.1  reinoud 
   1385      1.1  reinoud 	/* create our disk strategy thread */
   1386      1.1  reinoud 	priv->cur_queue = UDF_SHED_READING;
   1387      1.1  reinoud 	priv->thread_finished = 0;
   1388  1.9.4.4      snj 	priv->thread_running  = 0;
   1389      1.1  reinoud 	priv->run_thread      = 1;
   1390      1.1  reinoud 	if (kthread_create(PRI_NONE, 0 /* KTHREAD_MPSAFE*/, NULL /* cpu_info*/,
   1391      1.1  reinoud 		udf_discstrat_thread, ump, &priv->queue_lwp,
   1392      1.1  reinoud 		"%s", "udf_rw")) {
   1393      1.1  reinoud 		panic("fork udf_rw");
   1394      1.1  reinoud 	}
   1395  1.9.4.4      snj 
   1396  1.9.4.4      snj 	/* wait for thread to spin up */
   1397  1.9.4.4      snj 	while (!priv->thread_running) {
   1398  1.9.4.4      snj 		tsleep(&priv->thread_running, PRIBIO+1, "udfshedstart", hz);
   1399  1.9.4.4      snj 	}
   1400      1.1  reinoud }
   1401      1.1  reinoud 
   1402      1.1  reinoud 
   1403      1.1  reinoud static void
   1404      1.1  reinoud udf_discstrat_finish_rmw(struct udf_strat_args *args)
   1405      1.1  reinoud {
   1406      1.1  reinoud 	struct udf_mount *ump = args->ump;
   1407      1.1  reinoud 	struct strat_private *priv = PRIV(ump);
   1408      1.1  reinoud 	int error;
   1409      1.1  reinoud 
   1410      1.1  reinoud 	if (ump == NULL)
   1411      1.1  reinoud 		return;
   1412      1.1  reinoud 
   1413      1.1  reinoud 	/* stop our sheduling thread */
   1414      1.1  reinoud 	KASSERT(priv->run_thread == 1);
   1415      1.1  reinoud 	priv->run_thread = 0;
   1416      1.1  reinoud 	wakeup(priv->queue_lwp);
   1417      1.1  reinoud 	while (!priv->thread_finished) {
   1418      1.1  reinoud 		error = tsleep(&priv->run_thread, PRIBIO+1,
   1419      1.1  reinoud 			"udfshedfin", hz);
   1420      1.1  reinoud 	}
   1421      1.1  reinoud 	/* kthread should be finished now */
   1422      1.1  reinoud 
   1423      1.1  reinoud 	/* cleanup our pools */
   1424      1.1  reinoud 	pool_destroy(&priv->eccline_pool);
   1425      1.1  reinoud 	pool_destroy(&priv->ecclineblob_pool);
   1426      1.1  reinoud 
   1427      1.1  reinoud 	cv_destroy(&priv->discstrat_cv);
   1428      1.1  reinoud 	mutex_destroy(&priv->discstrat_mutex);
   1429      1.1  reinoud 	mutex_destroy(&priv->seqwrite_mutex);
   1430      1.1  reinoud 
   1431      1.1  reinoud 	/* free our private space */
   1432      1.1  reinoud 	free(ump->strategy_private, M_UDFTEMP);
   1433      1.1  reinoud 	ump->strategy_private = NULL;
   1434      1.1  reinoud }
   1435      1.1  reinoud 
   1436      1.1  reinoud /* --------------------------------------------------------------------- */
   1437      1.1  reinoud 
   1438      1.1  reinoud struct udf_strategy udf_strat_rmw =	/* function table of the read-modify-write strategy */
   1439      1.1  reinoud {	/* positional initialiser: entry order must match the members of struct udf_strategy (declared elsewhere) */
   1440      1.5  reinoud 	udf_create_nodedscr_rmw,	/* presumably: create a node descriptor -- defined outside this view */
   1441      1.5  reinoud 	udf_free_nodedscr_rmw,	/* presumably: free a node descriptor */
   1442      1.5  reinoud 	udf_read_nodedscr_rmw,	/* presumably: read a node descriptor */
   1443      1.5  reinoud 	udf_write_nodedscr_rmw,	/* presumably: write a node descriptor */
   1444      1.1  reinoud 	udf_queuebuf_rmw,	/* presumably: queue a buffer for I/O */
   1445      1.1  reinoud 	udf_discstrat_init_rmw,	/* sets up private state, pools, queues and the scheduling thread */
   1446      1.1  reinoud 	udf_discstrat_finish_rmw	/* stops the thread and releases the private state */
   1447      1.1  reinoud };
   1448      1.1  reinoud 
   1449