Home | History | Annotate | Line # | Download | only in dm
dm_target_stripe.c revision 1.9.4.2
      1  1.9.4.2    rmind /*$NetBSD: dm_target_stripe.c,v 1.9.4.2 2011/03/05 20:53:07 rmind Exp $*/
      2      1.1     haad 
      3      1.1     haad /*
      4      1.1     haad  * Copyright (c) 2009 The NetBSD Foundation, Inc.
      5      1.1     haad  * All rights reserved.
      6      1.1     haad  *
      7      1.1     haad  * This code is derived from software contributed to The NetBSD Foundation
      8      1.1     haad  * by Adam Hamsik.
      9      1.1     haad  *
     10      1.1     haad  * Redistribution and use in source and binary forms, with or without
     11      1.1     haad  * modification, are permitted provided that the following conditions
     12      1.1     haad  * are met:
     13      1.1     haad  * 1. Redistributions of source code must retain the above copyright
     14      1.1     haad  *    notice, this list of conditions and the following disclaimer.
     15      1.1     haad  * 2. Redistributions in binary form must reproduce the above copyright
     16      1.1     haad  *    notice, this list of conditions and the following disclaimer in the
     17      1.1     haad  *    documentation and/or other materials provided with the distribution.
     18      1.1     haad  *
     19      1.1     haad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20      1.1     haad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21      1.1     haad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22      1.1     haad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23      1.1     haad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24      1.1     haad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25      1.1     haad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26      1.1     haad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27      1.1     haad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28      1.1     haad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29      1.1     haad  * POSSIBILITY OF SUCH DAMAGE.
     30      1.1     haad  */
     31      1.1     haad 
     32      1.1     haad /*
     33      1.1     haad  * This file implements initial version of device-mapper stripe target.
     34      1.1     haad  */
     35      1.1     haad #include <sys/types.h>
     36      1.1     haad #include <sys/param.h>
     37      1.1     haad 
     38      1.1     haad #include <sys/buf.h>
     39      1.3     haad #include <sys/kmem.h>
     40      1.3     haad #include <sys/vnode.h>
     41  1.9.4.2    rmind #include <sys/lwp.h>
     42      1.1     haad 
     43      1.1     haad #include "dm.h"
     44      1.1     haad 
     45      1.1     haad #ifdef DM_TARGET_MODULE
     46      1.1     haad /*
     47      1.1     haad  * Every target can be compiled directly to dm driver or as a
     48      1.1     haad  * separate module this part of target is used for loading targets
     49      1.1     haad  * to dm driver.
     50      1.1     haad  * Target can be unloaded from kernel only if there are no users of
     51      1.1     haad  * it e.g. there are no devices which uses that target.
     52      1.1     haad  */
     53      1.1     haad #include <sys/kernel.h>
     54      1.1     haad #include <sys/module.h>
     55      1.1     haad 
     56      1.1     haad MODULE(MODULE_CLASS_MISC, dm_target_stripe, NULL);
     57      1.1     haad 
     58      1.1     haad static int
     59      1.1     haad dm_target_stripe_modcmd(modcmd_t cmd, void *arg)
     60      1.1     haad {
     61      1.1     haad 	dm_target_t *dmt;
     62      1.1     haad 	int r;
     63      1.1     haad 	dmt = NULL;
     64      1.9     haad 
     65      1.1     haad 	switch (cmd) {
     66      1.1     haad 	case MODULE_CMD_INIT:
     67      1.3     haad 		if ((dmt = dm_target_lookup("stripe")) != NULL) {
     68      1.3     haad 			dm_target_unbusy(dmt);
     69      1.1     haad 			return EEXIST;
     70      1.3     haad 		}
     71      1.1     haad 		dmt = dm_target_alloc("stripe");
     72      1.9     haad 
     73      1.1     haad 		dmt->version[0] = 1;
     74      1.1     haad 		dmt->version[1] = 0;
     75      1.1     haad 		dmt->version[2] = 0;
     76      1.1     haad 		strlcpy(dmt->name, "stripe", DM_MAX_TYPE_NAME);
     77      1.1     haad 		dmt->init = &dm_target_stripe_init;
     78      1.1     haad 		dmt->status = &dm_target_stripe_status;
     79      1.1     haad 		dmt->strategy = &dm_target_stripe_strategy;
     80  1.9.4.1    rmind 		dmt->sync = &dm_target_stripe_sync;
     81      1.1     haad 		dmt->deps = &dm_target_stripe_deps;
     82      1.1     haad 		dmt->destroy = &dm_target_stripe_destroy;
     83      1.1     haad 		dmt->upcall = &dm_target_stripe_upcall;
     84      1.1     haad 
     85      1.1     haad 		r = dm_target_insert(dmt);
     86      1.9     haad 
     87      1.1     haad 		break;
     88      1.1     haad 
     89      1.1     haad 	case MODULE_CMD_FINI:
     90      1.1     haad 		r = dm_target_rem("stripe");
     91      1.1     haad 		break;
     92      1.1     haad 
     93      1.1     haad 	case MODULE_CMD_STAT:
     94      1.1     haad 		return ENOTTY;
     95      1.1     haad 
     96      1.1     haad 	default:
     97      1.1     haad 		return ENOTTY;
     98      1.1     haad 	}
     99      1.1     haad 
    100      1.1     haad 	return r;
    101      1.1     haad }
    102      1.1     haad #endif
    103      1.1     haad 
    104      1.3     haad /*
    105      1.3     haad  * Init function called from dm_table_load_ioctl.
    106  1.9.4.2    rmind  * DM_STRIPE_DEV_OFFSET should always hold the index of the first device-offset
    107  1.9.4.2    rmind  * pair in the parameters.
    108      1.3     haad  * Example line sent to dm from lvm tools when using striped target.
    109      1.3     haad  * start length striped #stripes chunk_size device1 offset1 ... deviceN offsetN
    110      1.3     haad  * 0 65536 striped 2 512 /dev/hda 0 /dev/hdb 0
    111      1.3     haad  */
    112      1.1     haad int
    113      1.9     haad dm_target_stripe_init(dm_dev_t * dmv, void **target_config, char *params)
    114      1.1     haad {
    115  1.9.4.2    rmind 	dm_target_linear_config_t *tlc;
    116      1.3     haad 	dm_target_stripe_config_t *tsc;
    117      1.8     haad 	size_t len;
    118      1.8     haad 	char **ap, *argv[10];
    119  1.9.4.2    rmind 	int strpc, strpi;
    120      1.8     haad 
    121      1.9     haad 	if (params == NULL)
    122      1.3     haad 		return EINVAL;
    123      1.8     haad 
    124      1.8     haad 	len = strlen(params) + 1;
    125      1.9     haad 
    126      1.8     haad 	/*
    127      1.8     haad 	 * Parse a string, containing tokens delimited by white space,
    128      1.8     haad 	 * into an argument vector
    129      1.8     haad 	 */
    130      1.8     haad 	for (ap = argv; ap < &argv[9] &&
    131      1.9     haad 	    (*ap = strsep(&params, " \t")) != NULL;) {
    132      1.8     haad 		if (**ap != '\0')
    133      1.8     haad 			ap++;
    134      1.8     haad 	}
    135      1.9     haad 
    136      1.8     haad 	printf("Stripe target init function called!!\n");
    137      1.1     haad 
    138  1.9.4.2    rmind 	printf("Stripe target chunk size %s number of stripes %s\n",
    139  1.9.4.2    rmind 	    argv[1], argv[0]);
    140      1.3     haad 
    141  1.9.4.2    rmind 	if ((tsc = kmem_alloc(sizeof(*tsc), KM_NOSLEEP)) == NULL)
    142      1.3     haad 		return ENOMEM;
    143      1.9     haad 
    144  1.9.4.2    rmind 	/* Initialize linked list for striping devices */
    145  1.9.4.2    rmind 	TAILQ_INIT(&tsc->stripe_devs);
    146      1.3     haad 
    147      1.8     haad 	/* Save length of param string */
    148      1.8     haad 	tsc->params_len = len;
    149      1.8     haad 	tsc->stripe_chunksize = atoi(argv[1]);
    150      1.9     haad 	tsc->stripe_num = (uint8_t) atoi(argv[0]);
    151      1.9     haad 
    152  1.9.4.2    rmind 	strpc = DM_STRIPE_DEV_OFFSET + (tsc->stripe_num * 2);
    153  1.9.4.2    rmind 	for (strpi = DM_STRIPE_DEV_OFFSET; strpi < strpc; strpi += 2) {
    154  1.9.4.2    rmind 		printf("Stripe target device name %s -- offset %s\n",
    155  1.9.4.2    rmind 		       argv[strpi], argv[strpi+1]);
    156  1.9.4.2    rmind 
    157  1.9.4.2    rmind 		tlc = kmem_alloc(sizeof(*tlc), KM_NOSLEEP);
    158  1.9.4.2    rmind 		if ((tlc->pdev = dm_pdev_insert(argv[strpi])) == NULL)
    159  1.9.4.2    rmind 			return ENOENT;
    160  1.9.4.2    rmind 		tlc->offset = atoi(argv[strpi+1]);
    161  1.9.4.2    rmind 
    162  1.9.4.2    rmind 		/* Insert striping device to linked list. */
    163  1.9.4.2    rmind 		TAILQ_INSERT_TAIL(&tsc->stripe_devs, tlc, entries);
    164  1.9.4.2    rmind 	}
    165  1.9.4.2    rmind 
    166      1.3     haad 	*target_config = tsc;
    167      1.1     haad 
    168      1.1     haad 	dmv->dev_type = DM_STRIPE_DEV;
    169      1.9     haad 
    170      1.3     haad 	return 0;
    171      1.1     haad }
    172      1.1     haad /* Status routine called to get params string. */
    173      1.1     haad char *
    174      1.1     haad dm_target_stripe_status(void *target_config)
    175      1.1     haad {
    176  1.9.4.2    rmind 	dm_target_linear_config_t *tlc;
    177      1.3     haad 	dm_target_stripe_config_t *tsc;
    178  1.9.4.2    rmind 	char *params, *tmp;
    179      1.3     haad 
    180      1.3     haad 	tsc = target_config;
    181      1.9     haad 
    182      1.7     haad 	if ((params = kmem_alloc(DM_MAX_PARAMS_SIZE, KM_SLEEP)) == NULL)
    183      1.3     haad 		return NULL;
    184      1.3     haad 
    185  1.9.4.2    rmind 	if ((tmp = kmem_alloc(DM_MAX_PARAMS_SIZE, KM_SLEEP)) == NULL)
    186  1.9.4.2    rmind 		return NULL;
    187  1.9.4.2    rmind 
    188  1.9.4.2    rmind 	snprintf(params, DM_MAX_PARAMS_SIZE, "%d %" PRIu64,
    189  1.9.4.2    rmind 	    tsc->stripe_num, tsc->stripe_chunksize);
    190  1.9.4.2    rmind 
    191  1.9.4.2    rmind 	TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
    192  1.9.4.2    rmind 		snprintf(tmp, DM_MAX_PARAMS_SIZE, " %s %" PRIu64,
    193  1.9.4.2    rmind 		    tlc->pdev->name, tlc->offset);
    194  1.9.4.2    rmind 		strcat(params, tmp);
    195  1.9.4.2    rmind 	}
    196  1.9.4.2    rmind 
    197  1.9.4.2    rmind 	kmem_free(tmp, DM_MAX_PARAMS_SIZE);
    198      1.9     haad 
    199      1.3     haad 	return params;
    200      1.9     haad }
    201      1.1     haad /* Strategy routine called from dm_strategy. */
    202      1.1     haad int
    203      1.9     haad dm_target_stripe_strategy(dm_table_entry_t * table_en, struct buf * bp)
    204      1.1     haad {
    205  1.9.4.2    rmind 	dm_target_linear_config_t *tlc;
    206      1.4  reinoud 	dm_target_stripe_config_t *tsc;
    207      1.4  reinoud 	struct buf *nestbuf;
    208      1.4  reinoud 	uint64_t blkno, blkoff;
    209      1.4  reinoud 	uint64_t stripe, stripe_blknr;
    210      1.4  reinoud 	uint32_t stripe_off, stripe_rest, num_blks, issue_blks;
    211  1.9.4.2    rmind 	int i, stripe_devnr;
    212      1.4  reinoud 
    213      1.4  reinoud 	tsc = table_en->target_config;
    214      1.4  reinoud 	if (tsc == NULL)
    215      1.4  reinoud 		return 0;
    216      1.4  reinoud 
    217      1.8     haad /*	printf("Stripe target read function called %" PRIu64 "!!\n",
    218      1.4  reinoud 	tlc->offset);*/
    219      1.4  reinoud 
    220      1.4  reinoud 	/* calculate extent of request */
    221      1.4  reinoud 	KASSERT(bp->b_resid % DEV_BSIZE == 0);
    222      1.4  reinoud 
    223      1.9     haad 	blkno = bp->b_blkno;
    224      1.4  reinoud 	blkoff = 0;
    225      1.4  reinoud 	num_blks = bp->b_resid / DEV_BSIZE;
    226      1.4  reinoud 	for (;;) {
    227      1.4  reinoud 		/* blockno to strip piece nr */
    228      1.9     haad 		stripe = blkno / tsc->stripe_chunksize;
    229      1.4  reinoud 		stripe_off = blkno % tsc->stripe_chunksize;
    230      1.4  reinoud 
    231      1.4  reinoud 		/* where we are inside the strip */
    232      1.4  reinoud 		stripe_devnr = stripe % tsc->stripe_num;
    233      1.4  reinoud 		stripe_blknr = stripe / tsc->stripe_num;
    234      1.4  reinoud 
    235      1.4  reinoud 		/* how much is left before we hit a boundary */
    236      1.4  reinoud 		stripe_rest = tsc->stripe_chunksize - stripe_off;
    237      1.4  reinoud 
    238      1.4  reinoud 		/* issue this piece on stripe `stripe' */
    239      1.4  reinoud 		issue_blks = MIN(stripe_rest, num_blks);
    240      1.4  reinoud 		nestbuf = getiobuf(NULL, true);
    241      1.4  reinoud 
    242      1.4  reinoud 		nestiobuf_setup(bp, nestbuf, blkoff, issue_blks * DEV_BSIZE);
    243      1.4  reinoud 		nestbuf->b_blkno = stripe_blknr * tsc->stripe_chunksize + stripe_off;
    244      1.4  reinoud 
    245  1.9.4.2    rmind 		tlc = TAILQ_FIRST(&tsc->stripe_devs);
    246  1.9.4.2    rmind 		for (i = 0; i < stripe_devnr && tlc == NULL; i++)
    247  1.9.4.2    rmind 			tlc = TAILQ_NEXT(tlc, entries);
    248  1.9.4.2    rmind 
    249  1.9.4.2    rmind 		/* by this point we should have an tlc */
    250  1.9.4.2    rmind 		KASSERT(tlc == NULL);
    251  1.9.4.2    rmind 
    252  1.9.4.2    rmind 		nestbuf->b_blkno += tlc->offset;
    253  1.9.4.2    rmind 
    254  1.9.4.2    rmind 		VOP_STRATEGY(tlc->pdev->pdev_vnode, nestbuf);
    255      1.4  reinoud 
    256      1.9     haad 		blkno += issue_blks;
    257      1.9     haad 		blkoff += issue_blks * DEV_BSIZE;
    258      1.4  reinoud 		num_blks -= issue_blks;
    259      1.4  reinoud 
    260      1.4  reinoud 		if (num_blks <= 0)
    261      1.4  reinoud 			break;
    262      1.4  reinoud 	}
    263      1.1     haad 
    264      1.1     haad 	return 0;
    265      1.1     haad }
    266  1.9.4.1    rmind /* Sync underlying disk caches. */
    267  1.9.4.1    rmind int
    268  1.9.4.1    rmind dm_target_stripe_sync(dm_table_entry_t * table_en)
    269  1.9.4.1    rmind {
    270  1.9.4.2    rmind 	int cmd, err;
    271  1.9.4.1    rmind 	dm_target_stripe_config_t *tsc;
    272  1.9.4.2    rmind 	dm_target_linear_config_t *tlc;
    273  1.9.4.1    rmind 
    274  1.9.4.1    rmind 	tsc = table_en->target_config;
    275  1.9.4.1    rmind 
    276  1.9.4.1    rmind 	err = 0;
    277  1.9.4.1    rmind 	cmd = 1;
    278  1.9.4.1    rmind 
    279  1.9.4.2    rmind 	TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
    280  1.9.4.2    rmind 		if ((err = VOP_IOCTL(tlc->pdev->pdev_vnode, DIOCCACHESYNC,
    281  1.9.4.1    rmind 			    &cmd, FREAD|FWRITE, kauth_cred_get())) != 0)
    282  1.9.4.1    rmind 			return err;
    283  1.9.4.1    rmind 	}
    284  1.9.4.1    rmind 
    285  1.9.4.1    rmind 	return err;
    286  1.9.4.1    rmind 
    287  1.9.4.1    rmind }
    288  1.9.4.1    rmind /* Destroy target specific data. */
    289      1.1     haad int
    290      1.9     haad dm_target_stripe_destroy(dm_table_entry_t * table_en)
    291      1.1     haad {
    292      1.3     haad 	dm_target_stripe_config_t *tsc;
    293  1.9.4.2    rmind 	dm_target_linear_config_t *tlc;
    294      1.9     haad 
    295      1.3     haad 	tsc = table_en->target_config;
    296      1.3     haad 
    297      1.3     haad 	if (tsc == NULL)
    298      1.3     haad 		return 0;
    299      1.9     haad 
    300  1.9.4.2    rmind 	while ((tlc = TAILQ_FIRST(&tsc->stripe_devs)) != NULL) {
    301  1.9.4.2    rmind 		TAILQ_REMOVE(&tsc->stripe_devs, tlc, entries);
    302  1.9.4.2    rmind 		dm_pdev_decr(tlc->pdev);
    303  1.9.4.2    rmind 		kmem_free(tlc, sizeof(*tlc));
    304  1.9.4.2    rmind 	}
    305      1.1     haad 
    306      1.1     haad 	/* Unbusy target so we can unload it */
    307      1.1     haad 	dm_target_unbusy(table_en->target);
    308      1.9     haad 
    309  1.9.4.2    rmind 	kmem_free(tsc, sizeof(*tsc));
    310      1.9     haad 
    311      1.3     haad 	table_en->target_config = NULL;
    312      1.3     haad 
    313      1.1     haad 	return 0;
    314      1.1     haad }
    315      1.1     haad /* Doesn't not need to do anything here. */
    316      1.1     haad int
    317      1.9     haad dm_target_stripe_deps(dm_table_entry_t * table_en, prop_array_t prop_array)
    318      1.9     haad {
    319      1.3     haad 	dm_target_stripe_config_t *tsc;
    320  1.9.4.2    rmind 	dm_target_linear_config_t *tlc;
    321      1.3     haad 	struct vattr va;
    322      1.9     haad 
    323      1.3     haad 	int error;
    324      1.9     haad 
    325      1.3     haad 	if (table_en->target_config == NULL)
    326      1.3     haad 		return ENOENT;
    327      1.9     haad 
    328      1.3     haad 	tsc = table_en->target_config;
    329      1.9     haad 
    330  1.9.4.2    rmind 	TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
    331  1.9.4.2    rmind 		if ((error = VOP_GETATTR(tlc->pdev->pdev_vnode, &va, curlwp->l_cred)) != 0)
    332  1.9.4.2    rmind 			return error;
    333      1.3     haad 
    334  1.9.4.2    rmind 		prop_array_add_uint64(prop_array, (uint64_t) va.va_rdev);
    335  1.9.4.2    rmind 	}
    336      1.9     haad 
    337      1.1     haad 	return 0;
    338      1.1     haad }
    339      1.1     haad /* Unsupported for this target. */
    340      1.1     haad int
    341      1.9     haad dm_target_stripe_upcall(dm_table_entry_t * table_en, struct buf * bp)
    342      1.1     haad {
    343      1.1     haad 	return 0;
    344      1.1     haad }
    345  1.9.4.2    rmind /*
    346  1.9.4.2    rmind  * Compute physical block size
    347  1.9.4.2    rmind  * For a stripe target we chose the maximum sector size of all
    348  1.9.4.2    rmind  * stripe devices. For the supported power-of-2 sizes this is equivalent
    349  1.9.4.2    rmind  * to the least common multiple.
    350  1.9.4.2    rmind  */
    351  1.9.4.2    rmind int
    352  1.9.4.2    rmind dm_target_stripe_secsize(dm_table_entry_t * table_en, unsigned *secsizep)
    353  1.9.4.2    rmind {
    354  1.9.4.2    rmind 	dm_target_linear_config_t *tlc;
    355  1.9.4.2    rmind 	dm_target_stripe_config_t *tsc;
    356  1.9.4.2    rmind 	unsigned secsize;
    357  1.9.4.2    rmind 
    358  1.9.4.2    rmind 	secsize = 0;
    359  1.9.4.2    rmind 
    360  1.9.4.2    rmind 	tsc = table_en->target_config;
    361  1.9.4.2    rmind 	if (tsc != NULL) {
    362  1.9.4.2    rmind 		TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
    363  1.9.4.2    rmind 			if (secsize < tlc->pdev->pdev_secsize)
    364  1.9.4.2    rmind 				secsize = tlc->pdev->pdev_secsize;
    365  1.9.4.2    rmind 		}
    366  1.9.4.2    rmind 	}
    367  1.9.4.2    rmind 
    368  1.9.4.2    rmind 	*secsizep = secsize;
    369  1.9.4.2    rmind 
    370  1.9.4.2    rmind 	return 0;
    371  1.9.4.2    rmind }
    372