Home | History | Annotate | Line # | Download | only in dm
dm_target_stripe.c revision 1.32
      1  1.32   tkusumi /*$NetBSD: dm_target_stripe.c,v 1.32 2019/12/08 10:50:21 tkusumi Exp $*/
      2   1.1      haad 
      3   1.1      haad /*
      4   1.1      haad  * Copyright (c) 2009 The NetBSD Foundation, Inc.
      5   1.1      haad  * All rights reserved.
      6   1.1      haad  *
      7   1.1      haad  * This code is derived from software contributed to The NetBSD Foundation
      8   1.1      haad  * by Adam Hamsik.
      9   1.1      haad  *
     10   1.1      haad  * Redistribution and use in source and binary forms, with or without
     11   1.1      haad  * modification, are permitted provided that the following conditions
     12   1.1      haad  * are met:
     13   1.1      haad  * 1. Redistributions of source code must retain the above copyright
     14   1.1      haad  *    notice, this list of conditions and the following disclaimer.
     15   1.1      haad  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1      haad  *    notice, this list of conditions and the following disclaimer in the
     17   1.1      haad  *    documentation and/or other materials provided with the distribution.
     18   1.1      haad  *
     19   1.1      haad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.1      haad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.1      haad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.1      haad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.1      haad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.1      haad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.1      haad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.1      haad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.1      haad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.1      haad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.1      haad  * POSSIBILITY OF SUCH DAMAGE.
     30   1.1      haad  */
     31  1.23  christos #include <sys/cdefs.h>
     32  1.32   tkusumi __KERNEL_RCSID(0, "$NetBSD: dm_target_stripe.c,v 1.32 2019/12/08 10:50:21 tkusumi Exp $");
     33   1.1      haad 
     34   1.1      haad /*
     35   1.1      haad  * This file implements initial version of device-mapper stripe target.
     36   1.1      haad  */
     37   1.1      haad #include <sys/types.h>
     38   1.1      haad #include <sys/param.h>
     39   1.1      haad 
     40   1.1      haad #include <sys/buf.h>
     41   1.3      haad #include <sys/kmem.h>
     42  1.12  uebayasi #include <sys/lwp.h>
     43   1.1      haad 
     44   1.1      haad #include "dm.h"
     45   1.1      haad 
     46  1.32   tkusumi typedef struct target_stripe_config {
     47  1.32   tkusumi #define DM_STRIPE_DEV_OFFSET 2
     48  1.32   tkusumi 	struct target_linear_devs stripe_devs;
     49  1.32   tkusumi 	uint8_t stripe_num;
     50  1.32   tkusumi 	uint64_t stripe_chunksize;
     51  1.32   tkusumi 	size_t params_len;
     52  1.32   tkusumi } dm_target_stripe_config_t;
     53  1.32   tkusumi 
     54   1.1      haad #ifdef DM_TARGET_MODULE
     55   1.1      haad /*
     56   1.1      haad  * Every target can be compiled directly to dm driver or as a
     57   1.1      haad  * separate module this part of target is used for loading targets
     58   1.1      haad  * to dm driver.
     59   1.1      haad  * Target can be unloaded from kernel only if there are no users of
     60   1.1      haad  * it e.g. there are no devices which uses that target.
     61   1.1      haad  */
     62   1.1      haad #include <sys/kernel.h>
     63   1.1      haad #include <sys/module.h>
     64   1.1      haad 
     65   1.1      haad MODULE(MODULE_CLASS_MISC, dm_target_stripe, NULL);
     66   1.1      haad 
     67   1.1      haad static int
     68   1.1      haad dm_target_stripe_modcmd(modcmd_t cmd, void *arg)
     69   1.1      haad {
     70   1.1      haad 	dm_target_t *dmt;
     71   1.1      haad 	int r;
     72   1.1      haad 	dmt = NULL;
     73   1.9      haad 
     74   1.1      haad 	switch (cmd) {
     75   1.1      haad 	case MODULE_CMD_INIT:
     76   1.3      haad 		if ((dmt = dm_target_lookup("stripe")) != NULL) {
     77   1.3      haad 			dm_target_unbusy(dmt);
     78   1.1      haad 			return EEXIST;
     79   1.3      haad 		}
     80   1.1      haad 		dmt = dm_target_alloc("stripe");
     81   1.9      haad 
     82   1.1      haad 		dmt->version[0] = 1;
     83   1.1      haad 		dmt->version[1] = 0;
     84   1.1      haad 		dmt->version[2] = 0;
     85   1.1      haad 		dmt->init = &dm_target_stripe_init;
     86   1.1      haad 		dmt->status = &dm_target_stripe_status;
     87   1.1      haad 		dmt->strategy = &dm_target_stripe_strategy;
     88  1.10      haad 		dmt->sync = &dm_target_stripe_sync;
     89   1.1      haad 		dmt->deps = &dm_target_stripe_deps;
     90   1.1      haad 		dmt->destroy = &dm_target_stripe_destroy;
     91   1.1      haad 		dmt->upcall = &dm_target_stripe_upcall;
     92  1.15     ahoka 		dmt->secsize = &dm_target_stripe_secsize;
     93   1.1      haad 
     94   1.1      haad 		r = dm_target_insert(dmt);
     95   1.9      haad 
     96   1.1      haad 		break;
     97   1.1      haad 
     98   1.1      haad 	case MODULE_CMD_FINI:
     99   1.1      haad 		r = dm_target_rem("stripe");
    100   1.1      haad 		break;
    101   1.1      haad 
    102   1.1      haad 	case MODULE_CMD_STAT:
    103   1.1      haad 		return ENOTTY;
    104   1.1      haad 
    105   1.1      haad 	default:
    106   1.1      haad 		return ENOTTY;
    107   1.1      haad 	}
    108   1.1      haad 
    109   1.1      haad 	return r;
    110   1.1      haad }
    111   1.1      haad #endif
    112   1.1      haad 
    113  1.21  christos static void
    114  1.21  christos dm_target_stripe_fini(dm_target_stripe_config_t *tsc)
    115  1.21  christos {
    116  1.21  christos 	dm_target_linear_config_t *tlc;
    117  1.21  christos 
    118  1.21  christos 	if (tsc == NULL)
    119  1.21  christos 		return;
    120  1.21  christos 
    121  1.21  christos 	while ((tlc = TAILQ_FIRST(&tsc->stripe_devs)) != NULL) {
    122  1.21  christos 		TAILQ_REMOVE(&tsc->stripe_devs, tlc, entries);
    123  1.21  christos 		dm_pdev_decr(tlc->pdev);
    124  1.21  christos 		kmem_free(tlc, sizeof(*tlc));
    125  1.21  christos 	}
    126  1.21  christos 
    127  1.21  christos 	kmem_free(tsc, sizeof(*tsc));
    128  1.21  christos }
    129  1.21  christos 
    130   1.3      haad /*
    131   1.3      haad  * Init function called from dm_table_load_ioctl.
    132  1.11      haad  * DM_STRIPE_DEV_OFFSET should always hold the index of the first device-offset
    133  1.11      haad  * pair in the parameters.
    134   1.3      haad  * Example line sent to dm from lvm tools when using striped target.
    135   1.3      haad  * start length striped #stripes chunk_size device1 offset1 ... deviceN offsetN
    136   1.3      haad  * 0 65536 striped 2 512 /dev/hda 0 /dev/hdb 0
    137   1.3      haad  */
    138   1.1      haad int
    139  1.31   tkusumi dm_target_stripe_init(dm_table_entry_t *table_en, char *params)
    140   1.1      haad {
    141  1.11      haad 	dm_target_linear_config_t *tlc;
    142   1.3      haad 	dm_target_stripe_config_t *tsc;
    143   1.8      haad 	size_t len;
    144   1.8      haad 	char **ap, *argv[10];
    145  1.11      haad 	int strpc, strpi;
    146   1.8      haad 
    147   1.9      haad 	if (params == NULL)
    148   1.3      haad 		return EINVAL;
    149   1.8      haad 
    150   1.8      haad 	len = strlen(params) + 1;
    151   1.9      haad 
    152   1.8      haad 	/*
    153   1.8      haad 	 * Parse a string, containing tokens delimited by white space,
    154   1.8      haad 	 * into an argument vector
    155   1.8      haad 	 */
    156  1.18      haad 	for (ap = argv; ap <= &argv[9] &&
    157   1.9      haad 	    (*ap = strsep(&params, " \t")) != NULL;) {
    158   1.8      haad 		if (**ap != '\0')
    159   1.8      haad 			ap++;
    160   1.8      haad 	}
    161   1.9      haad 
    162   1.8      haad 	printf("Stripe target init function called!!\n");
    163   1.1      haad 
    164  1.11      haad 	printf("Stripe target chunk size %s number of stripes %s\n",
    165  1.11      haad 	    argv[1], argv[0]);
    166   1.3      haad 
    167  1.24       chs 	tsc = kmem_alloc(sizeof(*tsc), KM_SLEEP);
    168   1.9      haad 
    169  1.11      haad 	/* Initialize linked list for striping devices */
    170  1.11      haad 	TAILQ_INIT(&tsc->stripe_devs);
    171   1.3      haad 
    172   1.8      haad 	/* Save length of param string */
    173   1.8      haad 	tsc->params_len = len;
    174   1.8      haad 	tsc->stripe_chunksize = atoi(argv[1]);
    175   1.9      haad 	tsc->stripe_num = (uint8_t) atoi(argv[0]);
    176   1.9      haad 
    177  1.11      haad 	strpc = DM_STRIPE_DEV_OFFSET + (tsc->stripe_num * 2);
    178  1.11      haad 	for (strpi = DM_STRIPE_DEV_OFFSET; strpi < strpc; strpi += 2) {
    179  1.11      haad 		printf("Stripe target device name %s -- offset %s\n",
    180  1.11      haad 		       argv[strpi], argv[strpi+1]);
    181  1.11      haad 
    182  1.24       chs 		tlc = kmem_alloc(sizeof(*tlc), KM_SLEEP);
    183  1.20       agc 		if ((tlc->pdev = dm_pdev_insert(argv[strpi])) == NULL) {
    184  1.20       agc 			kmem_free(tlc, sizeof(*tlc));
    185  1.21  christos 			dm_target_stripe_fini(tsc);
    186  1.15     ahoka 			return ENOENT;
    187  1.20       agc 		}
    188  1.11      haad 		tlc->offset = atoi(argv[strpi+1]);
    189  1.11      haad 
    190  1.11      haad 		/* Insert striping device to linked list. */
    191  1.11      haad 		TAILQ_INSERT_TAIL(&tsc->stripe_devs, tlc, entries);
    192  1.11      haad 	}
    193  1.11      haad 
    194  1.31   tkusumi 	table_en->target_config = tsc;
    195   1.1      haad 
    196   1.3      haad 	return 0;
    197   1.1      haad }
    198  1.23  christos 
    199   1.1      haad /* Status routine called to get params string. */
    200   1.1      haad char *
    201   1.1      haad dm_target_stripe_status(void *target_config)
    202   1.1      haad {
    203  1.11      haad 	dm_target_linear_config_t *tlc;
    204   1.3      haad 	dm_target_stripe_config_t *tsc;
    205  1.11      haad 	char *params, *tmp;
    206   1.3      haad 
    207   1.3      haad 	tsc = target_config;
    208   1.9      haad 
    209  1.22       chs 	params = kmem_alloc(DM_MAX_PARAMS_SIZE, KM_SLEEP);
    210  1.22       chs 	tmp = kmem_alloc(DM_MAX_PARAMS_SIZE, KM_SLEEP);
    211  1.11      haad 
    212  1.11      haad 	snprintf(params, DM_MAX_PARAMS_SIZE, "%d %" PRIu64,
    213  1.11      haad 	    tsc->stripe_num, tsc->stripe_chunksize);
    214  1.11      haad 
    215  1.11      haad 	TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
    216  1.11      haad 		snprintf(tmp, DM_MAX_PARAMS_SIZE, " %s %" PRIu64,
    217  1.11      haad 		    tlc->pdev->name, tlc->offset);
    218  1.11      haad 		strcat(params, tmp);
    219  1.11      haad 	}
    220  1.11      haad 
    221  1.11      haad 	kmem_free(tmp, DM_MAX_PARAMS_SIZE);
    222   1.9      haad 
    223   1.3      haad 	return params;
    224   1.9      haad }
    225  1.23  christos 
    226   1.1      haad /* Strategy routine called from dm_strategy. */
    227   1.1      haad int
    228  1.30   tkusumi dm_target_stripe_strategy(dm_table_entry_t *table_en, struct buf *bp)
    229   1.1      haad {
    230  1.11      haad 	dm_target_linear_config_t *tlc;
    231   1.4   reinoud 	dm_target_stripe_config_t *tsc;
    232   1.4   reinoud 	struct buf *nestbuf;
    233   1.4   reinoud 	uint64_t blkno, blkoff;
    234   1.4   reinoud 	uint64_t stripe, stripe_blknr;
    235   1.4   reinoud 	uint32_t stripe_off, stripe_rest, num_blks, issue_blks;
    236  1.11      haad 	int i, stripe_devnr;
    237   1.4   reinoud 
    238   1.4   reinoud 	tsc = table_en->target_config;
    239   1.4   reinoud 	if (tsc == NULL)
    240   1.4   reinoud 		return 0;
    241   1.4   reinoud 
    242   1.8      haad /*	printf("Stripe target read function called %" PRIu64 "!!\n",
    243   1.4   reinoud 	tlc->offset);*/
    244   1.4   reinoud 
    245   1.4   reinoud 	/* calculate extent of request */
    246   1.4   reinoud 	KASSERT(bp->b_resid % DEV_BSIZE == 0);
    247   1.4   reinoud 
    248   1.9      haad 	blkno = bp->b_blkno;
    249   1.4   reinoud 	blkoff = 0;
    250   1.4   reinoud 	num_blks = bp->b_resid / DEV_BSIZE;
    251   1.4   reinoud 	for (;;) {
    252  1.29   tkusumi 		/* blockno to stripe piece nr */
    253   1.9      haad 		stripe = blkno / tsc->stripe_chunksize;
    254   1.4   reinoud 		stripe_off = blkno % tsc->stripe_chunksize;
    255   1.4   reinoud 
    256  1.29   tkusumi 		/* where we are inside the stripe */
    257   1.4   reinoud 		stripe_devnr = stripe % tsc->stripe_num;
    258   1.4   reinoud 		stripe_blknr = stripe / tsc->stripe_num;
    259   1.4   reinoud 
    260   1.4   reinoud 		/* how much is left before we hit a boundary */
    261   1.4   reinoud 		stripe_rest = tsc->stripe_chunksize - stripe_off;
    262   1.4   reinoud 
    263   1.4   reinoud 		/* issue this piece on stripe `stripe' */
    264   1.4   reinoud 		issue_blks = MIN(stripe_rest, num_blks);
    265   1.4   reinoud 		nestbuf = getiobuf(NULL, true);
    266   1.4   reinoud 
    267   1.4   reinoud 		nestiobuf_setup(bp, nestbuf, blkoff, issue_blks * DEV_BSIZE);
    268   1.4   reinoud 		nestbuf->b_blkno = stripe_blknr * tsc->stripe_chunksize + stripe_off;
    269   1.4   reinoud 
    270  1.11      haad 		tlc = TAILQ_FIRST(&tsc->stripe_devs);
    271  1.14      haad 		for (i = 0; i < stripe_devnr && tlc != NULL; i++)
    272  1.11      haad 			tlc = TAILQ_NEXT(tlc, entries);
    273  1.11      haad 
    274  1.11      haad 		/* by this point we should have an tlc */
    275  1.17      haad 		KASSERT(tlc != NULL);
    276  1.11      haad 
    277  1.11      haad 		nestbuf->b_blkno += tlc->offset;
    278  1.11      haad 
    279  1.11      haad 		VOP_STRATEGY(tlc->pdev->pdev_vnode, nestbuf);
    280   1.4   reinoud 
    281   1.9      haad 		blkno += issue_blks;
    282   1.9      haad 		blkoff += issue_blks * DEV_BSIZE;
    283   1.4   reinoud 		num_blks -= issue_blks;
    284   1.4   reinoud 
    285   1.4   reinoud 		if (num_blks <= 0)
    286   1.4   reinoud 			break;
    287   1.4   reinoud 	}
    288   1.1      haad 
    289   1.1      haad 	return 0;
    290   1.1      haad }
    291  1.23  christos 
    292  1.10      haad /* Sync underlying disk caches. */
    293  1.10      haad int
    294  1.30   tkusumi dm_target_stripe_sync(dm_table_entry_t *table_en)
    295  1.10      haad {
    296  1.11      haad 	int cmd, err;
    297  1.10      haad 	dm_target_stripe_config_t *tsc;
    298  1.11      haad 	dm_target_linear_config_t *tlc;
    299  1.10      haad 
    300  1.10      haad 	tsc = table_en->target_config;
    301  1.10      haad 
    302  1.10      haad 	err = 0;
    303  1.10      haad 	cmd = 1;
    304  1.10      haad 
    305  1.11      haad 	TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
    306  1.11      haad 		if ((err = VOP_IOCTL(tlc->pdev->pdev_vnode, DIOCCACHESYNC,
    307  1.10      haad 			    &cmd, FREAD|FWRITE, kauth_cred_get())) != 0)
    308  1.10      haad 			return err;
    309  1.10      haad 	}
    310  1.15     ahoka 
    311  1.10      haad 	return err;
    312  1.10      haad 
    313  1.10      haad }
    314  1.23  christos 
    315  1.10      haad /* Destroy target specific data. */
    316   1.1      haad int
    317  1.30   tkusumi dm_target_stripe_destroy(dm_table_entry_t *table_en)
    318   1.1      haad {
    319  1.21  christos 	dm_target_stripe_fini(table_en->target_config);
    320   1.1      haad 
    321   1.1      haad 	/* Unbusy target so we can unload it */
    322   1.1      haad 	dm_target_unbusy(table_en->target);
    323   1.9      haad 
    324   1.1      haad 	return 0;
    325   1.1      haad }
    326  1.23  christos 
    327   1.1      haad /* Doesn't not need to do anything here. */
    328   1.1      haad int
    329  1.30   tkusumi dm_target_stripe_deps(dm_table_entry_t *table_en, prop_array_t prop_array)
    330   1.9      haad {
    331   1.3      haad 	dm_target_stripe_config_t *tsc;
    332  1.11      haad 	dm_target_linear_config_t *tlc;
    333   1.9      haad 
    334   1.3      haad 	if (table_en->target_config == NULL)
    335   1.3      haad 		return ENOENT;
    336   1.9      haad 
    337   1.3      haad 	tsc = table_en->target_config;
    338   1.9      haad 
    339  1.11      haad 	TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
    340  1.19   hannken 		prop_array_add_uint64(prop_array,
    341  1.19   hannken 		    (uint64_t) tlc->pdev->pdev_vnode->v_rdev);
    342  1.11      haad 	}
    343   1.9      haad 
    344   1.1      haad 	return 0;
    345   1.1      haad }
    346  1.23  christos 
    347   1.1      haad /* Unsupported for this target. */
    348   1.1      haad int
    349  1.30   tkusumi dm_target_stripe_upcall(dm_table_entry_t *table_en, struct buf *bp)
    350   1.1      haad {
    351   1.1      haad 	return 0;
    352   1.1      haad }
    353  1.23  christos 
    354  1.13   mlelstv /*
    355  1.13   mlelstv  * Compute physical block size
    356  1.15     ahoka  * For a stripe target we chose the maximum sector size of all
    357  1.13   mlelstv  * stripe devices. For the supported power-of-2 sizes this is equivalent
    358  1.13   mlelstv  * to the least common multiple.
    359  1.13   mlelstv  */
    360  1.13   mlelstv int
    361  1.30   tkusumi dm_target_stripe_secsize(dm_table_entry_t *table_en, unsigned *secsizep)
    362  1.13   mlelstv {
    363  1.13   mlelstv 	dm_target_linear_config_t *tlc;
    364  1.13   mlelstv 	dm_target_stripe_config_t *tsc;
    365  1.13   mlelstv 	unsigned secsize;
    366  1.13   mlelstv 
    367  1.13   mlelstv 	secsize = 0;
    368  1.13   mlelstv 
    369  1.13   mlelstv 	tsc = table_en->target_config;
    370  1.13   mlelstv 	if (tsc != NULL) {
    371  1.13   mlelstv 		TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
    372  1.13   mlelstv 			if (secsize < tlc->pdev->pdev_secsize)
    373  1.13   mlelstv 				secsize = tlc->pdev->pdev_secsize;
    374  1.13   mlelstv 		}
    375  1.13   mlelstv 	}
    376  1.13   mlelstv 
    377  1.13   mlelstv 	*secsizep = secsize;
    378  1.13   mlelstv 
    379  1.13   mlelstv 	return 0;
    380  1.13   mlelstv }
    381