dm_target_stripe.c revision 1.18 1 1.18 haad /*$NetBSD: dm_target_stripe.c,v 1.18 2012/08/07 16:11:11 haad Exp $*/
2 1.1 haad
3 1.1 haad /*
4 1.1 haad * Copyright (c) 2009 The NetBSD Foundation, Inc.
5 1.1 haad * All rights reserved.
6 1.1 haad *
7 1.1 haad * This code is derived from software contributed to The NetBSD Foundation
8 1.1 haad * by Adam Hamsik.
9 1.1 haad *
10 1.1 haad * Redistribution and use in source and binary forms, with or without
11 1.1 haad * modification, are permitted provided that the following conditions
12 1.1 haad * are met:
13 1.1 haad * 1. Redistributions of source code must retain the above copyright
14 1.1 haad * notice, this list of conditions and the following disclaimer.
15 1.1 haad * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 haad * notice, this list of conditions and the following disclaimer in the
17 1.1 haad * documentation and/or other materials provided with the distribution.
18 1.1 haad *
19 1.1 haad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 haad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 haad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 haad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 haad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 haad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 haad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 haad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 haad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 haad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 haad * POSSIBILITY OF SUCH DAMAGE.
30 1.1 haad */
31 1.1 haad
32 1.1 haad /*
33 1.1 haad * This file implements an initial version of the device-mapper stripe target.
34 1.1 haad */
35 1.1 haad #include <sys/types.h>
36 1.1 haad #include <sys/param.h>
37 1.1 haad
38 1.1 haad #include <sys/buf.h>
39 1.3 haad #include <sys/kmem.h>
40 1.3 haad #include <sys/vnode.h>
41 1.12 uebayasi #include <sys/lwp.h>
42 1.1 haad
43 1.1 haad #include "dm.h"
44 1.1 haad
45 1.1 haad #ifdef DM_TARGET_MODULE
46 1.1 haad /*
47 1.1 haad * Every target can be compiled directly into the dm driver or as a
48 1.1 haad * separate module. This part of the target is used for loading the
49 1.1 haad * target into the dm driver.
50 1.1 haad * A target can be unloaded from the kernel only if it has no users,
51 1.1 haad * i.e. there are no devices which use that target.
52 1.1 haad */
53 1.1 haad #include <sys/kernel.h>
54 1.1 haad #include <sys/module.h>
55 1.1 haad
56 1.1 haad MODULE(MODULE_CLASS_MISC, dm_target_stripe, NULL);
57 1.1 haad
58 1.1 haad static int
59 1.1 haad dm_target_stripe_modcmd(modcmd_t cmd, void *arg)
60 1.1 haad {
61 1.1 haad dm_target_t *dmt;
62 1.1 haad int r;
63 1.1 haad dmt = NULL;
64 1.9 haad
65 1.1 haad switch (cmd) {
66 1.1 haad case MODULE_CMD_INIT:
67 1.3 haad if ((dmt = dm_target_lookup("stripe")) != NULL) {
68 1.3 haad dm_target_unbusy(dmt);
69 1.1 haad return EEXIST;
70 1.3 haad }
71 1.1 haad dmt = dm_target_alloc("stripe");
72 1.9 haad
73 1.1 haad dmt->version[0] = 1;
74 1.1 haad dmt->version[1] = 0;
75 1.1 haad dmt->version[2] = 0;
76 1.1 haad strlcpy(dmt->name, "stripe", DM_MAX_TYPE_NAME);
77 1.1 haad dmt->init = &dm_target_stripe_init;
78 1.1 haad dmt->status = &dm_target_stripe_status;
79 1.1 haad dmt->strategy = &dm_target_stripe_strategy;
80 1.10 haad dmt->sync = &dm_target_stripe_sync;
81 1.1 haad dmt->deps = &dm_target_stripe_deps;
82 1.1 haad dmt->destroy = &dm_target_stripe_destroy;
83 1.1 haad dmt->upcall = &dm_target_stripe_upcall;
84 1.15 ahoka dmt->secsize = &dm_target_stripe_secsize;
85 1.1 haad
86 1.1 haad r = dm_target_insert(dmt);
87 1.9 haad
88 1.1 haad break;
89 1.1 haad
90 1.1 haad case MODULE_CMD_FINI:
91 1.1 haad r = dm_target_rem("stripe");
92 1.1 haad break;
93 1.1 haad
94 1.1 haad case MODULE_CMD_STAT:
95 1.1 haad return ENOTTY;
96 1.1 haad
97 1.1 haad default:
98 1.1 haad return ENOTTY;
99 1.1 haad }
100 1.1 haad
101 1.1 haad return r;
102 1.1 haad }
103 1.1 haad #endif
104 1.1 haad
105 1.3 haad /*
106 1.3 haad * Init function called from dm_table_load_ioctl.
107 1.11 haad * DM_STRIPE_DEV_OFFSET should always hold the index of the first device-offset
108 1.11 haad * pair in the parameters.
109 1.3 haad * Example line sent to dm from lvm tools when using striped target.
110 1.3 haad * start length striped #stripes chunk_size device1 offset1 ... deviceN offsetN
111 1.3 haad * 0 65536 striped 2 512 /dev/hda 0 /dev/hdb 0
112 1.3 haad */
113 1.1 haad int
114 1.9 haad dm_target_stripe_init(dm_dev_t * dmv, void **target_config, char *params)
115 1.1 haad {
116 1.11 haad dm_target_linear_config_t *tlc;
117 1.3 haad dm_target_stripe_config_t *tsc;
118 1.8 haad size_t len;
119 1.8 haad char **ap, *argv[10];
120 1.11 haad int strpc, strpi;
121 1.8 haad
122 1.9 haad if (params == NULL)
123 1.3 haad return EINVAL;
124 1.8 haad
125 1.8 haad len = strlen(params) + 1;
126 1.9 haad
127 1.8 haad /*
128 1.8 haad * Parse a string, containing tokens delimited by white space,
129 1.8 haad * into an argument vector
130 1.8 haad */
131 1.18 haad for (ap = argv; ap <= &argv[9] &&
132 1.9 haad (*ap = strsep(¶ms, " \t")) != NULL;) {
133 1.8 haad if (**ap != '\0')
134 1.8 haad ap++;
135 1.8 haad }
136 1.9 haad
137 1.8 haad printf("Stripe target init function called!!\n");
138 1.1 haad
139 1.11 haad printf("Stripe target chunk size %s number of stripes %s\n",
140 1.11 haad argv[1], argv[0]);
141 1.3 haad
142 1.11 haad if ((tsc = kmem_alloc(sizeof(*tsc), KM_NOSLEEP)) == NULL)
143 1.3 haad return ENOMEM;
144 1.9 haad
145 1.11 haad /* Initialize linked list for striping devices */
146 1.11 haad TAILQ_INIT(&tsc->stripe_devs);
147 1.3 haad
148 1.8 haad /* Save length of param string */
149 1.8 haad tsc->params_len = len;
150 1.8 haad tsc->stripe_chunksize = atoi(argv[1]);
151 1.9 haad tsc->stripe_num = (uint8_t) atoi(argv[0]);
152 1.9 haad
153 1.11 haad strpc = DM_STRIPE_DEV_OFFSET + (tsc->stripe_num * 2);
154 1.11 haad for (strpi = DM_STRIPE_DEV_OFFSET; strpi < strpc; strpi += 2) {
155 1.11 haad printf("Stripe target device name %s -- offset %s\n",
156 1.11 haad argv[strpi], argv[strpi+1]);
157 1.11 haad
158 1.11 haad tlc = kmem_alloc(sizeof(*tlc), KM_NOSLEEP);
159 1.11 haad if ((tlc->pdev = dm_pdev_insert(argv[strpi])) == NULL)
160 1.15 ahoka return ENOENT;
161 1.11 haad tlc->offset = atoi(argv[strpi+1]);
162 1.11 haad
163 1.11 haad /* Insert striping device to linked list. */
164 1.11 haad TAILQ_INSERT_TAIL(&tsc->stripe_devs, tlc, entries);
165 1.11 haad }
166 1.11 haad
167 1.3 haad *target_config = tsc;
168 1.1 haad
169 1.1 haad dmv->dev_type = DM_STRIPE_DEV;
170 1.9 haad
171 1.3 haad return 0;
172 1.1 haad }
173 1.1 haad /* Status routine called to get params string. */
174 1.1 haad char *
175 1.1 haad dm_target_stripe_status(void *target_config)
176 1.1 haad {
177 1.11 haad dm_target_linear_config_t *tlc;
178 1.3 haad dm_target_stripe_config_t *tsc;
179 1.11 haad char *params, *tmp;
180 1.3 haad
181 1.3 haad tsc = target_config;
182 1.9 haad
183 1.7 haad if ((params = kmem_alloc(DM_MAX_PARAMS_SIZE, KM_SLEEP)) == NULL)
184 1.3 haad return NULL;
185 1.3 haad
186 1.11 haad if ((tmp = kmem_alloc(DM_MAX_PARAMS_SIZE, KM_SLEEP)) == NULL)
187 1.11 haad return NULL;
188 1.11 haad
189 1.11 haad snprintf(params, DM_MAX_PARAMS_SIZE, "%d %" PRIu64,
190 1.11 haad tsc->stripe_num, tsc->stripe_chunksize);
191 1.11 haad
192 1.11 haad TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
193 1.11 haad snprintf(tmp, DM_MAX_PARAMS_SIZE, " %s %" PRIu64,
194 1.11 haad tlc->pdev->name, tlc->offset);
195 1.11 haad strcat(params, tmp);
196 1.11 haad }
197 1.11 haad
198 1.11 haad kmem_free(tmp, DM_MAX_PARAMS_SIZE);
199 1.9 haad
200 1.3 haad return params;
201 1.9 haad }
202 1.1 haad /* Strategy routine called from dm_strategy. */
203 1.1 haad int
204 1.9 haad dm_target_stripe_strategy(dm_table_entry_t * table_en, struct buf * bp)
205 1.1 haad {
206 1.11 haad dm_target_linear_config_t *tlc;
207 1.4 reinoud dm_target_stripe_config_t *tsc;
208 1.4 reinoud struct buf *nestbuf;
209 1.4 reinoud uint64_t blkno, blkoff;
210 1.4 reinoud uint64_t stripe, stripe_blknr;
211 1.4 reinoud uint32_t stripe_off, stripe_rest, num_blks, issue_blks;
212 1.11 haad int i, stripe_devnr;
213 1.4 reinoud
214 1.4 reinoud tsc = table_en->target_config;
215 1.4 reinoud if (tsc == NULL)
216 1.4 reinoud return 0;
217 1.4 reinoud
218 1.8 haad /* printf("Stripe target read function called %" PRIu64 "!!\n",
219 1.4 reinoud tlc->offset);*/
220 1.4 reinoud
221 1.4 reinoud /* calculate extent of request */
222 1.4 reinoud KASSERT(bp->b_resid % DEV_BSIZE == 0);
223 1.4 reinoud
224 1.9 haad blkno = bp->b_blkno;
225 1.4 reinoud blkoff = 0;
226 1.4 reinoud num_blks = bp->b_resid / DEV_BSIZE;
227 1.4 reinoud for (;;) {
228 1.4 reinoud /* blockno to strip piece nr */
229 1.9 haad stripe = blkno / tsc->stripe_chunksize;
230 1.4 reinoud stripe_off = blkno % tsc->stripe_chunksize;
231 1.4 reinoud
232 1.4 reinoud /* where we are inside the strip */
233 1.4 reinoud stripe_devnr = stripe % tsc->stripe_num;
234 1.4 reinoud stripe_blknr = stripe / tsc->stripe_num;
235 1.4 reinoud
236 1.4 reinoud /* how much is left before we hit a boundary */
237 1.4 reinoud stripe_rest = tsc->stripe_chunksize - stripe_off;
238 1.4 reinoud
239 1.4 reinoud /* issue this piece on stripe `stripe' */
240 1.4 reinoud issue_blks = MIN(stripe_rest, num_blks);
241 1.4 reinoud nestbuf = getiobuf(NULL, true);
242 1.4 reinoud
243 1.4 reinoud nestiobuf_setup(bp, nestbuf, blkoff, issue_blks * DEV_BSIZE);
244 1.4 reinoud nestbuf->b_blkno = stripe_blknr * tsc->stripe_chunksize + stripe_off;
245 1.4 reinoud
246 1.11 haad tlc = TAILQ_FIRST(&tsc->stripe_devs);
247 1.14 haad for (i = 0; i < stripe_devnr && tlc != NULL; i++)
248 1.11 haad tlc = TAILQ_NEXT(tlc, entries);
249 1.11 haad
250 1.11 haad /* by this point we should have an tlc */
251 1.17 haad KASSERT(tlc != NULL);
252 1.11 haad
253 1.11 haad nestbuf->b_blkno += tlc->offset;
254 1.11 haad
255 1.11 haad VOP_STRATEGY(tlc->pdev->pdev_vnode, nestbuf);
256 1.4 reinoud
257 1.9 haad blkno += issue_blks;
258 1.9 haad blkoff += issue_blks * DEV_BSIZE;
259 1.4 reinoud num_blks -= issue_blks;
260 1.4 reinoud
261 1.4 reinoud if (num_blks <= 0)
262 1.4 reinoud break;
263 1.4 reinoud }
264 1.1 haad
265 1.1 haad return 0;
266 1.1 haad }
267 1.10 haad /* Sync underlying disk caches. */
268 1.10 haad int
269 1.10 haad dm_target_stripe_sync(dm_table_entry_t * table_en)
270 1.10 haad {
271 1.11 haad int cmd, err;
272 1.10 haad dm_target_stripe_config_t *tsc;
273 1.11 haad dm_target_linear_config_t *tlc;
274 1.10 haad
275 1.10 haad tsc = table_en->target_config;
276 1.10 haad
277 1.10 haad err = 0;
278 1.10 haad cmd = 1;
279 1.10 haad
280 1.11 haad TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
281 1.11 haad if ((err = VOP_IOCTL(tlc->pdev->pdev_vnode, DIOCCACHESYNC,
282 1.10 haad &cmd, FREAD|FWRITE, kauth_cred_get())) != 0)
283 1.10 haad return err;
284 1.10 haad }
285 1.15 ahoka
286 1.10 haad return err;
287 1.10 haad
288 1.10 haad }
289 1.10 haad /* Destroy target specific data. */
290 1.1 haad int
291 1.9 haad dm_target_stripe_destroy(dm_table_entry_t * table_en)
292 1.1 haad {
293 1.3 haad dm_target_stripe_config_t *tsc;
294 1.11 haad dm_target_linear_config_t *tlc;
295 1.9 haad
296 1.3 haad tsc = table_en->target_config;
297 1.3 haad
298 1.3 haad if (tsc == NULL)
299 1.3 haad return 0;
300 1.9 haad
301 1.11 haad while ((tlc = TAILQ_FIRST(&tsc->stripe_devs)) != NULL) {
302 1.11 haad TAILQ_REMOVE(&tsc->stripe_devs, tlc, entries);
303 1.11 haad dm_pdev_decr(tlc->pdev);
304 1.11 haad kmem_free(tlc, sizeof(*tlc));
305 1.11 haad }
306 1.1 haad
307 1.1 haad /* Unbusy target so we can unload it */
308 1.1 haad dm_target_unbusy(table_en->target);
309 1.9 haad
310 1.11 haad kmem_free(tsc, sizeof(*tsc));
311 1.9 haad
312 1.3 haad table_en->target_config = NULL;
313 1.3 haad
314 1.1 haad return 0;
315 1.1 haad }
316 1.1 haad /* Doesn't not need to do anything here. */
317 1.1 haad int
318 1.9 haad dm_target_stripe_deps(dm_table_entry_t * table_en, prop_array_t prop_array)
319 1.9 haad {
320 1.3 haad dm_target_stripe_config_t *tsc;
321 1.11 haad dm_target_linear_config_t *tlc;
322 1.3 haad struct vattr va;
323 1.9 haad
324 1.3 haad int error;
325 1.9 haad
326 1.3 haad if (table_en->target_config == NULL)
327 1.3 haad return ENOENT;
328 1.9 haad
329 1.3 haad tsc = table_en->target_config;
330 1.9 haad
331 1.11 haad TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
332 1.16 hannken vn_lock(tlc->pdev->pdev_vnode, LK_SHARED | LK_RETRY);
333 1.16 hannken error = VOP_GETATTR(tlc->pdev->pdev_vnode, &va, curlwp->l_cred);
334 1.16 hannken VOP_UNLOCK(tlc->pdev->pdev_vnode);
335 1.16 hannken if (error != 0)
336 1.11 haad return error;
337 1.3 haad
338 1.11 haad prop_array_add_uint64(prop_array, (uint64_t) va.va_rdev);
339 1.11 haad }
340 1.9 haad
341 1.1 haad return 0;
342 1.1 haad }
343 1.1 haad /* Unsupported for this target. */
344 1.1 haad int
345 1.9 haad dm_target_stripe_upcall(dm_table_entry_t * table_en, struct buf * bp)
346 1.1 haad {
347 1.1 haad return 0;
348 1.1 haad }
349 1.13 mlelstv /*
350 1.13 mlelstv * Compute physical block size
351 1.15 ahoka * For a stripe target we chose the maximum sector size of all
352 1.13 mlelstv * stripe devices. For the supported power-of-2 sizes this is equivalent
353 1.13 mlelstv * to the least common multiple.
354 1.13 mlelstv */
355 1.13 mlelstv int
356 1.13 mlelstv dm_target_stripe_secsize(dm_table_entry_t * table_en, unsigned *secsizep)
357 1.13 mlelstv {
358 1.13 mlelstv dm_target_linear_config_t *tlc;
359 1.13 mlelstv dm_target_stripe_config_t *tsc;
360 1.13 mlelstv unsigned secsize;
361 1.13 mlelstv
362 1.13 mlelstv secsize = 0;
363 1.13 mlelstv
364 1.13 mlelstv tsc = table_en->target_config;
365 1.13 mlelstv if (tsc != NULL) {
366 1.13 mlelstv TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
367 1.13 mlelstv if (secsize < tlc->pdev->pdev_secsize)
368 1.13 mlelstv secsize = tlc->pdev->pdev_secsize;
369 1.13 mlelstv }
370 1.13 mlelstv }
371 1.13 mlelstv
372 1.13 mlelstv *secsizep = secsize;
373 1.13 mlelstv
374 1.13 mlelstv return 0;
375 1.13 mlelstv }
376