dm_target_stripe.c revision 1.23.4.1 1 /*$NetBSD: dm_target_stripe.c,v 1.23.4.1 2020/04/08 14:08:03 martin Exp $*/
2
3 /*
4 * Copyright (c) 2009 The NetBSD Foundation, Inc.
5 * All rights reserved.
6 *
7 * This code is derived from software contributed to The NetBSD Foundation
8 * by Adam Hamsik.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 * POSSIBILITY OF SUCH DAMAGE.
30 */
31 #include <sys/cdefs.h>
32 __KERNEL_RCSID(0, "$NetBSD: dm_target_stripe.c,v 1.23.4.1 2020/04/08 14:08:03 martin Exp $");
33
/*
 * This file implements an initial version of the device-mapper stripe target.
 */
37 #include <sys/types.h>
38 #include <sys/param.h>
39 #include <sys/buf.h>
40 #include <sys/kmem.h>
41 #include <sys/lwp.h>
42
43 #include "dm.h"
44
45 typedef struct target_stripe_config {
46 #define DM_STRIPE_DEV_OFFSET 2
47 struct target_linear_devs stripe_devs;
48 uint8_t stripe_num;
49 uint64_t stripe_chunksize;
50 } dm_target_stripe_config_t;
51
52 #ifdef DM_TARGET_MODULE
/*
 * Every target can be compiled directly into the dm driver or as a
 * separate module; this part of the target is used for loading it
 * into the dm driver.
 * A target can be unloaded from the kernel only if it has no users,
 * i.e. there are no devices which use that target.
 */
60 #include <sys/kernel.h>
61 #include <sys/module.h>
62
63 MODULE(MODULE_CLASS_MISC, dm_target_stripe, NULL);
64
65 static int
66 dm_target_stripe_modcmd(modcmd_t cmd, void *arg)
67 {
68 dm_target_t *dmt;
69 int r;
70
71 switch (cmd) {
72 case MODULE_CMD_INIT:
73 if ((dmt = dm_target_lookup("striped")) != NULL) {
74 dm_target_unbusy(dmt);
75 return EEXIST;
76 }
77 dmt = dm_target_alloc("striped");
78
79 dmt->version[0] = 1;
80 dmt->version[1] = 0;
81 dmt->version[2] = 0;
82 dmt->init = &dm_target_stripe_init;
83 dmt->info = &dm_target_stripe_info;
84 dmt->table = &dm_target_stripe_table;
85 dmt->strategy = &dm_target_stripe_strategy;
86 dmt->sync = &dm_target_stripe_sync;
87 dmt->destroy = &dm_target_stripe_destroy;
88 //dmt->upcall = &dm_target_stripe_upcall;
89 dmt->secsize = &dm_target_stripe_secsize;
90
91 r = dm_target_insert(dmt);
92
93 break;
94
95 case MODULE_CMD_FINI:
96 r = dm_target_rem("striped");
97 break;
98
99 case MODULE_CMD_STAT:
100 return ENOTTY;
101
102 default:
103 return ENOTTY;
104 }
105
106 return r;
107 }
108 #endif
109
110 static void
111 dm_target_stripe_fini(dm_target_stripe_config_t *tsc)
112 {
113 dm_target_linear_config_t *tlc;
114
115 if (tsc == NULL)
116 return;
117
118 while ((tlc = TAILQ_FIRST(&tsc->stripe_devs)) != NULL) {
119 TAILQ_REMOVE(&tsc->stripe_devs, tlc, entries);
120 dm_pdev_decr(tlc->pdev);
121 kmem_free(tlc, sizeof(*tlc));
122 }
123
124 kmem_free(tsc, sizeof(*tsc));
125 }
126
127 /*
128 * Init function called from dm_table_load_ioctl.
129 * DM_STRIPE_DEV_OFFSET should always hold the index of the first device-offset
130 * pair in the parameters.
131 * Example line sent to dm from lvm tools when using striped target.
132 * start length striped #stripes chunk_size device1 offset1 ... deviceN offsetN
133 * 0 65536 striped 2 512 /dev/hda 0 /dev/hdb 0
134 */
135 int
136 dm_target_stripe_init(dm_table_entry_t *table_en, int argc, char **argv)
137 {
138 dm_target_linear_config_t *tlc;
139 dm_target_stripe_config_t *tsc;
140 int strpc, strpi;
141
142 if (argc < 2) {
143 printf("Stripe target takes at least 2 args, %d given\n", argc);
144 return EINVAL;
145 }
146
147 printf("Stripe target init function called!!\n");
148 printf("Stripe target chunk size %s number of stripes %s\n",
149 argv[1], argv[0]);
150
151 if ((tsc = kmem_alloc(sizeof(*tsc), KM_NOSLEEP)) == NULL)
152 return ENOMEM;
153
154 /* Initialize linked list for striping devices */
155 TAILQ_INIT(&tsc->stripe_devs);
156
157 /* Save length of param string */
158 tsc->stripe_chunksize = atoi64(argv[1]);
159 tsc->stripe_num = (uint8_t) atoi64(argv[0]);
160
161 strpc = DM_STRIPE_DEV_OFFSET + (tsc->stripe_num * 2);
162 for (strpi = DM_STRIPE_DEV_OFFSET; strpi < strpc; strpi += 2) {
163 printf("Stripe target device name %s -- offset %s\n",
164 argv[strpi], argv[strpi+1]);
165
166 tlc = kmem_alloc(sizeof(*tlc), KM_NOSLEEP);
167 if ((tlc->pdev = dm_pdev_insert(argv[strpi])) == NULL) {
168 kmem_free(tlc, sizeof(*tlc));
169 dm_target_stripe_fini(tsc);
170 return ENOENT;
171 }
172 tlc->offset = atoi64(argv[strpi+1]);
173 dm_table_add_deps(table_en, tlc->pdev);
174
175 /* Insert striping device to linked list. */
176 TAILQ_INSERT_TAIL(&tsc->stripe_devs, tlc, entries);
177 }
178
179 table_en->target_config = tsc;
180
181 return 0;
182 }
183
184 /* Info routine called to get params string. */
185 char *
186 dm_target_stripe_info(void *target_config)
187 {
188 dm_target_linear_config_t *tlc;
189 dm_target_stripe_config_t *tsc;
190 char *params, *ptr, buf[256];
191 int ret, i = 0;
192 size_t len;
193
194 tsc = target_config;
195
196 len = DM_MAX_PARAMS_SIZE;
197 params = kmem_alloc(len, KM_SLEEP);
198 ptr = params;
199
200 ret = snprintf(ptr, len, "%d ", tsc->stripe_num);
201 ptr += ret;
202 len -= ret;
203
204 memset(buf, 0, sizeof(buf));
205 TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
206 ret = snprintf(ptr, len, "%s ", tlc->pdev->udev_name);
207 if (0 /*tlc->num_error*/)
208 buf[i] = 'D';
209 else
210 buf[i] = 'A';
211 i++;
212 ptr += ret;
213 len -= ret;
214 }
215
216 ret = snprintf(ptr, len, "1 %s", buf);
217 ptr += ret;
218 len -= ret;
219
220 return params;
221 }
222
223 /* Table routine called to get params string. */
224 char *
225 dm_target_stripe_table(void *target_config)
226 {
227 dm_target_linear_config_t *tlc;
228 dm_target_stripe_config_t *tsc;
229 char *params, *tmp;
230
231 tsc = target_config;
232
233 params = kmem_alloc(DM_MAX_PARAMS_SIZE, KM_SLEEP);
234 tmp = kmem_alloc(DM_MAX_PARAMS_SIZE, KM_SLEEP);
235
236 snprintf(params, DM_MAX_PARAMS_SIZE, "%d %" PRIu64,
237 tsc->stripe_num, tsc->stripe_chunksize);
238
239 TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
240 snprintf(tmp, DM_MAX_PARAMS_SIZE, " %s %" PRIu64,
241 tlc->pdev->udev_name, tlc->offset);
242 strcat(params, tmp);
243 }
244
245 kmem_free(tmp, DM_MAX_PARAMS_SIZE);
246
247 return params;
248 }
249
250 /* Strategy routine called from dm_strategy. */
251 int
252 dm_target_stripe_strategy(dm_table_entry_t *table_en, struct buf *bp)
253 {
254 dm_target_linear_config_t *tlc;
255 dm_target_stripe_config_t *tsc;
256 struct buf *nestbuf;
257 uint64_t blkno, blkoff;
258 uint64_t stripe, stripe_blknr;
259 uint32_t stripe_off, stripe_rest, num_blks, issue_blks;
260 int i, stripe_devnr;
261
262 tsc = table_en->target_config;
263 if (tsc == NULL)
264 return 0;
265
266 /* calculate extent of request */
267 KASSERT(bp->b_resid % DEV_BSIZE == 0);
268
269 blkno = bp->b_blkno;
270 blkoff = 0;
271 num_blks = bp->b_resid / DEV_BSIZE;
272 for (;;) {
273 /* blockno to stripe piece nr */
274 stripe = blkno / tsc->stripe_chunksize;
275 stripe_off = blkno % tsc->stripe_chunksize;
276
277 /* where we are inside the stripe */
278 stripe_devnr = stripe % tsc->stripe_num;
279 stripe_blknr = stripe / tsc->stripe_num;
280
281 /* how much is left before we hit a boundary */
282 stripe_rest = tsc->stripe_chunksize - stripe_off;
283
284 /* issue this piece on stripe `stripe' */
285 issue_blks = MIN(stripe_rest, num_blks);
286 nestbuf = getiobuf(NULL, true);
287
288 nestiobuf_setup(bp, nestbuf, blkoff, issue_blks * DEV_BSIZE);
289 nestbuf->b_blkno = stripe_blknr * tsc->stripe_chunksize + stripe_off;
290
291 tlc = TAILQ_FIRST(&tsc->stripe_devs);
292 for (i = 0; i < stripe_devnr && tlc != NULL; i++)
293 tlc = TAILQ_NEXT(tlc, entries);
294
295 /* by this point we should have an tlc */
296 KASSERT(tlc != NULL);
297
298 nestbuf->b_blkno += tlc->offset;
299
300 VOP_STRATEGY(tlc->pdev->pdev_vnode, nestbuf);
301
302 blkno += issue_blks;
303 blkoff += issue_blks * DEV_BSIZE;
304 num_blks -= issue_blks;
305
306 if (num_blks <= 0)
307 break;
308 }
309
310 return 0;
311 }
312
313 /* Sync underlying disk caches. */
314 int
315 dm_target_stripe_sync(dm_table_entry_t *table_en)
316 {
317 int cmd, err;
318 dm_target_stripe_config_t *tsc;
319 dm_target_linear_config_t *tlc;
320
321 tsc = table_en->target_config;
322
323 err = 0;
324 cmd = 1;
325
326 TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
327 if ((err = VOP_IOCTL(tlc->pdev->pdev_vnode, DIOCCACHESYNC,
328 &cmd, FREAD|FWRITE, kauth_cred_get())) != 0)
329 return err;
330 }
331
332 return err;
333
334 }
335
336 /* Destroy target specific data. */
337 int
338 dm_target_stripe_destroy(dm_table_entry_t *table_en)
339 {
340
341 dm_target_stripe_fini(table_en->target_config);
342
343 /* Unbusy target so we can unload it */
344 dm_target_unbusy(table_en->target);
345
346 return 0;
347 }
348
#if 0
/*
 * Upcall hook.  Unsupported for this target; the whole definition is
 * compiled out and only kept as a placeholder.
 */
int
dm_target_stripe_upcall(dm_table_entry_t *table_en, struct buf *bp)
{
	(void)table_en;
	(void)bp;

	return 0;
}
#endif
358
359 /*
360 * Compute physical block size
361 * For a stripe target we chose the maximum sector size of all
362 * stripe devices. For the supported power-of-2 sizes this is equivalent
363 * to the least common multiple.
364 */
365 int
366 dm_target_stripe_secsize(dm_table_entry_t *table_en, unsigned int *secsizep)
367 {
368 dm_target_linear_config_t *tlc;
369 dm_target_stripe_config_t *tsc;
370 unsigned int secsize;
371
372 secsize = 0;
373
374 tsc = table_en->target_config;
375 if (tsc != NULL) {
376 TAILQ_FOREACH(tlc, &tsc->stripe_devs, entries) {
377 if (secsize < tlc->pdev->pdev_secsize)
378 secsize = tlc->pdev->pdev_secsize;
379 }
380 }
381
382 *secsizep = secsize;
383
384 return 0;
385 }
386