md.c revision 1.57 1 1.57 yamt /* $NetBSD: md.c,v 1.57 2009/01/13 13:35:52 yamt Exp $ */
2 1.1 gwr
3 1.1 gwr /*
4 1.1 gwr * Copyright (c) 1995 Gordon W. Ross, Leo Weppelman.
5 1.1 gwr * All rights reserved.
6 1.1 gwr *
7 1.1 gwr * Redistribution and use in source and binary forms, with or without
8 1.1 gwr * modification, are permitted provided that the following conditions
9 1.1 gwr * are met:
10 1.1 gwr * 1. Redistributions of source code must retain the above copyright
11 1.1 gwr * notice, this list of conditions and the following disclaimer.
12 1.1 gwr * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 gwr * notice, this list of conditions and the following disclaimer in the
14 1.1 gwr * documentation and/or other materials provided with the distribution.
15 1.1 gwr * 3. The name of the author may not be used to endorse or promote products
16 1.1 gwr * derived from this software without specific prior written permission.
17 1.1 gwr * 4. All advertising materials mentioning features or use of this software
18 1.1 gwr * must display the following acknowledgement:
19 1.1 gwr * This product includes software developed by
20 1.1 gwr * Gordon W. Ross and Leo Weppelman.
21 1.1 gwr *
22 1.1 gwr * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
23 1.1 gwr * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
24 1.1 gwr * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
25 1.1 gwr * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
26 1.1 gwr * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
27 1.1 gwr * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28 1.1 gwr * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29 1.1 gwr * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30 1.1 gwr * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
31 1.1 gwr * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 1.1 gwr */
33 1.1 gwr
34 1.1 gwr /*
35 1.11 pk * This implements a general-purpose memory-disk.
36 1.13 jeremy * See md.h for notes on the config types.
37 1.1 gwr *
38 1.1 gwr * Note that this driver provides the same functionality
39 1.1 gwr * as the MFS filesystem hack, but this is better because
40 1.1 gwr * you can use this for any filesystem type you'd like!
41 1.1 gwr *
42 1.1 gwr * Credit for most of the kmem ramdisk code goes to:
43 1.1 gwr * Leo Weppelman (atari) and Phil Nelson (pc532)
44 1.11 pk * Credit for the ideas behind the "user space memory" code goes
45 1.1 gwr * to the authors of the MFS implementation.
46 1.1 gwr */
47 1.27 lukem
48 1.27 lukem #include <sys/cdefs.h>
49 1.57 yamt __KERNEL_RCSID(0, "$NetBSD: md.c,v 1.57 2009/01/13 13:35:52 yamt Exp $");
50 1.16 mrg
51 1.19 jonathan #include "opt_md.h"
52 1.1 gwr
53 1.1 gwr #include <sys/param.h>
54 1.7 gwr #include <sys/kernel.h>
55 1.7 gwr #include <sys/malloc.h>
56 1.1 gwr #include <sys/systm.h>
57 1.1 gwr #include <sys/buf.h>
58 1.39 yamt #include <sys/bufq.h>
59 1.1 gwr #include <sys/device.h>
60 1.4 thorpej #include <sys/disk.h>
61 1.8 leo #include <sys/proc.h>
62 1.8 leo #include <sys/conf.h>
63 1.14 leo #include <sys/disklabel.h>
64 1.23 mrg
65 1.23 mrg #include <uvm/uvm_extern.h>
66 1.1 gwr
67 1.11 pk #include <dev/md.h>
68 1.1 gwr
69 1.1 gwr /*
70 1.49 dsl * The user-space functionality is included by default.
71 1.11 pk * Use `options MEMORY_DISK_SERVER=0' to turn it off.
72 1.1 gwr */
73 1.11 pk #ifndef MEMORY_DISK_SERVER
74 1.49 dsl #error MEMORY_DISK_SERVER should be defined by opt_md.h
75 1.33 atatat #endif /* MEMORY_DISK_SERVER */
76 1.1 gwr
/*
 * Map a dev_t to its md unit number.
 * Configuration ioctls are only accepted on the raw partition of a
 * unit; see the DISKPART() checks in mdopen() and mdioctl().
 */
#define MD_UNIT(unit)	DISKUNIT(unit)
81 1.1 gwr
82 1.1 gwr /* autoconfig stuff... */
83 1.1 gwr
/*
 * Per-unit driver state.
 */
struct md_softc {
	struct disk sc_dkdev;		/* hook for generic disk handling */
	struct md_conf sc_md;		/* current configuration: address, size, type */
	struct bufq_state *sc_buflist;	/* requests queued by mdstrategy() for md_server_loop() */
};
/* shorthand for fields in sc_md: */
#define sc_addr	sc_md.md_addr
#define sc_size	sc_md.md_size
#define sc_type	sc_md.md_type
93 1.1 gwr
/* Pseudo-device entry point; the argument is the number of units to attach. */
void	mdattach(int);

/* Per-unit attach routine, referenced by the CFATTACH_DECL_NEW() below. */
static void	md_attach(device_t, device_t, void *);

/* Entry points placed in the block/character device switches below. */
static dev_type_open(mdopen);
static dev_type_close(mdclose);
static dev_type_read(mdread);
static dev_type_write(mdwrite);
static dev_type_ioctl(mdioctl);
static dev_type_strategy(mdstrategy);
static dev_type_size(mdsize);
105 1.31 gehenna
/*
 * Block device switch for md.  No dump routine is provided (nodump).
 * The initializer is positional, so the order of the entries matters.
 */
const struct bdevsw md_bdevsw = {
	mdopen, mdclose, mdstrategy, mdioctl, nodump, mdsize, D_DISK
};
109 1.31 gehenna
/*
 * Character device switch for md.  Only open, close, read, write and
 * ioctl are implemented by this driver; the remaining slots are filled
 * with the no* placeholders.  The initializer is positional, so the
 * order of the entries matters.
 */
const struct cdevsw md_cdevsw = {
	mdopen, mdclose, mdread, mdwrite, mdioctl,
	nostop, notty, nopoll, nommap, nokqfilter, D_DISK
};
114 1.31 gehenna
/*
 * Driver hooks handed to disk_init() in md_attach(): only the strategy
 * routine is supplied, the second slot is left NULL.
 */
static struct dkdriver mddkdriver = { mdstrategy, NULL };
116 1.4 thorpej
/*
 * autoconf glue.  md_cd is defined elsewhere and is used here to look up
 * unit softcs.  The attachment declared below supplies md_attach as its
 * only function; the other three function slots are left empty.
 * NOTE(review): presumably this macro is what defines the md_ca object
 * that mdattach() registers -- confirm against the macro definition.
 */
extern struct cfdriver md_cd;
CFATTACH_DECL_NEW(md, sizeof(struct md_softc),
	0, md_attach, 0, NULL);
120 1.4 thorpej
121 1.7 gwr /*
122 1.7 gwr * This is called if we are configured as a pseudo-device
123 1.7 gwr */
124 1.7 gwr void
125 1.38 thorpej mdattach(int n)
126 1.1 gwr {
127 1.7 gwr int i;
128 1.54 cegger cfdata_t cf;
129 1.7 gwr
130 1.53 drochner if (config_cfattach_attach("md", &md_ca)) {
131 1.53 drochner printf("md: cfattach_attach failed\n");
132 1.7 gwr return;
133 1.7 gwr }
134 1.7 gwr
135 1.7 gwr /* XXX: Are we supposed to provide a default? */
136 1.7 gwr if (n <= 1)
137 1.7 gwr n = 1;
138 1.7 gwr
139 1.7 gwr /* Attach as if by autoconfig. */
140 1.7 gwr for (i = 0; i < n; i++) {
141 1.53 drochner cf = malloc(sizeof(*cf), M_DEVBUF, M_WAITOK);
142 1.53 drochner cf->cf_name = "md";
143 1.53 drochner cf->cf_atname = "md";
144 1.53 drochner cf->cf_unit = i;
145 1.53 drochner cf->cf_fstate = FSTATE_NOTFOUND;
146 1.54 cegger (void)config_attach_pseudo(cf);
147 1.7 gwr }
148 1.1 gwr }
149 1.1 gwr
150 1.1 gwr static void
151 1.54 cegger md_attach(device_t parent, device_t self,
152 1.47 christos void *aux)
153 1.1 gwr {
154 1.54 cegger struct md_softc *sc = device_private(self);
155 1.1 gwr
156 1.42 yamt bufq_alloc(&sc->sc_buflist, "fcfs", 0);
157 1.22 thorpej
158 1.1 gwr /* XXX - Could accept aux info here to set the config. */
159 1.11 pk #ifdef MEMORY_DISK_HOOKS
160 1.1 gwr /*
161 1.1 gwr * This external function might setup a pre-loaded disk.
162 1.11 pk * All it would need to do is setup the md_conf struct.
163 1.25 tsutsui * See sys/dev/md_root.c for an example.
164 1.1 gwr */
165 1.54 cegger md_attach_hook(device_unit(self), &sc->sc_md);
166 1.1 gwr #endif
167 1.4 thorpej
168 1.4 thorpej /*
169 1.4 thorpej * Initialize and attach the disk structure.
170 1.4 thorpej */
171 1.54 cegger disk_init(&sc->sc_dkdev, device_xname(self), &mddkdriver);
172 1.4 thorpej disk_attach(&sc->sc_dkdev);
173 1.55 cegger
174 1.55 cegger if (!pmf_device_register(self, NULL, NULL))
175 1.55 cegger aprint_error_dev(self, "couldn't establish power handler\n");
176 1.1 gwr }
177 1.1 gwr
178 1.1 gwr /*
179 1.1 gwr * operational routines:
180 1.1 gwr * open, close, read, write, strategy,
181 1.1 gwr * ioctl, dump, size
182 1.1 gwr */
183 1.1 gwr
/*
 * Helpers for the MD_SETCONF ioctl.  The two server routines exist only
 * when the user-space server support is compiled in.
 */
#if MEMORY_DISK_SERVER
static int	md_server_loop(struct md_softc *sc);
static int	md_ioctl_server(struct md_softc *sc, struct md_conf *umd,
		    struct lwp *l);
#endif	/* MEMORY_DISK_SERVER */
static int	md_ioctl_kalloc(struct md_softc *sc, struct md_conf *umd,
		    struct lwp *l);
191 1.1 gwr
192 1.38 thorpej static int
193 1.21 tsutsui mdsize(dev_t dev)
194 1.1 gwr {
195 1.11 pk struct md_softc *sc;
196 1.1 gwr
197 1.54 cegger sc = device_lookup_private(&md_cd, MD_UNIT(dev));
198 1.1 gwr if (sc == NULL)
199 1.1 gwr return 0;
200 1.1 gwr
201 1.11 pk if (sc->sc_type == MD_UNCONFIGURED)
202 1.1 gwr return 0;
203 1.1 gwr
204 1.1 gwr return (sc->sc_size >> DEV_BSHIFT);
205 1.1 gwr }
206 1.1 gwr
207 1.38 thorpej static int
208 1.47 christos mdopen(dev_t dev, int flag, int fmt, struct lwp *l)
209 1.1 gwr {
210 1.21 tsutsui int unit;
211 1.11 pk struct md_softc *sc;
212 1.1 gwr
213 1.21 tsutsui unit = MD_UNIT(dev);
214 1.53 drochner sc = device_lookup_private(&md_cd, unit);
215 1.1 gwr if (sc == NULL)
216 1.1 gwr return ENXIO;
217 1.1 gwr
218 1.1 gwr /*
219 1.21 tsutsui * The raw partition is used for ioctl to configure.
220 1.1 gwr */
221 1.21 tsutsui if (DISKPART(dev) == RAW_PART)
222 1.1 gwr return 0;
223 1.1 gwr
224 1.11 pk #ifdef MEMORY_DISK_HOOKS
225 1.1 gwr /* Call the open hook to allow loading the device. */
226 1.11 pk md_open_hook(unit, &sc->sc_md);
227 1.1 gwr #endif
228 1.1 gwr
229 1.1 gwr /*
230 1.1 gwr * This is a normal, "slave" device, so
231 1.21 tsutsui * enforce initialized.
232 1.1 gwr */
233 1.11 pk if (sc->sc_type == MD_UNCONFIGURED)
234 1.1 gwr return ENXIO;
235 1.1 gwr
236 1.1 gwr return 0;
237 1.1 gwr }
238 1.1 gwr
239 1.38 thorpej static int
240 1.47 christos mdclose(dev_t dev, int flag, int fmt, struct lwp *l)
241 1.1 gwr {
242 1.1 gwr
243 1.1 gwr return 0;
244 1.1 gwr }
245 1.1 gwr
246 1.38 thorpej static int
247 1.47 christos mdread(dev_t dev, struct uio *uio, int flags)
248 1.1 gwr {
249 1.21 tsutsui struct md_softc *sc;
250 1.21 tsutsui
251 1.54 cegger sc = device_lookup_private(&md_cd, MD_UNIT(dev));
252 1.21 tsutsui
253 1.21 tsutsui if (sc->sc_type == MD_UNCONFIGURED)
254 1.21 tsutsui return ENXIO;
255 1.21 tsutsui
256 1.11 pk return (physio(mdstrategy, NULL, dev, B_READ, minphys, uio));
257 1.1 gwr }
258 1.1 gwr
259 1.38 thorpej static int
260 1.47 christos mdwrite(dev_t dev, struct uio *uio, int flags)
261 1.1 gwr {
262 1.21 tsutsui struct md_softc *sc;
263 1.21 tsutsui
264 1.54 cegger sc = device_lookup_private(&md_cd, MD_UNIT(dev));
265 1.21 tsutsui
266 1.21 tsutsui if (sc->sc_type == MD_UNCONFIGURED)
267 1.21 tsutsui return ENXIO;
268 1.21 tsutsui
269 1.11 pk return (physio(mdstrategy, NULL, dev, B_WRITE, minphys, uio));
270 1.1 gwr }
271 1.1 gwr
272 1.1 gwr /*
273 1.1 gwr * Handle I/O requests, either directly, or
274 1.1 gwr * by passing them to the server process.
275 1.1 gwr */
276 1.38 thorpej static void
277 1.38 thorpej mdstrategy(struct buf *bp)
278 1.1 gwr {
279 1.11 pk struct md_softc *sc;
280 1.48 christos void * addr;
281 1.21 tsutsui size_t off, xfer;
282 1.1 gwr
283 1.54 cegger sc = device_lookup_private(&md_cd, MD_UNIT(bp->b_dev));
284 1.1 gwr
285 1.21 tsutsui if (sc->sc_type == MD_UNCONFIGURED) {
286 1.21 tsutsui bp->b_error = ENXIO;
287 1.21 tsutsui goto done;
288 1.21 tsutsui }
289 1.21 tsutsui
290 1.1 gwr switch (sc->sc_type) {
291 1.11 pk #if MEMORY_DISK_SERVER
292 1.11 pk case MD_UMEM_SERVER:
293 1.1 gwr /* Just add this job to the server's queue. */
294 1.57 yamt bufq_put(sc->sc_buflist, bp);
295 1.48 christos wakeup((void *)sc);
296 1.29 hannken /* see md_server_loop() */
297 1.1 gwr /* no biodone in this case */
298 1.1 gwr return;
299 1.11 pk #endif /* MEMORY_DISK_SERVER */
300 1.1 gwr
301 1.11 pk case MD_KMEM_FIXED:
302 1.11 pk case MD_KMEM_ALLOCATED:
303 1.1 gwr /* These are in kernel space. Access directly. */
304 1.1 gwr bp->b_resid = bp->b_bcount;
305 1.1 gwr off = (bp->b_blkno << DEV_BSHIFT);
306 1.1 gwr if (off >= sc->sc_size) {
307 1.1 gwr if (bp->b_flags & B_READ)
308 1.1 gwr break; /* EOF */
309 1.1 gwr goto set_eio;
310 1.1 gwr }
311 1.1 gwr xfer = bp->b_resid;
312 1.1 gwr if (xfer > (sc->sc_size - off))
313 1.1 gwr xfer = (sc->sc_size - off);
314 1.48 christos addr = (char *)sc->sc_addr + off;
315 1.1 gwr if (bp->b_flags & B_READ)
316 1.26 thorpej memcpy(bp->b_data, addr, xfer);
317 1.1 gwr else
318 1.26 thorpej memcpy(addr, bp->b_data, xfer);
319 1.1 gwr bp->b_resid -= xfer;
320 1.1 gwr break;
321 1.1 gwr
322 1.1 gwr default:
323 1.1 gwr bp->b_resid = bp->b_bcount;
324 1.1 gwr set_eio:
325 1.1 gwr bp->b_error = EIO;
326 1.1 gwr break;
327 1.1 gwr }
328 1.21 tsutsui done:
329 1.1 gwr biodone(bp);
330 1.1 gwr }
331 1.1 gwr
332 1.38 thorpej static int
333 1.48 christos mdioctl(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
334 1.1 gwr {
335 1.21 tsutsui struct md_softc *sc;
336 1.21 tsutsui struct md_conf *umd;
337 1.1 gwr
338 1.54 cegger sc = device_lookup_private(&md_cd, MD_UNIT(dev));
339 1.1 gwr
340 1.21 tsutsui /* If this is not the raw partition, punt! */
341 1.21 tsutsui if (DISKPART(dev) != RAW_PART)
342 1.1 gwr return ENOTTY;
343 1.1 gwr
344 1.11 pk umd = (struct md_conf *)data;
345 1.1 gwr switch (cmd) {
346 1.11 pk case MD_GETCONF:
347 1.11 pk *umd = sc->sc_md;
348 1.1 gwr return 0;
349 1.1 gwr
350 1.11 pk case MD_SETCONF:
351 1.1 gwr /* Can only set it once. */
352 1.11 pk if (sc->sc_type != MD_UNCONFIGURED)
353 1.1 gwr break;
354 1.11 pk switch (umd->md_type) {
355 1.11 pk case MD_KMEM_ALLOCATED:
356 1.43 christos return md_ioctl_kalloc(sc, umd, l);
357 1.11 pk #if MEMORY_DISK_SERVER
358 1.11 pk case MD_UMEM_SERVER:
359 1.43 christos return md_ioctl_server(sc, umd, l);
360 1.33 atatat #endif /* MEMORY_DISK_SERVER */
361 1.1 gwr default:
362 1.1 gwr break;
363 1.1 gwr }
364 1.1 gwr break;
365 1.1 gwr }
366 1.1 gwr return EINVAL;
367 1.1 gwr }
368 1.1 gwr
369 1.1 gwr /*
370 1.11 pk * Handle ioctl MD_SETCONF for (sc_type == MD_KMEM_ALLOCATED)
371 1.1 gwr * Just allocate some kernel memory and return.
372 1.1 gwr */
373 1.8 leo static int
374 1.46 christos md_ioctl_kalloc(struct md_softc *sc, struct md_conf *umd,
375 1.47 christos struct lwp *l)
376 1.1 gwr {
377 1.17 eeh vaddr_t addr;
378 1.21 tsutsui vsize_t size;
379 1.1 gwr
380 1.1 gwr /* Sanity check the size. */
381 1.11 pk size = umd->md_size;
382 1.41 yamt addr = uvm_km_alloc(kernel_map, size, 0, UVM_KMF_WIRED|UVM_KMF_ZERO);
383 1.1 gwr if (!addr)
384 1.1 gwr return ENOMEM;
385 1.1 gwr
386 1.1 gwr /* This unit is now configured. */
387 1.48 christos sc->sc_addr = (void *)addr; /* kernel space */
388 1.1 gwr sc->sc_size = (size_t)size;
389 1.11 pk sc->sc_type = MD_KMEM_ALLOCATED;
390 1.1 gwr return 0;
391 1.40 perry }
392 1.1 gwr
393 1.11 pk #if MEMORY_DISK_SERVER
394 1.1 gwr
395 1.1 gwr /*
396 1.11 pk * Handle ioctl MD_SETCONF for (sc_type == MD_UMEM_SERVER)
397 1.1 gwr * Set config, then become the I/O server for this unit.
398 1.1 gwr */
399 1.8 leo static int
400 1.46 christos md_ioctl_server(struct md_softc *sc, struct md_conf *umd,
401 1.47 christos struct lwp *l)
402 1.1 gwr {
403 1.17 eeh vaddr_t end;
404 1.1 gwr int error;
405 1.1 gwr
406 1.1 gwr /* Sanity check addr, size. */
407 1.48 christos end = (vaddr_t) ((char *)umd->md_addr + umd->md_size);
408 1.1 gwr
409 1.1 gwr if ((end >= VM_MAXUSER_ADDRESS) ||
410 1.17 eeh (end < ((vaddr_t) umd->md_addr)) )
411 1.1 gwr return EINVAL;
412 1.1 gwr
413 1.1 gwr /* This unit is now configured. */
414 1.11 pk sc->sc_addr = umd->md_addr; /* user space */
415 1.11 pk sc->sc_size = umd->md_size;
416 1.11 pk sc->sc_type = MD_UMEM_SERVER;
417 1.1 gwr
418 1.1 gwr /* Become the server daemon */
419 1.11 pk error = md_server_loop(sc);
420 1.1 gwr
421 1.1 gwr /* This server is now going away! */
422 1.11 pk sc->sc_type = MD_UNCONFIGURED;
423 1.1 gwr sc->sc_addr = 0;
424 1.1 gwr sc->sc_size = 0;
425 1.1 gwr
426 1.1 gwr return (error);
427 1.40 perry }
428 1.1 gwr
429 1.38 thorpej static int md_sleep_pri = PWAIT | PCATCH;
430 1.1 gwr
431 1.1 gwr static int
432 1.38 thorpej md_server_loop(struct md_softc *sc)
433 1.1 gwr {
434 1.1 gwr struct buf *bp;
435 1.48 christos void *addr; /* user space address */
436 1.21 tsutsui size_t off; /* offset into "device" */
437 1.21 tsutsui size_t xfer; /* amount to transfer */
438 1.1 gwr int error;
439 1.1 gwr
440 1.1 gwr for (;;) {
441 1.1 gwr /* Wait for some work to arrive. */
442 1.57 yamt while ((bp = bufq_get(sc->sc_buflist)) == NULL) {
443 1.48 christos error = tsleep((void *)sc, md_sleep_pri, "md_idle", 0);
444 1.1 gwr if (error)
445 1.1 gwr return error;
446 1.1 gwr }
447 1.1 gwr
448 1.1 gwr /* Do the transfer to/from user space. */
449 1.1 gwr error = 0;
450 1.1 gwr bp->b_resid = bp->b_bcount;
451 1.1 gwr off = (bp->b_blkno << DEV_BSHIFT);
452 1.1 gwr if (off >= sc->sc_size) {
453 1.1 gwr if (bp->b_flags & B_READ)
454 1.1 gwr goto done; /* EOF (not an error) */
455 1.1 gwr error = EIO;
456 1.1 gwr goto done;
457 1.1 gwr }
458 1.1 gwr xfer = bp->b_resid;
459 1.1 gwr if (xfer > (sc->sc_size - off))
460 1.1 gwr xfer = (sc->sc_size - off);
461 1.48 christos addr = (char *)sc->sc_addr + off;
462 1.1 gwr if (bp->b_flags & B_READ)
463 1.1 gwr error = copyin(addr, bp->b_data, xfer);
464 1.1 gwr else
465 1.1 gwr error = copyout(bp->b_data, addr, xfer);
466 1.1 gwr if (!error)
467 1.1 gwr bp->b_resid -= xfer;
468 1.1 gwr
469 1.1 gwr done:
470 1.1 gwr if (error) {
471 1.1 gwr bp->b_error = error;
472 1.1 gwr }
473 1.1 gwr biodone(bp);
474 1.1 gwr }
475 1.1 gwr }
476 1.11 pk #endif /* MEMORY_DISK_SERVER */
477