ld.c revision 1.62 1 1.62 simonb /* $NetBSD: ld.c,v 1.62 2008/08/11 06:43:37 simonb Exp $ */
2 1.1 ad
3 1.1 ad /*-
4 1.1 ad * Copyright (c) 1998, 2000 The NetBSD Foundation, Inc.
5 1.1 ad * All rights reserved.
6 1.1 ad *
7 1.1 ad * This code is derived from software contributed to The NetBSD Foundation
8 1.1 ad * by Andrew Doran and Charles M. Hannum.
9 1.1 ad *
10 1.1 ad * Redistribution and use in source and binary forms, with or without
11 1.1 ad * modification, are permitted provided that the following conditions
12 1.1 ad * are met:
13 1.1 ad * 1. Redistributions of source code must retain the above copyright
14 1.1 ad * notice, this list of conditions and the following disclaimer.
15 1.1 ad * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 ad * notice, this list of conditions and the following disclaimer in the
17 1.1 ad * documentation and/or other materials provided with the distribution.
18 1.1 ad *
19 1.1 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 ad * POSSIBILITY OF SUCH DAMAGE.
30 1.1 ad */
31 1.1 ad
32 1.1 ad /*
33 1.1 ad * Disk driver for use by RAID controllers.
34 1.1 ad */
35 1.12 lukem
36 1.12 lukem #include <sys/cdefs.h>
37 1.62 simonb __KERNEL_RCSID(0, "$NetBSD: ld.c,v 1.62 2008/08/11 06:43:37 simonb Exp $");
38 1.1 ad
39 1.1 ad #include "rnd.h"
40 1.1 ad
41 1.1 ad #include <sys/param.h>
42 1.1 ad #include <sys/systm.h>
43 1.1 ad #include <sys/kernel.h>
44 1.1 ad #include <sys/device.h>
45 1.1 ad #include <sys/queue.h>
46 1.1 ad #include <sys/proc.h>
47 1.1 ad #include <sys/buf.h>
48 1.33 yamt #include <sys/bufq.h>
49 1.1 ad #include <sys/endian.h>
50 1.1 ad #include <sys/disklabel.h>
51 1.1 ad #include <sys/disk.h>
52 1.1 ad #include <sys/dkio.h>
53 1.1 ad #include <sys/stat.h>
54 1.1 ad #include <sys/conf.h>
55 1.1 ad #include <sys/fcntl.h>
56 1.2 ad #include <sys/vnode.h>
57 1.1 ad #include <sys/syslog.h>
58 1.44 ad #include <sys/mutex.h>
59 1.1 ad #if NRND > 0
60 1.1 ad #include <sys/rnd.h>
61 1.1 ad #endif
62 1.1 ad
63 1.1 ad #include <dev/ldvar.h>
64 1.1 ad
65 1.43 riz #include <prop/proplib.h>
66 1.43 riz
67 1.1 ad static void ldgetdefaultlabel(struct ld_softc *, struct disklabel *);
68 1.1 ad static void ldgetdisklabel(struct ld_softc *);
69 1.1 ad static void ldminphys(struct buf *bp);
70 1.55 jmcneill static bool ld_shutdown(device_t, int);
71 1.44 ad static void ldstart(struct ld_softc *, struct buf *);
72 1.43 riz static void ld_set_properties(struct ld_softc *);
73 1.45 riz static void ld_config_interrupts (struct device *);
74 1.1 ad
75 1.1 ad extern struct cfdriver ld_cd;
76 1.1 ad
77 1.29 thorpej static dev_type_open(ldopen);
78 1.29 thorpej static dev_type_close(ldclose);
79 1.29 thorpej static dev_type_read(ldread);
80 1.29 thorpej static dev_type_write(ldwrite);
81 1.29 thorpej static dev_type_ioctl(ldioctl);
82 1.29 thorpej static dev_type_strategy(ldstrategy);
83 1.29 thorpej static dev_type_dump(lddump);
84 1.29 thorpej static dev_type_size(ldsize);
85 1.16 gehenna
86 1.16 gehenna const struct bdevsw ld_bdevsw = {
87 1.16 gehenna ldopen, ldclose, ldstrategy, ldioctl, lddump, ldsize, D_DISK
88 1.16 gehenna };
89 1.16 gehenna
90 1.16 gehenna const struct cdevsw ld_cdevsw = {
91 1.16 gehenna ldopen, ldclose, ldread, ldwrite, ldioctl,
92 1.17 jdolecek nostop, notty, nopoll, nommap, nokqfilter, D_DISK
93 1.16 gehenna };
94 1.16 gehenna
95 1.30 thorpej static struct dkdriver lddkdriver = { ldstrategy, ldminphys };
96 1.1 ad
97 1.1 ad void
98 1.1 ad ldattach(struct ld_softc *sc)
99 1.1 ad {
100 1.37 christos char tbuf[9];
101 1.1 ad
102 1.53 ad mutex_init(&sc->sc_mutex, MUTEX_DEFAULT, IPL_VM);
103 1.44 ad
104 1.7 ad if ((sc->sc_flags & LDF_ENABLED) == 0) {
105 1.57 cegger aprint_normal_dev(&sc->sc_dv, "disabled\n");
106 1.7 ad return;
107 1.7 ad }
108 1.7 ad
109 1.1 ad /* Initialise and attach the disk structure. */
110 1.57 cegger disk_init(&sc->sc_dk, device_xname(&sc->sc_dv), &lddkdriver);
111 1.1 ad disk_attach(&sc->sc_dk);
112 1.1 ad
113 1.1 ad if (sc->sc_maxxfer > MAXPHYS)
114 1.1 ad sc->sc_maxxfer = MAXPHYS;
115 1.9 ad
116 1.19 thorpej /* Build synthetic geometry if necessary. */
117 1.19 thorpej if (sc->sc_nheads == 0 || sc->sc_nsectors == 0 ||
118 1.19 thorpej sc->sc_ncylinders == 0) {
119 1.28 dbj uint64_t ncyl;
120 1.28 dbj
121 1.19 thorpej if (sc->sc_secperunit <= 528 * 2048) /* 528MB */
122 1.19 thorpej sc->sc_nheads = 16;
123 1.19 thorpej else if (sc->sc_secperunit <= 1024 * 2048) /* 1GB */
124 1.19 thorpej sc->sc_nheads = 32;
125 1.19 thorpej else if (sc->sc_secperunit <= 21504 * 2048) /* 21GB */
126 1.19 thorpej sc->sc_nheads = 64;
127 1.19 thorpej else if (sc->sc_secperunit <= 43008 * 2048) /* 42GB */
128 1.19 thorpej sc->sc_nheads = 128;
129 1.19 thorpej else
130 1.19 thorpej sc->sc_nheads = 255;
131 1.19 thorpej
132 1.19 thorpej sc->sc_nsectors = 63;
133 1.28 dbj sc->sc_ncylinders = INT_MAX;
134 1.35 perry ncyl = sc->sc_secperunit /
135 1.19 thorpej (sc->sc_nheads * sc->sc_nsectors);
136 1.28 dbj if (ncyl < INT_MAX)
137 1.28 dbj sc->sc_ncylinders = (int)ncyl;
138 1.19 thorpej }
139 1.1 ad
140 1.37 christos format_bytes(tbuf, sizeof(tbuf), sc->sc_secperunit *
141 1.1 ad sc->sc_secsize);
142 1.57 cegger aprint_normal_dev(&sc->sc_dv, "%s, %d cyl, %d head, %d sec, %d bytes/sect x %"PRIu64" sectors\n",
143 1.57 cegger tbuf, sc->sc_ncylinders, sc->sc_nheads,
144 1.1 ad sc->sc_nsectors, sc->sc_secsize, sc->sc_secperunit);
145 1.1 ad
146 1.43 riz ld_set_properties(sc);
147 1.43 riz
148 1.1 ad #if NRND > 0
149 1.1 ad /* Attach the device into the rnd source list. */
150 1.57 cegger rnd_attach_source(&sc->sc_rnd_source, device_xname(&sc->sc_dv),
151 1.1 ad RND_TYPE_DISK, 0);
152 1.1 ad #endif
153 1.1 ad
154 1.55 jmcneill /* Register with PMF */
155 1.55 jmcneill if (!pmf_device_register1(&sc->sc_dv, NULL, NULL, ld_shutdown))
156 1.55 jmcneill aprint_error_dev(&sc->sc_dv,
157 1.55 jmcneill "couldn't establish power handler\n");
158 1.55 jmcneill
159 1.38 yamt bufq_alloc(&sc->sc_bufq, BUFQ_DISK_DEFAULT_STRAT, BUFQ_SORT_RAWBLOCK);
160 1.30 thorpej
161 1.30 thorpej /* Discover wedges on this disk. */
162 1.45 riz config_interrupts(&sc->sc_dv, ld_config_interrupts);
163 1.1 ad }
164 1.1 ad
165 1.3 ad int
166 1.37 christos ldadjqparam(struct ld_softc *sc, int xmax)
167 1.3 ad {
168 1.24 thorpej int s;
169 1.7 ad
170 1.7 ad s = splbio();
171 1.37 christos sc->sc_maxqueuecnt = xmax;
172 1.7 ad splx(s);
173 1.7 ad
174 1.24 thorpej return (0);
175 1.7 ad }
176 1.7 ad
177 1.7 ad int
178 1.7 ad ldbegindetach(struct ld_softc *sc, int flags)
179 1.7 ad {
180 1.24 thorpej int s, rv = 0;
181 1.7 ad
182 1.7 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
183 1.7 ad return (0);
184 1.3 ad
185 1.3 ad if ((flags & DETACH_FORCE) == 0 && sc->sc_dk.dk_openmask != 0)
186 1.3 ad return (EBUSY);
187 1.3 ad
188 1.3 ad s = splbio();
189 1.24 thorpej sc->sc_maxqueuecnt = 0;
190 1.7 ad sc->sc_flags |= LDF_DETACH;
191 1.24 thorpej while (sc->sc_queuecnt > 0) {
192 1.24 thorpej sc->sc_flags |= LDF_DRAIN;
193 1.24 thorpej rv = tsleep(&sc->sc_queuecnt, PRIBIO, "lddrn", 0);
194 1.24 thorpej if (rv)
195 1.24 thorpej break;
196 1.24 thorpej }
197 1.3 ad splx(s);
198 1.7 ad
199 1.7 ad return (rv);
200 1.3 ad }
201 1.3 ad
202 1.2 ad void
203 1.7 ad ldenddetach(struct ld_softc *sc)
204 1.2 ad {
205 1.13 drochner int s, bmaj, cmaj, i, mn;
206 1.2 ad
207 1.7 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
208 1.7 ad return;
209 1.7 ad
210 1.2 ad /* Wait for commands queued with the hardware to complete. */
211 1.2 ad if (sc->sc_queuecnt != 0)
212 1.7 ad if (tsleep(&sc->sc_queuecnt, PRIBIO, "lddtch", 30 * hz))
213 1.57 cegger printf("%s: not drained\n", device_xname(&sc->sc_dv));
214 1.2 ad
215 1.2 ad /* Locate the major numbers. */
216 1.16 gehenna bmaj = bdevsw_lookup_major(&ld_bdevsw);
217 1.16 gehenna cmaj = cdevsw_lookup_major(&ld_cdevsw);
218 1.2 ad
219 1.2 ad /* Kill off any queued buffers. */
220 1.2 ad s = splbio();
221 1.38 yamt bufq_drain(sc->sc_bufq);
222 1.36 yamt splx(s);
223 1.36 yamt
224 1.38 yamt bufq_free(sc->sc_bufq);
225 1.2 ad
226 1.2 ad /* Nuke the vnodes for any open instances. */
227 1.13 drochner for (i = 0; i < MAXPARTITIONS; i++) {
228 1.40 thorpej mn = DISKMINOR(device_unit(&sc->sc_dv), i);
229 1.13 drochner vdevgone(bmaj, mn, mn, VBLK);
230 1.13 drochner vdevgone(cmaj, mn, mn, VCHR);
231 1.13 drochner }
232 1.13 drochner
233 1.30 thorpej /* Delete all of our wedges. */
234 1.30 thorpej dkwedge_delall(&sc->sc_dk);
235 1.30 thorpej
236 1.2 ad /* Detach from the disk list. */
237 1.2 ad disk_detach(&sc->sc_dk);
238 1.50 ad disk_destroy(&sc->sc_dk);
239 1.2 ad
240 1.2 ad #if NRND > 0
241 1.2 ad /* Unhook the entropy source. */
242 1.2 ad rnd_detach_source(&sc->sc_rnd_source);
243 1.2 ad #endif
244 1.2 ad
245 1.56 jmcneill /* Deregister with PMF */
246 1.56 jmcneill pmf_device_deregister(&sc->sc_dv);
247 1.56 jmcneill
248 1.24 thorpej /*
249 1.24 thorpej * XXX We can't really flush the cache here, beceause the
250 1.24 thorpej * XXX device may already be non-existent from the controller's
251 1.24 thorpej * XXX perspective.
252 1.24 thorpej */
253 1.24 thorpej #if 0
254 1.2 ad /* Flush the device's cache. */
255 1.2 ad if (sc->sc_flush != NULL)
256 1.62 simonb if ((*sc->sc_flush)(sc, 0) != 0)
257 1.57 cegger aprint_error_dev(&sc->sc_dv, "unable to flush cache\n");
258 1.24 thorpej #endif
259 1.61 ws mutex_destroy(&sc->sc_mutex);
260 1.2 ad }
261 1.2 ad
262 1.8 lukem /* ARGSUSED */
263 1.55 jmcneill static bool
264 1.55 jmcneill ld_shutdown(device_t dev, int flags)
265 1.1 ad {
266 1.55 jmcneill struct ld_softc *sc = device_private(dev);
267 1.1 ad
268 1.62 simonb if (sc->sc_flush != NULL && (*sc->sc_flush)(sc, LDFL_POLL) != 0) {
269 1.55 jmcneill printf("%s: unable to flush cache\n", device_xname(dev));
270 1.55 jmcneill return false;
271 1.1 ad }
272 1.55 jmcneill
273 1.55 jmcneill return true;
274 1.1 ad }
275 1.1 ad
276 1.8 lukem /* ARGSUSED */
277 1.29 thorpej static int
278 1.42 christos ldopen(dev_t dev, int flags, int fmt, struct lwp *l)
279 1.1 ad {
280 1.1 ad struct ld_softc *sc;
281 1.30 thorpej int error, unit, part;
282 1.1 ad
283 1.1 ad unit = DISKUNIT(dev);
284 1.59 tsutsui if ((sc = device_lookup_private(&ld_cd, unit)) == NULL)
285 1.1 ad return (ENXIO);
286 1.1 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
287 1.1 ad return (ENODEV);
288 1.1 ad part = DISKPART(dev);
289 1.30 thorpej
290 1.48 ad mutex_enter(&sc->sc_dk.dk_openlock);
291 1.1 ad
292 1.22 thorpej if (sc->sc_dk.dk_openmask == 0) {
293 1.22 thorpej /* Load the partition info if not already loaded. */
294 1.22 thorpej if ((sc->sc_flags & LDF_VLABEL) == 0)
295 1.22 thorpej ldgetdisklabel(sc);
296 1.22 thorpej }
297 1.1 ad
298 1.1 ad /* Check that the partition exists. */
299 1.1 ad if (part != RAW_PART && (part >= sc->sc_dk.dk_label->d_npartitions ||
300 1.1 ad sc->sc_dk.dk_label->d_partitions[part].p_fstype == FS_UNUSED)) {
301 1.30 thorpej error = ENXIO;
302 1.30 thorpej goto bad1;
303 1.1 ad }
304 1.1 ad
305 1.1 ad /* Ensure only one open at a time. */
306 1.1 ad switch (fmt) {
307 1.1 ad case S_IFCHR:
308 1.1 ad sc->sc_dk.dk_copenmask |= (1 << part);
309 1.1 ad break;
310 1.1 ad case S_IFBLK:
311 1.1 ad sc->sc_dk.dk_bopenmask |= (1 << part);
312 1.1 ad break;
313 1.1 ad }
314 1.1 ad sc->sc_dk.dk_openmask =
315 1.1 ad sc->sc_dk.dk_copenmask | sc->sc_dk.dk_bopenmask;
316 1.1 ad
317 1.48 ad error = 0;
318 1.30 thorpej bad1:
319 1.48 ad mutex_exit(&sc->sc_dk.dk_openlock);
320 1.30 thorpej return (error);
321 1.1 ad }
322 1.1 ad
323 1.8 lukem /* ARGSUSED */
324 1.29 thorpej static int
325 1.42 christos ldclose(dev_t dev, int flags, int fmt, struct lwp *l)
326 1.1 ad {
327 1.1 ad struct ld_softc *sc;
328 1.48 ad int part, unit;
329 1.1 ad
330 1.1 ad unit = DISKUNIT(dev);
331 1.1 ad part = DISKPART(dev);
332 1.59 tsutsui sc = device_lookup_private(&ld_cd, unit);
333 1.30 thorpej
334 1.48 ad mutex_enter(&sc->sc_dk.dk_openlock);
335 1.1 ad
336 1.1 ad switch (fmt) {
337 1.1 ad case S_IFCHR:
338 1.1 ad sc->sc_dk.dk_copenmask &= ~(1 << part);
339 1.1 ad break;
340 1.1 ad case S_IFBLK:
341 1.1 ad sc->sc_dk.dk_bopenmask &= ~(1 << part);
342 1.1 ad break;
343 1.1 ad }
344 1.1 ad sc->sc_dk.dk_openmask =
345 1.1 ad sc->sc_dk.dk_copenmask | sc->sc_dk.dk_bopenmask;
346 1.1 ad
347 1.22 thorpej if (sc->sc_dk.dk_openmask == 0) {
348 1.62 simonb if (sc->sc_flush != NULL && (*sc->sc_flush)(sc, 0) != 0)
349 1.57 cegger aprint_error_dev(&sc->sc_dv, "unable to flush cache\n");
350 1.22 thorpej if ((sc->sc_flags & LDF_KLABEL) == 0)
351 1.22 thorpej sc->sc_flags &= ~LDF_VLABEL;
352 1.22 thorpej }
353 1.1 ad
354 1.48 ad mutex_exit(&sc->sc_dk.dk_openlock);
355 1.1 ad return (0);
356 1.1 ad }
357 1.1 ad
358 1.8 lukem /* ARGSUSED */
359 1.29 thorpej static int
360 1.42 christos ldread(dev_t dev, struct uio *uio, int ioflag)
361 1.1 ad {
362 1.1 ad
363 1.1 ad return (physio(ldstrategy, NULL, dev, B_READ, ldminphys, uio));
364 1.1 ad }
365 1.1 ad
366 1.8 lukem /* ARGSUSED */
367 1.29 thorpej static int
368 1.42 christos ldwrite(dev_t dev, struct uio *uio, int ioflag)
369 1.1 ad {
370 1.1 ad
371 1.1 ad return (physio(ldstrategy, NULL, dev, B_WRITE, ldminphys, uio));
372 1.1 ad }
373 1.1 ad
374 1.8 lukem /* ARGSUSED */
375 1.29 thorpej static int
376 1.46 christos ldioctl(dev_t dev, u_long cmd, void *addr, int32_t flag, struct lwp *l)
377 1.1 ad {
378 1.1 ad struct ld_softc *sc;
379 1.52 xtraeme int part, unit, error;
380 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
381 1.6 itojun struct disklabel newlabel;
382 1.4 fvdl #endif
383 1.6 itojun struct disklabel *lp;
384 1.1 ad
385 1.1 ad unit = DISKUNIT(dev);
386 1.1 ad part = DISKPART(dev);
387 1.59 tsutsui sc = device_lookup_private(&ld_cd, unit);
388 1.1 ad
389 1.43 riz error = disk_ioctl(&sc->sc_dk, cmd, addr, flag, l);
390 1.43 riz if (error != EPASSTHROUGH)
391 1.43 riz return (error);
392 1.43 riz
393 1.47 tron error = 0;
394 1.1 ad switch (cmd) {
395 1.1 ad case DIOCGDINFO:
396 1.1 ad memcpy(addr, sc->sc_dk.dk_label, sizeof(struct disklabel));
397 1.1 ad return (0);
398 1.1 ad
399 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
400 1.4 fvdl case ODIOCGDINFO:
401 1.4 fvdl newlabel = *(sc->sc_dk.dk_label);
402 1.4 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
403 1.5 fvdl return ENOTTY;
404 1.4 fvdl memcpy(addr, &newlabel, sizeof(struct olddisklabel));
405 1.4 fvdl return (0);
406 1.4 fvdl #endif
407 1.4 fvdl
408 1.1 ad case DIOCGPART:
409 1.1 ad ((struct partinfo *)addr)->disklab = sc->sc_dk.dk_label;
410 1.1 ad ((struct partinfo *)addr)->part =
411 1.1 ad &sc->sc_dk.dk_label->d_partitions[part];
412 1.1 ad break;
413 1.1 ad
414 1.1 ad case DIOCWDINFO:
415 1.1 ad case DIOCSDINFO:
416 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
417 1.4 fvdl case ODIOCWDINFO:
418 1.4 fvdl case ODIOCSDINFO:
419 1.4 fvdl
420 1.4 fvdl if (cmd == ODIOCSDINFO || cmd == ODIOCWDINFO) {
421 1.4 fvdl memset(&newlabel, 0, sizeof newlabel);
422 1.4 fvdl memcpy(&newlabel, addr, sizeof (struct olddisklabel));
423 1.4 fvdl lp = &newlabel;
424 1.4 fvdl } else
425 1.4 fvdl #endif
426 1.4 fvdl lp = (struct disklabel *)addr;
427 1.4 fvdl
428 1.1 ad if ((flag & FWRITE) == 0)
429 1.1 ad return (EBADF);
430 1.1 ad
431 1.48 ad mutex_enter(&sc->sc_dk.dk_openlock);
432 1.1 ad sc->sc_flags |= LDF_LABELLING;
433 1.1 ad
434 1.1 ad error = setdisklabel(sc->sc_dk.dk_label,
435 1.4 fvdl lp, /*sc->sc_dk.dk_openmask : */0,
436 1.1 ad sc->sc_dk.dk_cpulabel);
437 1.4 fvdl if (error == 0 && (cmd == DIOCWDINFO
438 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
439 1.4 fvdl || cmd == ODIOCWDINFO
440 1.4 fvdl #endif
441 1.4 fvdl ))
442 1.1 ad error = writedisklabel(
443 1.35 perry MAKEDISKDEV(major(dev), DISKUNIT(dev), RAW_PART),
444 1.35 perry ldstrategy, sc->sc_dk.dk_label,
445 1.1 ad sc->sc_dk.dk_cpulabel);
446 1.1 ad
447 1.1 ad sc->sc_flags &= ~LDF_LABELLING;
448 1.48 ad mutex_exit(&sc->sc_dk.dk_openlock);
449 1.1 ad break;
450 1.1 ad
451 1.22 thorpej case DIOCKLABEL:
452 1.22 thorpej if ((flag & FWRITE) == 0)
453 1.22 thorpej return (EBADF);
454 1.22 thorpej if (*(int *)addr)
455 1.22 thorpej sc->sc_flags |= LDF_KLABEL;
456 1.22 thorpej else
457 1.22 thorpej sc->sc_flags &= ~LDF_KLABEL;
458 1.22 thorpej break;
459 1.22 thorpej
460 1.1 ad case DIOCWLABEL:
461 1.1 ad if ((flag & FWRITE) == 0)
462 1.1 ad return (EBADF);
463 1.1 ad if (*(int *)addr)
464 1.1 ad sc->sc_flags |= LDF_WLABEL;
465 1.1 ad else
466 1.1 ad sc->sc_flags &= ~LDF_WLABEL;
467 1.1 ad break;
468 1.1 ad
469 1.1 ad case DIOCGDEFLABEL:
470 1.1 ad ldgetdefaultlabel(sc, (struct disklabel *)addr);
471 1.1 ad break;
472 1.4 fvdl
473 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
474 1.4 fvdl case ODIOCGDEFLABEL:
475 1.4 fvdl ldgetdefaultlabel(sc, &newlabel);
476 1.4 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
477 1.5 fvdl return ENOTTY;
478 1.4 fvdl memcpy(addr, &newlabel, sizeof (struct olddisklabel));
479 1.4 fvdl break;
480 1.4 fvdl #endif
481 1.1 ad
482 1.32 thorpej case DIOCCACHESYNC:
483 1.32 thorpej /*
484 1.32 thorpej * XXX Do we really need to care about having a writable
485 1.32 thorpej * file descriptor here?
486 1.32 thorpej */
487 1.32 thorpej if ((flag & FWRITE) == 0)
488 1.32 thorpej error = EBADF;
489 1.32 thorpej else if (sc->sc_flush)
490 1.62 simonb error = (*sc->sc_flush)(sc, 0);
491 1.32 thorpej else
492 1.32 thorpej error = 0; /* XXX Error out instead? */
493 1.32 thorpej break;
494 1.32 thorpej
495 1.30 thorpej case DIOCAWEDGE:
496 1.30 thorpej {
497 1.30 thorpej struct dkwedge_info *dkw = (void *) addr;
498 1.30 thorpej
499 1.30 thorpej if ((flag & FWRITE) == 0)
500 1.30 thorpej return (EBADF);
501 1.30 thorpej
502 1.30 thorpej /* If the ioctl happens here, the parent is us. */
503 1.57 cegger strlcpy(dkw->dkw_parent, device_xname(&sc->sc_dv),
504 1.57 cegger sizeof(dkw->dkw_parent));
505 1.30 thorpej return (dkwedge_add(dkw));
506 1.30 thorpej }
507 1.35 perry
508 1.30 thorpej case DIOCDWEDGE:
509 1.30 thorpej {
510 1.30 thorpej struct dkwedge_info *dkw = (void *) addr;
511 1.30 thorpej
512 1.30 thorpej if ((flag & FWRITE) == 0)
513 1.30 thorpej return (EBADF);
514 1.30 thorpej
515 1.30 thorpej /* If the ioctl happens here, the parent is us. */
516 1.57 cegger strlcpy(dkw->dkw_parent, device_xname(&sc->sc_dv),
517 1.57 cegger sizeof(dkw->dkw_parent));
518 1.30 thorpej return (dkwedge_del(dkw));
519 1.30 thorpej }
520 1.35 perry
521 1.30 thorpej case DIOCLWEDGES:
522 1.30 thorpej {
523 1.30 thorpej struct dkwedge_list *dkwl = (void *) addr;
524 1.30 thorpej
525 1.39 christos return (dkwedge_list(&sc->sc_dk, dkwl, l));
526 1.30 thorpej }
527 1.51 xtraeme case DIOCGSTRATEGY:
528 1.51 xtraeme {
529 1.51 xtraeme struct disk_strategy *dks = (void *)addr;
530 1.51 xtraeme
531 1.52 xtraeme mutex_enter(&sc->sc_mutex);
532 1.51 xtraeme strlcpy(dks->dks_name, bufq_getstrategyname(sc->sc_bufq),
533 1.51 xtraeme sizeof(dks->dks_name));
534 1.52 xtraeme mutex_exit(&sc->sc_mutex);
535 1.51 xtraeme dks->dks_paramlen = 0;
536 1.51 xtraeme
537 1.51 xtraeme return 0;
538 1.51 xtraeme }
539 1.51 xtraeme case DIOCSSTRATEGY:
540 1.51 xtraeme {
541 1.51 xtraeme struct disk_strategy *dks = (void *)addr;
542 1.51 xtraeme struct bufq_state *new, *old;
543 1.30 thorpej
544 1.51 xtraeme if ((flag & FWRITE) == 0)
545 1.51 xtraeme return EPERM;
546 1.51 xtraeme
547 1.51 xtraeme if (dks->dks_param != NULL)
548 1.51 xtraeme return EINVAL;
549 1.51 xtraeme
550 1.51 xtraeme dks->dks_name[sizeof(dks->dks_name) - 1] = 0; /* ensure term */
551 1.51 xtraeme error = bufq_alloc(&new, dks->dks_name,
552 1.51 xtraeme BUFQ_EXACT|BUFQ_SORT_RAWBLOCK);
553 1.51 xtraeme if (error)
554 1.51 xtraeme return error;
555 1.51 xtraeme
556 1.52 xtraeme mutex_enter(&sc->sc_mutex);
557 1.51 xtraeme old = sc->sc_bufq;
558 1.51 xtraeme bufq_move(new, old);
559 1.51 xtraeme sc->sc_bufq = new;
560 1.52 xtraeme mutex_exit(&sc->sc_mutex);
561 1.51 xtraeme bufq_free(old);
562 1.51 xtraeme
563 1.51 xtraeme return 0;
564 1.51 xtraeme }
565 1.1 ad default:
566 1.1 ad error = ENOTTY;
567 1.1 ad break;
568 1.1 ad }
569 1.1 ad
570 1.1 ad return (error);
571 1.1 ad }
572 1.1 ad
573 1.29 thorpej static void
574 1.1 ad ldstrategy(struct buf *bp)
575 1.1 ad {
576 1.1 ad struct ld_softc *sc;
577 1.23 thorpej struct disklabel *lp;
578 1.23 thorpej daddr_t blkno;
579 1.23 thorpej int s, part;
580 1.1 ad
581 1.59 tsutsui sc = device_lookup_private(&ld_cd, DISKUNIT(bp->b_dev));
582 1.23 thorpej part = DISKPART(bp->b_dev);
583 1.1 ad
584 1.7 ad if ((sc->sc_flags & LDF_DETACH) != 0) {
585 1.2 ad bp->b_error = EIO;
586 1.49 ad goto done;
587 1.2 ad }
588 1.2 ad
589 1.1 ad lp = sc->sc_dk.dk_label;
590 1.1 ad
591 1.1 ad /*
592 1.1 ad * The transfer must be a whole number of blocks and the offset must
593 1.1 ad * not be negative.
594 1.1 ad */
595 1.1 ad if ((bp->b_bcount % lp->d_secsize) != 0 || bp->b_blkno < 0) {
596 1.23 thorpej bp->b_error = EINVAL;
597 1.49 ad goto done;
598 1.1 ad }
599 1.1 ad
600 1.23 thorpej /* If it's a null transfer, return immediately. */
601 1.23 thorpej if (bp->b_bcount == 0)
602 1.23 thorpej goto done;
603 1.1 ad
604 1.1 ad /*
605 1.1 ad * Do bounds checking and adjust the transfer. If error, process.
606 1.1 ad * If past the end of partition, just return.
607 1.1 ad */
608 1.1 ad if (part != RAW_PART &&
609 1.20 thorpej bounds_check_with_label(&sc->sc_dk, bp,
610 1.1 ad (sc->sc_flags & (LDF_WLABEL | LDF_LABELLING)) != 0) <= 0) {
611 1.23 thorpej goto done;
612 1.1 ad }
613 1.1 ad
614 1.1 ad /*
615 1.23 thorpej * Convert the block number to absolute and put it in terms
616 1.23 thorpej * of the device's logical block size.
617 1.1 ad */
618 1.23 thorpej if (lp->d_secsize == DEV_BSIZE)
619 1.23 thorpej blkno = bp->b_blkno;
620 1.23 thorpej else if (lp->d_secsize > DEV_BSIZE)
621 1.23 thorpej blkno = bp->b_blkno / (lp->d_secsize / DEV_BSIZE);
622 1.1 ad else
623 1.23 thorpej blkno = bp->b_blkno * (DEV_BSIZE / lp->d_secsize);
624 1.1 ad
625 1.11 thorpej if (part != RAW_PART)
626 1.23 thorpej blkno += lp->d_partitions[part].p_offset;
627 1.23 thorpej
628 1.23 thorpej bp->b_rawblkno = blkno;
629 1.1 ad
630 1.1 ad s = splbio();
631 1.44 ad ldstart(sc, bp);
632 1.1 ad splx(s);
633 1.23 thorpej return;
634 1.23 thorpej
635 1.23 thorpej done:
636 1.23 thorpej bp->b_resid = bp->b_bcount;
637 1.23 thorpej biodone(bp);
638 1.23 thorpej }
639 1.23 thorpej
640 1.23 thorpej static void
641 1.44 ad ldstart(struct ld_softc *sc, struct buf *bp)
642 1.23 thorpej {
643 1.23 thorpej int error;
644 1.1 ad
645 1.44 ad mutex_enter(&sc->sc_mutex);
646 1.44 ad
647 1.44 ad if (bp != NULL)
648 1.44 ad BUFQ_PUT(sc->sc_bufq, bp);
649 1.44 ad
650 1.23 thorpej while (sc->sc_queuecnt < sc->sc_maxqueuecnt) {
651 1.23 thorpej /* See if there is work to do. */
652 1.38 yamt if ((bp = BUFQ_PEEK(sc->sc_bufq)) == NULL)
653 1.23 thorpej break;
654 1.23 thorpej
655 1.23 thorpej disk_busy(&sc->sc_dk);
656 1.23 thorpej sc->sc_queuecnt++;
657 1.23 thorpej
658 1.23 thorpej if (__predict_true((error = (*sc->sc_start)(sc, bp)) == 0)) {
659 1.23 thorpej /*
660 1.23 thorpej * The back-end is running the job; remove it from
661 1.23 thorpej * the queue.
662 1.23 thorpej */
663 1.38 yamt (void) BUFQ_GET(sc->sc_bufq);
664 1.23 thorpej } else {
665 1.23 thorpej disk_unbusy(&sc->sc_dk, 0, (bp->b_flags & B_READ));
666 1.23 thorpej sc->sc_queuecnt--;
667 1.23 thorpej if (error == EAGAIN) {
668 1.23 thorpej /*
669 1.23 thorpej * Temporary resource shortage in the
670 1.23 thorpej * back-end; just defer the job until
671 1.23 thorpej * later.
672 1.23 thorpej *
673 1.23 thorpej * XXX We might consider a watchdog timer
674 1.23 thorpej * XXX to make sure we are kicked into action.
675 1.23 thorpej */
676 1.23 thorpej break;
677 1.23 thorpej } else {
678 1.38 yamt (void) BUFQ_GET(sc->sc_bufq);
679 1.23 thorpej bp->b_error = error;
680 1.23 thorpej bp->b_resid = bp->b_bcount;
681 1.44 ad mutex_exit(&sc->sc_mutex);
682 1.23 thorpej biodone(bp);
683 1.44 ad mutex_enter(&sc->sc_mutex);
684 1.23 thorpej }
685 1.23 thorpej }
686 1.1 ad }
687 1.44 ad
688 1.44 ad mutex_exit(&sc->sc_mutex);
689 1.1 ad }
690 1.1 ad
691 1.1 ad void
692 1.1 ad lddone(struct ld_softc *sc, struct buf *bp)
693 1.1 ad {
694 1.1 ad
695 1.49 ad if (bp->b_error != 0) {
696 1.1 ad diskerr(bp, "ld", "error", LOG_PRINTF, 0, sc->sc_dk.dk_label);
697 1.1 ad printf("\n");
698 1.1 ad }
699 1.1 ad
700 1.18 mrg disk_unbusy(&sc->sc_dk, bp->b_bcount - bp->b_resid,
701 1.18 mrg (bp->b_flags & B_READ));
702 1.1 ad #if NRND > 0
703 1.1 ad rnd_add_uint32(&sc->sc_rnd_source, bp->b_rawblkno);
704 1.1 ad #endif
705 1.1 ad biodone(bp);
706 1.1 ad
707 1.44 ad mutex_enter(&sc->sc_mutex);
708 1.7 ad if (--sc->sc_queuecnt <= sc->sc_maxqueuecnt) {
709 1.24 thorpej if ((sc->sc_flags & LDF_DRAIN) != 0) {
710 1.24 thorpej sc->sc_flags &= ~LDF_DRAIN;
711 1.7 ad wakeup(&sc->sc_queuecnt);
712 1.24 thorpej }
713 1.44 ad mutex_exit(&sc->sc_mutex);
714 1.44 ad ldstart(sc, NULL);
715 1.44 ad } else
716 1.44 ad mutex_exit(&sc->sc_mutex);
717 1.1 ad }
718 1.1 ad
719 1.29 thorpej static int
720 1.1 ad ldsize(dev_t dev)
721 1.1 ad {
722 1.1 ad struct ld_softc *sc;
723 1.1 ad int part, unit, omask, size;
724 1.1 ad
725 1.1 ad unit = DISKUNIT(dev);
726 1.59 tsutsui if ((sc = device_lookup_private(&ld_cd, unit)) == NULL)
727 1.1 ad return (ENODEV);
728 1.1 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
729 1.1 ad return (ENODEV);
730 1.1 ad part = DISKPART(dev);
731 1.1 ad
732 1.1 ad omask = sc->sc_dk.dk_openmask & (1 << part);
733 1.1 ad
734 1.1 ad if (omask == 0 && ldopen(dev, 0, S_IFBLK, NULL) != 0)
735 1.1 ad return (-1);
736 1.1 ad else if (sc->sc_dk.dk_label->d_partitions[part].p_fstype != FS_SWAP)
737 1.1 ad size = -1;
738 1.1 ad else
739 1.1 ad size = sc->sc_dk.dk_label->d_partitions[part].p_size *
740 1.1 ad (sc->sc_dk.dk_label->d_secsize / DEV_BSIZE);
741 1.1 ad if (omask == 0 && ldclose(dev, 0, S_IFBLK, NULL) != 0)
742 1.1 ad return (-1);
743 1.1 ad
744 1.1 ad return (size);
745 1.1 ad }
746 1.1 ad
747 1.1 ad /*
748 1.1 ad * Load the label information from the specified device.
749 1.1 ad */
750 1.1 ad static void
751 1.1 ad ldgetdisklabel(struct ld_softc *sc)
752 1.1 ad {
753 1.1 ad const char *errstring;
754 1.1 ad
755 1.1 ad ldgetdefaultlabel(sc, sc->sc_dk.dk_label);
756 1.1 ad
757 1.1 ad /* Call the generic disklabel extraction routine. */
758 1.40 thorpej errstring = readdisklabel(MAKEDISKDEV(0, device_unit(&sc->sc_dv),
759 1.40 thorpej RAW_PART), ldstrategy, sc->sc_dk.dk_label, sc->sc_dk.dk_cpulabel);
760 1.1 ad if (errstring != NULL)
761 1.57 cegger printf("%s: %s\n", device_xname(&sc->sc_dv), errstring);
762 1.22 thorpej
763 1.22 thorpej /* In-core label now valid. */
764 1.22 thorpej sc->sc_flags |= LDF_VLABEL;
765 1.1 ad }
766 1.1 ad
767 1.1 ad /*
768 1.1 ad * Construct a fictitious label.
769 1.1 ad */
770 1.1 ad static void
771 1.1 ad ldgetdefaultlabel(struct ld_softc *sc, struct disklabel *lp)
772 1.1 ad {
773 1.1 ad
774 1.1 ad memset(lp, 0, sizeof(struct disklabel));
775 1.1 ad
776 1.1 ad lp->d_secsize = sc->sc_secsize;
777 1.1 ad lp->d_ntracks = sc->sc_nheads;
778 1.1 ad lp->d_nsectors = sc->sc_nsectors;
779 1.1 ad lp->d_ncylinders = sc->sc_ncylinders;
780 1.1 ad lp->d_secpercyl = lp->d_ntracks * lp->d_nsectors;
781 1.1 ad lp->d_type = DTYPE_LD;
782 1.21 itojun strlcpy(lp->d_typename, "unknown", sizeof(lp->d_typename));
783 1.21 itojun strlcpy(lp->d_packname, "fictitious", sizeof(lp->d_packname));
784 1.1 ad lp->d_secperunit = sc->sc_secperunit;
785 1.1 ad lp->d_rpm = 7200;
786 1.1 ad lp->d_interleave = 1;
787 1.1 ad lp->d_flags = 0;
788 1.1 ad
789 1.1 ad lp->d_partitions[RAW_PART].p_offset = 0;
790 1.1 ad lp->d_partitions[RAW_PART].p_size =
791 1.1 ad lp->d_secperunit * (lp->d_secsize / DEV_BSIZE);
792 1.1 ad lp->d_partitions[RAW_PART].p_fstype = FS_UNUSED;
793 1.1 ad lp->d_npartitions = RAW_PART + 1;
794 1.1 ad
795 1.1 ad lp->d_magic = DISKMAGIC;
796 1.1 ad lp->d_magic2 = DISKMAGIC;
797 1.1 ad lp->d_checksum = dkcksum(lp);
798 1.1 ad }
799 1.1 ad
800 1.1 ad /*
801 1.1 ad * Take a dump.
802 1.1 ad */
803 1.29 thorpej static int
804 1.46 christos lddump(dev_t dev, daddr_t blkno, void *vav, size_t size)
805 1.1 ad {
806 1.46 christos char *va = vav;
807 1.1 ad struct ld_softc *sc;
808 1.1 ad struct disklabel *lp;
809 1.1 ad int unit, part, nsects, sectoff, towrt, nblk, maxblkcnt, rv;
810 1.1 ad static int dumping;
811 1.1 ad
812 1.1 ad unit = DISKUNIT(dev);
813 1.59 tsutsui if ((sc = device_lookup_private(&ld_cd, unit)) == NULL)
814 1.1 ad return (ENXIO);
815 1.1 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
816 1.1 ad return (ENODEV);
817 1.3 ad if (sc->sc_dump == NULL)
818 1.3 ad return (ENXIO);
819 1.3 ad
820 1.3 ad /* Check if recursive dump; if so, punt. */
821 1.3 ad if (dumping)
822 1.3 ad return (EFAULT);
823 1.3 ad dumping = 1;
824 1.1 ad
825 1.1 ad /* Convert to disk sectors. Request must be a multiple of size. */
826 1.3 ad part = DISKPART(dev);
827 1.1 ad lp = sc->sc_dk.dk_label;
828 1.1 ad if ((size % lp->d_secsize) != 0)
829 1.1 ad return (EFAULT);
830 1.1 ad towrt = size / lp->d_secsize;
831 1.1 ad blkno = dbtob(blkno) / lp->d_secsize; /* blkno in DEV_BSIZE units */
832 1.1 ad
833 1.1 ad nsects = lp->d_partitions[part].p_size;
834 1.1 ad sectoff = lp->d_partitions[part].p_offset;
835 1.1 ad
836 1.1 ad /* Check transfer bounds against partition size. */
837 1.1 ad if ((blkno < 0) || ((blkno + towrt) > nsects))
838 1.1 ad return (EINVAL);
839 1.1 ad
840 1.1 ad /* Offset block number to start of partition. */
841 1.1 ad blkno += sectoff;
842 1.1 ad
843 1.1 ad /* Start dumping and return when done. */
844 1.3 ad maxblkcnt = sc->sc_maxxfer / sc->sc_secsize - 1;
845 1.1 ad while (towrt > 0) {
846 1.3 ad nblk = min(maxblkcnt, towrt);
847 1.1 ad
848 1.1 ad if ((rv = (*sc->sc_dump)(sc, va, blkno, nblk)) != 0)
849 1.1 ad return (rv);
850 1.1 ad
851 1.1 ad towrt -= nblk;
852 1.1 ad blkno += nblk;
853 1.1 ad va += nblk * sc->sc_secsize;
854 1.1 ad }
855 1.1 ad
856 1.1 ad dumping = 0;
857 1.1 ad return (0);
858 1.1 ad }
859 1.1 ad
860 1.1 ad /*
861 1.1 ad * Adjust the size of a transfer.
862 1.1 ad */
863 1.1 ad static void
864 1.1 ad ldminphys(struct buf *bp)
865 1.1 ad {
866 1.1 ad struct ld_softc *sc;
867 1.1 ad
868 1.59 tsutsui sc = device_lookup_private(&ld_cd, DISKUNIT(bp->b_dev));
869 1.1 ad
870 1.1 ad if (bp->b_bcount > sc->sc_maxxfer)
871 1.1 ad bp->b_bcount = sc->sc_maxxfer;
872 1.1 ad minphys(bp);
873 1.1 ad }
874 1.43 riz
875 1.43 riz static void
876 1.43 riz ld_set_properties(struct ld_softc *ld)
877 1.43 riz {
878 1.43 riz prop_dictionary_t disk_info, odisk_info, geom;
879 1.43 riz
880 1.43 riz disk_info = prop_dictionary_create();
881 1.43 riz
882 1.43 riz geom = prop_dictionary_create();
883 1.43 riz
884 1.43 riz prop_dictionary_set_uint64(geom, "sectors-per-unit",
885 1.43 riz ld->sc_secperunit);
886 1.43 riz
887 1.43 riz prop_dictionary_set_uint32(geom, "sector-size",
888 1.43 riz ld->sc_secsize);
889 1.43 riz
890 1.43 riz prop_dictionary_set_uint16(geom, "sectors-per-track",
891 1.43 riz ld->sc_nsectors);
892 1.43 riz
893 1.43 riz prop_dictionary_set_uint16(geom, "tracks-per-cylinder",
894 1.43 riz ld->sc_nheads);
895 1.43 riz
896 1.43 riz prop_dictionary_set_uint64(geom, "cylinders-per-unit",
897 1.43 riz ld->sc_ncylinders);
898 1.43 riz
899 1.43 riz prop_dictionary_set(disk_info, "geometry", geom);
900 1.43 riz prop_object_release(geom);
901 1.43 riz
902 1.43 riz prop_dictionary_set(device_properties(&ld->sc_dv),
903 1.43 riz "disk-info", disk_info);
904 1.43 riz
905 1.43 riz /*
906 1.43 riz * Don't release disk_info here; we keep a reference to it.
907 1.43 riz * disk_detach() will release it when we go away.
908 1.43 riz */
909 1.43 riz
910 1.43 riz odisk_info = ld->sc_dk.dk_info;
911 1.43 riz ld->sc_dk.dk_info = disk_info;
912 1.43 riz if (odisk_info)
913 1.43 riz prop_object_release(odisk_info);
914 1.43 riz }
915 1.45 riz
916 1.45 riz static void
917 1.45 riz ld_config_interrupts (struct device *d)
918 1.45 riz {
919 1.60 cube struct ld_softc *sc = device_private(d);
920 1.45 riz dkwedge_discover(&sc->sc_dk);
921 1.45 riz }
922