ld.c revision 1.57 1 1.57 cegger /* $NetBSD: ld.c,v 1.57 2008/04/09 05:47:19 cegger Exp $ */
2 1.1 ad
3 1.1 ad /*-
4 1.1 ad * Copyright (c) 1998, 2000 The NetBSD Foundation, Inc.
5 1.1 ad * All rights reserved.
6 1.1 ad *
7 1.1 ad * This code is derived from software contributed to The NetBSD Foundation
8 1.1 ad * by Andrew Doran and Charles M. Hannum.
9 1.1 ad *
10 1.1 ad * Redistribution and use in source and binary forms, with or without
11 1.1 ad * modification, are permitted provided that the following conditions
12 1.1 ad * are met:
13 1.1 ad * 1. Redistributions of source code must retain the above copyright
14 1.1 ad * notice, this list of conditions and the following disclaimer.
15 1.1 ad * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 ad * notice, this list of conditions and the following disclaimer in the
17 1.1 ad * documentation and/or other materials provided with the distribution.
18 1.1 ad * 3. All advertising materials mentioning features or use of this software
19 1.1 ad * must display the following acknowledgement:
20 1.1 ad * This product includes software developed by the NetBSD
21 1.1 ad * Foundation, Inc. and its contributors.
22 1.1 ad * 4. Neither the name of The NetBSD Foundation nor the names of its
23 1.1 ad * contributors may be used to endorse or promote products derived
24 1.1 ad * from this software without specific prior written permission.
25 1.1 ad *
26 1.1 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
27 1.1 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
28 1.1 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
29 1.1 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
30 1.1 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
31 1.1 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
32 1.1 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
33 1.1 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
34 1.1 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
35 1.1 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
36 1.1 ad * POSSIBILITY OF SUCH DAMAGE.
37 1.1 ad */
38 1.1 ad
39 1.1 ad /*
40 1.1 ad * Disk driver for use by RAID controllers.
41 1.1 ad */
42 1.12 lukem
43 1.12 lukem #include <sys/cdefs.h>
44 1.57 cegger __KERNEL_RCSID(0, "$NetBSD: ld.c,v 1.57 2008/04/09 05:47:19 cegger Exp $");
45 1.1 ad
46 1.1 ad #include "rnd.h"
47 1.1 ad
48 1.1 ad #include <sys/param.h>
49 1.1 ad #include <sys/systm.h>
50 1.1 ad #include <sys/kernel.h>
51 1.1 ad #include <sys/device.h>
52 1.1 ad #include <sys/queue.h>
53 1.1 ad #include <sys/proc.h>
54 1.1 ad #include <sys/buf.h>
55 1.33 yamt #include <sys/bufq.h>
56 1.1 ad #include <sys/endian.h>
57 1.1 ad #include <sys/disklabel.h>
58 1.1 ad #include <sys/disk.h>
59 1.1 ad #include <sys/dkio.h>
60 1.1 ad #include <sys/stat.h>
61 1.1 ad #include <sys/conf.h>
62 1.1 ad #include <sys/fcntl.h>
63 1.2 ad #include <sys/vnode.h>
64 1.1 ad #include <sys/syslog.h>
65 1.44 ad #include <sys/mutex.h>
66 1.1 ad #if NRND > 0
67 1.1 ad #include <sys/rnd.h>
68 1.1 ad #endif
69 1.1 ad
70 1.1 ad #include <dev/ldvar.h>
71 1.1 ad
72 1.43 riz #include <prop/proplib.h>
73 1.43 riz
74 1.1 ad static void ldgetdefaultlabel(struct ld_softc *, struct disklabel *);
75 1.1 ad static void ldgetdisklabel(struct ld_softc *);
76 1.1 ad static void ldminphys(struct buf *bp);
77 1.55 jmcneill static bool ld_shutdown(device_t, int);
78 1.44 ad static void ldstart(struct ld_softc *, struct buf *);
79 1.43 riz static void ld_set_properties(struct ld_softc *);
80 1.45 riz static void ld_config_interrupts (struct device *);
81 1.1 ad
82 1.1 ad extern struct cfdriver ld_cd;
83 1.1 ad
84 1.29 thorpej static dev_type_open(ldopen);
85 1.29 thorpej static dev_type_close(ldclose);
86 1.29 thorpej static dev_type_read(ldread);
87 1.29 thorpej static dev_type_write(ldwrite);
88 1.29 thorpej static dev_type_ioctl(ldioctl);
89 1.29 thorpej static dev_type_strategy(ldstrategy);
90 1.29 thorpej static dev_type_dump(lddump);
91 1.29 thorpej static dev_type_size(ldsize);
92 1.16 gehenna
93 1.16 gehenna const struct bdevsw ld_bdevsw = {
94 1.16 gehenna ldopen, ldclose, ldstrategy, ldioctl, lddump, ldsize, D_DISK
95 1.16 gehenna };
96 1.16 gehenna
97 1.16 gehenna const struct cdevsw ld_cdevsw = {
98 1.16 gehenna ldopen, ldclose, ldread, ldwrite, ldioctl,
99 1.17 jdolecek nostop, notty, nopoll, nommap, nokqfilter, D_DISK
100 1.16 gehenna };
101 1.16 gehenna
102 1.30 thorpej static struct dkdriver lddkdriver = { ldstrategy, ldminphys };
103 1.1 ad
104 1.1 ad void
105 1.1 ad ldattach(struct ld_softc *sc)
106 1.1 ad {
107 1.37 christos char tbuf[9];
108 1.1 ad
109 1.53 ad mutex_init(&sc->sc_mutex, MUTEX_DEFAULT, IPL_VM);
110 1.44 ad
111 1.7 ad if ((sc->sc_flags & LDF_ENABLED) == 0) {
112 1.57 cegger aprint_normal_dev(&sc->sc_dv, "disabled\n");
113 1.7 ad return;
114 1.7 ad }
115 1.7 ad
116 1.1 ad /* Initialise and attach the disk structure. */
117 1.57 cegger disk_init(&sc->sc_dk, device_xname(&sc->sc_dv), &lddkdriver);
118 1.1 ad disk_attach(&sc->sc_dk);
119 1.1 ad
120 1.1 ad if (sc->sc_maxxfer > MAXPHYS)
121 1.1 ad sc->sc_maxxfer = MAXPHYS;
122 1.9 ad
123 1.19 thorpej /* Build synthetic geometry if necessary. */
124 1.19 thorpej if (sc->sc_nheads == 0 || sc->sc_nsectors == 0 ||
125 1.19 thorpej sc->sc_ncylinders == 0) {
126 1.28 dbj uint64_t ncyl;
127 1.28 dbj
128 1.19 thorpej if (sc->sc_secperunit <= 528 * 2048) /* 528MB */
129 1.19 thorpej sc->sc_nheads = 16;
130 1.19 thorpej else if (sc->sc_secperunit <= 1024 * 2048) /* 1GB */
131 1.19 thorpej sc->sc_nheads = 32;
132 1.19 thorpej else if (sc->sc_secperunit <= 21504 * 2048) /* 21GB */
133 1.19 thorpej sc->sc_nheads = 64;
134 1.19 thorpej else if (sc->sc_secperunit <= 43008 * 2048) /* 42GB */
135 1.19 thorpej sc->sc_nheads = 128;
136 1.19 thorpej else
137 1.19 thorpej sc->sc_nheads = 255;
138 1.19 thorpej
139 1.19 thorpej sc->sc_nsectors = 63;
140 1.28 dbj sc->sc_ncylinders = INT_MAX;
141 1.35 perry ncyl = sc->sc_secperunit /
142 1.19 thorpej (sc->sc_nheads * sc->sc_nsectors);
143 1.28 dbj if (ncyl < INT_MAX)
144 1.28 dbj sc->sc_ncylinders = (int)ncyl;
145 1.19 thorpej }
146 1.1 ad
147 1.37 christos format_bytes(tbuf, sizeof(tbuf), sc->sc_secperunit *
148 1.1 ad sc->sc_secsize);
149 1.57 cegger aprint_normal_dev(&sc->sc_dv, "%s, %d cyl, %d head, %d sec, %d bytes/sect x %"PRIu64" sectors\n",
150 1.57 cegger tbuf, sc->sc_ncylinders, sc->sc_nheads,
151 1.1 ad sc->sc_nsectors, sc->sc_secsize, sc->sc_secperunit);
152 1.1 ad
153 1.43 riz ld_set_properties(sc);
154 1.43 riz
155 1.1 ad #if NRND > 0
156 1.1 ad /* Attach the device into the rnd source list. */
157 1.57 cegger rnd_attach_source(&sc->sc_rnd_source, device_xname(&sc->sc_dv),
158 1.1 ad RND_TYPE_DISK, 0);
159 1.1 ad #endif
160 1.1 ad
161 1.55 jmcneill /* Register with PMF */
162 1.55 jmcneill if (!pmf_device_register1(&sc->sc_dv, NULL, NULL, ld_shutdown))
163 1.55 jmcneill aprint_error_dev(&sc->sc_dv,
164 1.55 jmcneill "couldn't establish power handler\n");
165 1.55 jmcneill
166 1.38 yamt bufq_alloc(&sc->sc_bufq, BUFQ_DISK_DEFAULT_STRAT, BUFQ_SORT_RAWBLOCK);
167 1.30 thorpej
168 1.30 thorpej /* Discover wedges on this disk. */
169 1.45 riz config_interrupts(&sc->sc_dv, ld_config_interrupts);
170 1.1 ad }
171 1.1 ad
172 1.3 ad int
173 1.37 christos ldadjqparam(struct ld_softc *sc, int xmax)
174 1.3 ad {
175 1.24 thorpej int s;
176 1.7 ad
177 1.7 ad s = splbio();
178 1.37 christos sc->sc_maxqueuecnt = xmax;
179 1.7 ad splx(s);
180 1.7 ad
181 1.24 thorpej return (0);
182 1.7 ad }
183 1.7 ad
184 1.7 ad int
185 1.7 ad ldbegindetach(struct ld_softc *sc, int flags)
186 1.7 ad {
187 1.24 thorpej int s, rv = 0;
188 1.7 ad
189 1.7 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
190 1.7 ad return (0);
191 1.3 ad
192 1.3 ad if ((flags & DETACH_FORCE) == 0 && sc->sc_dk.dk_openmask != 0)
193 1.3 ad return (EBUSY);
194 1.3 ad
195 1.3 ad s = splbio();
196 1.24 thorpej sc->sc_maxqueuecnt = 0;
197 1.7 ad sc->sc_flags |= LDF_DETACH;
198 1.24 thorpej while (sc->sc_queuecnt > 0) {
199 1.24 thorpej sc->sc_flags |= LDF_DRAIN;
200 1.24 thorpej rv = tsleep(&sc->sc_queuecnt, PRIBIO, "lddrn", 0);
201 1.24 thorpej if (rv)
202 1.24 thorpej break;
203 1.24 thorpej }
204 1.3 ad splx(s);
205 1.7 ad
206 1.7 ad return (rv);
207 1.3 ad }
208 1.3 ad
209 1.2 ad void
210 1.7 ad ldenddetach(struct ld_softc *sc)
211 1.2 ad {
212 1.13 drochner int s, bmaj, cmaj, i, mn;
213 1.2 ad
214 1.7 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
215 1.7 ad return;
216 1.7 ad
217 1.2 ad /* Wait for commands queued with the hardware to complete. */
218 1.2 ad if (sc->sc_queuecnt != 0)
219 1.7 ad if (tsleep(&sc->sc_queuecnt, PRIBIO, "lddtch", 30 * hz))
220 1.57 cegger printf("%s: not drained\n", device_xname(&sc->sc_dv));
221 1.2 ad
222 1.2 ad /* Locate the major numbers. */
223 1.16 gehenna bmaj = bdevsw_lookup_major(&ld_bdevsw);
224 1.16 gehenna cmaj = cdevsw_lookup_major(&ld_cdevsw);
225 1.2 ad
226 1.2 ad /* Kill off any queued buffers. */
227 1.2 ad s = splbio();
228 1.38 yamt bufq_drain(sc->sc_bufq);
229 1.36 yamt splx(s);
230 1.36 yamt
231 1.38 yamt bufq_free(sc->sc_bufq);
232 1.2 ad
233 1.2 ad /* Nuke the vnodes for any open instances. */
234 1.13 drochner for (i = 0; i < MAXPARTITIONS; i++) {
235 1.40 thorpej mn = DISKMINOR(device_unit(&sc->sc_dv), i);
236 1.13 drochner vdevgone(bmaj, mn, mn, VBLK);
237 1.13 drochner vdevgone(cmaj, mn, mn, VCHR);
238 1.13 drochner }
239 1.13 drochner
240 1.30 thorpej /* Delete all of our wedges. */
241 1.30 thorpej dkwedge_delall(&sc->sc_dk);
242 1.30 thorpej
243 1.2 ad /* Detach from the disk list. */
244 1.2 ad disk_detach(&sc->sc_dk);
245 1.50 ad disk_destroy(&sc->sc_dk);
246 1.2 ad
247 1.2 ad #if NRND > 0
248 1.2 ad /* Unhook the entropy source. */
249 1.2 ad rnd_detach_source(&sc->sc_rnd_source);
250 1.2 ad #endif
251 1.2 ad
252 1.56 jmcneill /* Deregister with PMF */
253 1.56 jmcneill pmf_device_deregister(&sc->sc_dv);
254 1.56 jmcneill
255 1.24 thorpej /*
256 1.24 thorpej * XXX We can't really flush the cache here, beceause the
257 1.24 thorpej * XXX device may already be non-existent from the controller's
258 1.24 thorpej * XXX perspective.
259 1.24 thorpej */
260 1.24 thorpej #if 0
261 1.2 ad /* Flush the device's cache. */
262 1.2 ad if (sc->sc_flush != NULL)
263 1.2 ad if ((*sc->sc_flush)(sc) != 0)
264 1.57 cegger aprint_error_dev(&sc->sc_dv, "unable to flush cache\n");
265 1.24 thorpej #endif
266 1.2 ad }
267 1.2 ad
268 1.8 lukem /* ARGSUSED */
269 1.55 jmcneill static bool
270 1.55 jmcneill ld_shutdown(device_t dev, int flags)
271 1.1 ad {
272 1.55 jmcneill struct ld_softc *sc = device_private(dev);
273 1.1 ad
274 1.55 jmcneill if (sc->sc_flush != NULL && (*sc->sc_flush)(sc) != 0) {
275 1.55 jmcneill printf("%s: unable to flush cache\n", device_xname(dev));
276 1.55 jmcneill return false;
277 1.1 ad }
278 1.55 jmcneill
279 1.55 jmcneill return true;
280 1.1 ad }
281 1.1 ad
282 1.8 lukem /* ARGSUSED */
283 1.29 thorpej static int
284 1.42 christos ldopen(dev_t dev, int flags, int fmt, struct lwp *l)
285 1.1 ad {
286 1.1 ad struct ld_softc *sc;
287 1.30 thorpej int error, unit, part;
288 1.1 ad
289 1.1 ad unit = DISKUNIT(dev);
290 1.30 thorpej if ((sc = device_lookup(&ld_cd, unit)) == NULL)
291 1.1 ad return (ENXIO);
292 1.1 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
293 1.1 ad return (ENODEV);
294 1.1 ad part = DISKPART(dev);
295 1.30 thorpej
296 1.48 ad mutex_enter(&sc->sc_dk.dk_openlock);
297 1.1 ad
298 1.22 thorpej if (sc->sc_dk.dk_openmask == 0) {
299 1.22 thorpej /* Load the partition info if not already loaded. */
300 1.22 thorpej if ((sc->sc_flags & LDF_VLABEL) == 0)
301 1.22 thorpej ldgetdisklabel(sc);
302 1.22 thorpej }
303 1.1 ad
304 1.1 ad /* Check that the partition exists. */
305 1.1 ad if (part != RAW_PART && (part >= sc->sc_dk.dk_label->d_npartitions ||
306 1.1 ad sc->sc_dk.dk_label->d_partitions[part].p_fstype == FS_UNUSED)) {
307 1.30 thorpej error = ENXIO;
308 1.30 thorpej goto bad1;
309 1.1 ad }
310 1.1 ad
311 1.1 ad /* Ensure only one open at a time. */
312 1.1 ad switch (fmt) {
313 1.1 ad case S_IFCHR:
314 1.1 ad sc->sc_dk.dk_copenmask |= (1 << part);
315 1.1 ad break;
316 1.1 ad case S_IFBLK:
317 1.1 ad sc->sc_dk.dk_bopenmask |= (1 << part);
318 1.1 ad break;
319 1.1 ad }
320 1.1 ad sc->sc_dk.dk_openmask =
321 1.1 ad sc->sc_dk.dk_copenmask | sc->sc_dk.dk_bopenmask;
322 1.1 ad
323 1.48 ad error = 0;
324 1.30 thorpej bad1:
325 1.48 ad mutex_exit(&sc->sc_dk.dk_openlock);
326 1.30 thorpej return (error);
327 1.1 ad }
328 1.1 ad
329 1.8 lukem /* ARGSUSED */
330 1.29 thorpej static int
331 1.42 christos ldclose(dev_t dev, int flags, int fmt, struct lwp *l)
332 1.1 ad {
333 1.1 ad struct ld_softc *sc;
334 1.48 ad int part, unit;
335 1.1 ad
336 1.1 ad unit = DISKUNIT(dev);
337 1.1 ad part = DISKPART(dev);
338 1.1 ad sc = device_lookup(&ld_cd, unit);
339 1.30 thorpej
340 1.48 ad mutex_enter(&sc->sc_dk.dk_openlock);
341 1.1 ad
342 1.1 ad switch (fmt) {
343 1.1 ad case S_IFCHR:
344 1.1 ad sc->sc_dk.dk_copenmask &= ~(1 << part);
345 1.1 ad break;
346 1.1 ad case S_IFBLK:
347 1.1 ad sc->sc_dk.dk_bopenmask &= ~(1 << part);
348 1.1 ad break;
349 1.1 ad }
350 1.1 ad sc->sc_dk.dk_openmask =
351 1.1 ad sc->sc_dk.dk_copenmask | sc->sc_dk.dk_bopenmask;
352 1.1 ad
353 1.22 thorpej if (sc->sc_dk.dk_openmask == 0) {
354 1.22 thorpej if (sc->sc_flush != NULL && (*sc->sc_flush)(sc) != 0)
355 1.57 cegger aprint_error_dev(&sc->sc_dv, "unable to flush cache\n");
356 1.22 thorpej if ((sc->sc_flags & LDF_KLABEL) == 0)
357 1.22 thorpej sc->sc_flags &= ~LDF_VLABEL;
358 1.22 thorpej }
359 1.1 ad
360 1.48 ad mutex_exit(&sc->sc_dk.dk_openlock);
361 1.1 ad return (0);
362 1.1 ad }
363 1.1 ad
364 1.8 lukem /* ARGSUSED */
365 1.29 thorpej static int
366 1.42 christos ldread(dev_t dev, struct uio *uio, int ioflag)
367 1.1 ad {
368 1.1 ad
369 1.1 ad return (physio(ldstrategy, NULL, dev, B_READ, ldminphys, uio));
370 1.1 ad }
371 1.1 ad
372 1.8 lukem /* ARGSUSED */
373 1.29 thorpej static int
374 1.42 christos ldwrite(dev_t dev, struct uio *uio, int ioflag)
375 1.1 ad {
376 1.1 ad
377 1.1 ad return (physio(ldstrategy, NULL, dev, B_WRITE, ldminphys, uio));
378 1.1 ad }
379 1.1 ad
380 1.8 lukem /* ARGSUSED */
381 1.29 thorpej static int
382 1.46 christos ldioctl(dev_t dev, u_long cmd, void *addr, int32_t flag, struct lwp *l)
383 1.1 ad {
384 1.1 ad struct ld_softc *sc;
385 1.52 xtraeme int part, unit, error;
386 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
387 1.6 itojun struct disklabel newlabel;
388 1.4 fvdl #endif
389 1.6 itojun struct disklabel *lp;
390 1.1 ad
391 1.1 ad unit = DISKUNIT(dev);
392 1.1 ad part = DISKPART(dev);
393 1.1 ad sc = device_lookup(&ld_cd, unit);
394 1.1 ad
395 1.43 riz error = disk_ioctl(&sc->sc_dk, cmd, addr, flag, l);
396 1.43 riz if (error != EPASSTHROUGH)
397 1.43 riz return (error);
398 1.43 riz
399 1.47 tron error = 0;
400 1.1 ad switch (cmd) {
401 1.1 ad case DIOCGDINFO:
402 1.1 ad memcpy(addr, sc->sc_dk.dk_label, sizeof(struct disklabel));
403 1.1 ad return (0);
404 1.1 ad
405 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
406 1.4 fvdl case ODIOCGDINFO:
407 1.4 fvdl newlabel = *(sc->sc_dk.dk_label);
408 1.4 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
409 1.5 fvdl return ENOTTY;
410 1.4 fvdl memcpy(addr, &newlabel, sizeof(struct olddisklabel));
411 1.4 fvdl return (0);
412 1.4 fvdl #endif
413 1.4 fvdl
414 1.1 ad case DIOCGPART:
415 1.1 ad ((struct partinfo *)addr)->disklab = sc->sc_dk.dk_label;
416 1.1 ad ((struct partinfo *)addr)->part =
417 1.1 ad &sc->sc_dk.dk_label->d_partitions[part];
418 1.1 ad break;
419 1.1 ad
420 1.1 ad case DIOCWDINFO:
421 1.1 ad case DIOCSDINFO:
422 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
423 1.4 fvdl case ODIOCWDINFO:
424 1.4 fvdl case ODIOCSDINFO:
425 1.4 fvdl
426 1.4 fvdl if (cmd == ODIOCSDINFO || cmd == ODIOCWDINFO) {
427 1.4 fvdl memset(&newlabel, 0, sizeof newlabel);
428 1.4 fvdl memcpy(&newlabel, addr, sizeof (struct olddisklabel));
429 1.4 fvdl lp = &newlabel;
430 1.4 fvdl } else
431 1.4 fvdl #endif
432 1.4 fvdl lp = (struct disklabel *)addr;
433 1.4 fvdl
434 1.1 ad if ((flag & FWRITE) == 0)
435 1.1 ad return (EBADF);
436 1.1 ad
437 1.48 ad mutex_enter(&sc->sc_dk.dk_openlock);
438 1.1 ad sc->sc_flags |= LDF_LABELLING;
439 1.1 ad
440 1.1 ad error = setdisklabel(sc->sc_dk.dk_label,
441 1.4 fvdl lp, /*sc->sc_dk.dk_openmask : */0,
442 1.1 ad sc->sc_dk.dk_cpulabel);
443 1.4 fvdl if (error == 0 && (cmd == DIOCWDINFO
444 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
445 1.4 fvdl || cmd == ODIOCWDINFO
446 1.4 fvdl #endif
447 1.4 fvdl ))
448 1.1 ad error = writedisklabel(
449 1.35 perry MAKEDISKDEV(major(dev), DISKUNIT(dev), RAW_PART),
450 1.35 perry ldstrategy, sc->sc_dk.dk_label,
451 1.1 ad sc->sc_dk.dk_cpulabel);
452 1.1 ad
453 1.1 ad sc->sc_flags &= ~LDF_LABELLING;
454 1.48 ad mutex_exit(&sc->sc_dk.dk_openlock);
455 1.1 ad break;
456 1.1 ad
457 1.22 thorpej case DIOCKLABEL:
458 1.22 thorpej if ((flag & FWRITE) == 0)
459 1.22 thorpej return (EBADF);
460 1.22 thorpej if (*(int *)addr)
461 1.22 thorpej sc->sc_flags |= LDF_KLABEL;
462 1.22 thorpej else
463 1.22 thorpej sc->sc_flags &= ~LDF_KLABEL;
464 1.22 thorpej break;
465 1.22 thorpej
466 1.1 ad case DIOCWLABEL:
467 1.1 ad if ((flag & FWRITE) == 0)
468 1.1 ad return (EBADF);
469 1.1 ad if (*(int *)addr)
470 1.1 ad sc->sc_flags |= LDF_WLABEL;
471 1.1 ad else
472 1.1 ad sc->sc_flags &= ~LDF_WLABEL;
473 1.1 ad break;
474 1.1 ad
475 1.1 ad case DIOCGDEFLABEL:
476 1.1 ad ldgetdefaultlabel(sc, (struct disklabel *)addr);
477 1.1 ad break;
478 1.4 fvdl
479 1.4 fvdl #ifdef __HAVE_OLD_DISKLABEL
480 1.4 fvdl case ODIOCGDEFLABEL:
481 1.4 fvdl ldgetdefaultlabel(sc, &newlabel);
482 1.4 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
483 1.5 fvdl return ENOTTY;
484 1.4 fvdl memcpy(addr, &newlabel, sizeof (struct olddisklabel));
485 1.4 fvdl break;
486 1.4 fvdl #endif
487 1.1 ad
488 1.32 thorpej case DIOCCACHESYNC:
489 1.32 thorpej /*
490 1.32 thorpej * XXX Do we really need to care about having a writable
491 1.32 thorpej * file descriptor here?
492 1.32 thorpej */
493 1.32 thorpej if ((flag & FWRITE) == 0)
494 1.32 thorpej error = EBADF;
495 1.32 thorpej else if (sc->sc_flush)
496 1.32 thorpej error = (*sc->sc_flush)(sc);
497 1.32 thorpej else
498 1.32 thorpej error = 0; /* XXX Error out instead? */
499 1.32 thorpej break;
500 1.32 thorpej
501 1.30 thorpej case DIOCAWEDGE:
502 1.30 thorpej {
503 1.30 thorpej struct dkwedge_info *dkw = (void *) addr;
504 1.30 thorpej
505 1.30 thorpej if ((flag & FWRITE) == 0)
506 1.30 thorpej return (EBADF);
507 1.30 thorpej
508 1.30 thorpej /* If the ioctl happens here, the parent is us. */
509 1.57 cegger strlcpy(dkw->dkw_parent, device_xname(&sc->sc_dv),
510 1.57 cegger sizeof(dkw->dkw_parent));
511 1.30 thorpej return (dkwedge_add(dkw));
512 1.30 thorpej }
513 1.35 perry
514 1.30 thorpej case DIOCDWEDGE:
515 1.30 thorpej {
516 1.30 thorpej struct dkwedge_info *dkw = (void *) addr;
517 1.30 thorpej
518 1.30 thorpej if ((flag & FWRITE) == 0)
519 1.30 thorpej return (EBADF);
520 1.30 thorpej
521 1.30 thorpej /* If the ioctl happens here, the parent is us. */
522 1.57 cegger strlcpy(dkw->dkw_parent, device_xname(&sc->sc_dv),
523 1.57 cegger sizeof(dkw->dkw_parent));
524 1.30 thorpej return (dkwedge_del(dkw));
525 1.30 thorpej }
526 1.35 perry
527 1.30 thorpej case DIOCLWEDGES:
528 1.30 thorpej {
529 1.30 thorpej struct dkwedge_list *dkwl = (void *) addr;
530 1.30 thorpej
531 1.39 christos return (dkwedge_list(&sc->sc_dk, dkwl, l));
532 1.30 thorpej }
533 1.51 xtraeme case DIOCGSTRATEGY:
534 1.51 xtraeme {
535 1.51 xtraeme struct disk_strategy *dks = (void *)addr;
536 1.51 xtraeme
537 1.52 xtraeme mutex_enter(&sc->sc_mutex);
538 1.51 xtraeme strlcpy(dks->dks_name, bufq_getstrategyname(sc->sc_bufq),
539 1.51 xtraeme sizeof(dks->dks_name));
540 1.52 xtraeme mutex_exit(&sc->sc_mutex);
541 1.51 xtraeme dks->dks_paramlen = 0;
542 1.51 xtraeme
543 1.51 xtraeme return 0;
544 1.51 xtraeme }
545 1.51 xtraeme case DIOCSSTRATEGY:
546 1.51 xtraeme {
547 1.51 xtraeme struct disk_strategy *dks = (void *)addr;
548 1.51 xtraeme struct bufq_state *new, *old;
549 1.30 thorpej
550 1.51 xtraeme if ((flag & FWRITE) == 0)
551 1.51 xtraeme return EPERM;
552 1.51 xtraeme
553 1.51 xtraeme if (dks->dks_param != NULL)
554 1.51 xtraeme return EINVAL;
555 1.51 xtraeme
556 1.51 xtraeme dks->dks_name[sizeof(dks->dks_name) - 1] = 0; /* ensure term */
557 1.51 xtraeme error = bufq_alloc(&new, dks->dks_name,
558 1.51 xtraeme BUFQ_EXACT|BUFQ_SORT_RAWBLOCK);
559 1.51 xtraeme if (error)
560 1.51 xtraeme return error;
561 1.51 xtraeme
562 1.52 xtraeme mutex_enter(&sc->sc_mutex);
563 1.51 xtraeme old = sc->sc_bufq;
564 1.51 xtraeme bufq_move(new, old);
565 1.51 xtraeme sc->sc_bufq = new;
566 1.52 xtraeme mutex_exit(&sc->sc_mutex);
567 1.51 xtraeme bufq_free(old);
568 1.51 xtraeme
569 1.51 xtraeme return 0;
570 1.51 xtraeme }
571 1.1 ad default:
572 1.1 ad error = ENOTTY;
573 1.1 ad break;
574 1.1 ad }
575 1.1 ad
576 1.1 ad return (error);
577 1.1 ad }
578 1.1 ad
579 1.29 thorpej static void
580 1.1 ad ldstrategy(struct buf *bp)
581 1.1 ad {
582 1.1 ad struct ld_softc *sc;
583 1.23 thorpej struct disklabel *lp;
584 1.23 thorpej daddr_t blkno;
585 1.23 thorpej int s, part;
586 1.1 ad
587 1.1 ad sc = device_lookup(&ld_cd, DISKUNIT(bp->b_dev));
588 1.23 thorpej part = DISKPART(bp->b_dev);
589 1.1 ad
590 1.7 ad if ((sc->sc_flags & LDF_DETACH) != 0) {
591 1.2 ad bp->b_error = EIO;
592 1.49 ad goto done;
593 1.2 ad }
594 1.2 ad
595 1.1 ad lp = sc->sc_dk.dk_label;
596 1.1 ad
597 1.1 ad /*
598 1.1 ad * The transfer must be a whole number of blocks and the offset must
599 1.1 ad * not be negative.
600 1.1 ad */
601 1.1 ad if ((bp->b_bcount % lp->d_secsize) != 0 || bp->b_blkno < 0) {
602 1.23 thorpej bp->b_error = EINVAL;
603 1.49 ad goto done;
604 1.1 ad }
605 1.1 ad
606 1.23 thorpej /* If it's a null transfer, return immediately. */
607 1.23 thorpej if (bp->b_bcount == 0)
608 1.23 thorpej goto done;
609 1.1 ad
610 1.1 ad /*
611 1.1 ad * Do bounds checking and adjust the transfer. If error, process.
612 1.1 ad * If past the end of partition, just return.
613 1.1 ad */
614 1.1 ad if (part != RAW_PART &&
615 1.20 thorpej bounds_check_with_label(&sc->sc_dk, bp,
616 1.1 ad (sc->sc_flags & (LDF_WLABEL | LDF_LABELLING)) != 0) <= 0) {
617 1.23 thorpej goto done;
618 1.1 ad }
619 1.1 ad
620 1.1 ad /*
621 1.23 thorpej * Convert the block number to absolute and put it in terms
622 1.23 thorpej * of the device's logical block size.
623 1.1 ad */
624 1.23 thorpej if (lp->d_secsize == DEV_BSIZE)
625 1.23 thorpej blkno = bp->b_blkno;
626 1.23 thorpej else if (lp->d_secsize > DEV_BSIZE)
627 1.23 thorpej blkno = bp->b_blkno / (lp->d_secsize / DEV_BSIZE);
628 1.1 ad else
629 1.23 thorpej blkno = bp->b_blkno * (DEV_BSIZE / lp->d_secsize);
630 1.1 ad
631 1.11 thorpej if (part != RAW_PART)
632 1.23 thorpej blkno += lp->d_partitions[part].p_offset;
633 1.23 thorpej
634 1.23 thorpej bp->b_rawblkno = blkno;
635 1.1 ad
636 1.1 ad s = splbio();
637 1.44 ad ldstart(sc, bp);
638 1.1 ad splx(s);
639 1.23 thorpej return;
640 1.23 thorpej
641 1.23 thorpej done:
642 1.23 thorpej bp->b_resid = bp->b_bcount;
643 1.23 thorpej biodone(bp);
644 1.23 thorpej }
645 1.23 thorpej
646 1.23 thorpej static void
647 1.44 ad ldstart(struct ld_softc *sc, struct buf *bp)
648 1.23 thorpej {
649 1.23 thorpej int error;
650 1.1 ad
651 1.44 ad mutex_enter(&sc->sc_mutex);
652 1.44 ad
653 1.44 ad if (bp != NULL)
654 1.44 ad BUFQ_PUT(sc->sc_bufq, bp);
655 1.44 ad
656 1.23 thorpej while (sc->sc_queuecnt < sc->sc_maxqueuecnt) {
657 1.23 thorpej /* See if there is work to do. */
658 1.38 yamt if ((bp = BUFQ_PEEK(sc->sc_bufq)) == NULL)
659 1.23 thorpej break;
660 1.23 thorpej
661 1.23 thorpej disk_busy(&sc->sc_dk);
662 1.23 thorpej sc->sc_queuecnt++;
663 1.23 thorpej
664 1.23 thorpej if (__predict_true((error = (*sc->sc_start)(sc, bp)) == 0)) {
665 1.23 thorpej /*
666 1.23 thorpej * The back-end is running the job; remove it from
667 1.23 thorpej * the queue.
668 1.23 thorpej */
669 1.38 yamt (void) BUFQ_GET(sc->sc_bufq);
670 1.23 thorpej } else {
671 1.23 thorpej disk_unbusy(&sc->sc_dk, 0, (bp->b_flags & B_READ));
672 1.23 thorpej sc->sc_queuecnt--;
673 1.23 thorpej if (error == EAGAIN) {
674 1.23 thorpej /*
675 1.23 thorpej * Temporary resource shortage in the
676 1.23 thorpej * back-end; just defer the job until
677 1.23 thorpej * later.
678 1.23 thorpej *
679 1.23 thorpej * XXX We might consider a watchdog timer
680 1.23 thorpej * XXX to make sure we are kicked into action.
681 1.23 thorpej */
682 1.23 thorpej break;
683 1.23 thorpej } else {
684 1.38 yamt (void) BUFQ_GET(sc->sc_bufq);
685 1.23 thorpej bp->b_error = error;
686 1.23 thorpej bp->b_resid = bp->b_bcount;
687 1.44 ad mutex_exit(&sc->sc_mutex);
688 1.23 thorpej biodone(bp);
689 1.44 ad mutex_enter(&sc->sc_mutex);
690 1.23 thorpej }
691 1.23 thorpej }
692 1.1 ad }
693 1.44 ad
694 1.44 ad mutex_exit(&sc->sc_mutex);
695 1.1 ad }
696 1.1 ad
697 1.1 ad void
698 1.1 ad lddone(struct ld_softc *sc, struct buf *bp)
699 1.1 ad {
700 1.1 ad
701 1.49 ad if (bp->b_error != 0) {
702 1.1 ad diskerr(bp, "ld", "error", LOG_PRINTF, 0, sc->sc_dk.dk_label);
703 1.1 ad printf("\n");
704 1.1 ad }
705 1.1 ad
706 1.18 mrg disk_unbusy(&sc->sc_dk, bp->b_bcount - bp->b_resid,
707 1.18 mrg (bp->b_flags & B_READ));
708 1.1 ad #if NRND > 0
709 1.1 ad rnd_add_uint32(&sc->sc_rnd_source, bp->b_rawblkno);
710 1.1 ad #endif
711 1.1 ad biodone(bp);
712 1.1 ad
713 1.44 ad mutex_enter(&sc->sc_mutex);
714 1.7 ad if (--sc->sc_queuecnt <= sc->sc_maxqueuecnt) {
715 1.24 thorpej if ((sc->sc_flags & LDF_DRAIN) != 0) {
716 1.24 thorpej sc->sc_flags &= ~LDF_DRAIN;
717 1.7 ad wakeup(&sc->sc_queuecnt);
718 1.24 thorpej }
719 1.44 ad mutex_exit(&sc->sc_mutex);
720 1.44 ad ldstart(sc, NULL);
721 1.44 ad } else
722 1.44 ad mutex_exit(&sc->sc_mutex);
723 1.1 ad }
724 1.1 ad
725 1.29 thorpej static int
726 1.1 ad ldsize(dev_t dev)
727 1.1 ad {
728 1.1 ad struct ld_softc *sc;
729 1.1 ad int part, unit, omask, size;
730 1.1 ad
731 1.1 ad unit = DISKUNIT(dev);
732 1.1 ad if ((sc = device_lookup(&ld_cd, unit)) == NULL)
733 1.1 ad return (ENODEV);
734 1.1 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
735 1.1 ad return (ENODEV);
736 1.1 ad part = DISKPART(dev);
737 1.1 ad
738 1.1 ad omask = sc->sc_dk.dk_openmask & (1 << part);
739 1.1 ad
740 1.1 ad if (omask == 0 && ldopen(dev, 0, S_IFBLK, NULL) != 0)
741 1.1 ad return (-1);
742 1.1 ad else if (sc->sc_dk.dk_label->d_partitions[part].p_fstype != FS_SWAP)
743 1.1 ad size = -1;
744 1.1 ad else
745 1.1 ad size = sc->sc_dk.dk_label->d_partitions[part].p_size *
746 1.1 ad (sc->sc_dk.dk_label->d_secsize / DEV_BSIZE);
747 1.1 ad if (omask == 0 && ldclose(dev, 0, S_IFBLK, NULL) != 0)
748 1.1 ad return (-1);
749 1.1 ad
750 1.1 ad return (size);
751 1.1 ad }
752 1.1 ad
753 1.1 ad /*
754 1.1 ad * Load the label information from the specified device.
755 1.1 ad */
756 1.1 ad static void
757 1.1 ad ldgetdisklabel(struct ld_softc *sc)
758 1.1 ad {
759 1.1 ad const char *errstring;
760 1.1 ad
761 1.1 ad ldgetdefaultlabel(sc, sc->sc_dk.dk_label);
762 1.1 ad
763 1.1 ad /* Call the generic disklabel extraction routine. */
764 1.40 thorpej errstring = readdisklabel(MAKEDISKDEV(0, device_unit(&sc->sc_dv),
765 1.40 thorpej RAW_PART), ldstrategy, sc->sc_dk.dk_label, sc->sc_dk.dk_cpulabel);
766 1.1 ad if (errstring != NULL)
767 1.57 cegger printf("%s: %s\n", device_xname(&sc->sc_dv), errstring);
768 1.22 thorpej
769 1.22 thorpej /* In-core label now valid. */
770 1.22 thorpej sc->sc_flags |= LDF_VLABEL;
771 1.1 ad }
772 1.1 ad
773 1.1 ad /*
774 1.1 ad * Construct a ficticious label.
775 1.1 ad */
776 1.1 ad static void
777 1.1 ad ldgetdefaultlabel(struct ld_softc *sc, struct disklabel *lp)
778 1.1 ad {
779 1.1 ad
780 1.1 ad memset(lp, 0, sizeof(struct disklabel));
781 1.1 ad
782 1.1 ad lp->d_secsize = sc->sc_secsize;
783 1.1 ad lp->d_ntracks = sc->sc_nheads;
784 1.1 ad lp->d_nsectors = sc->sc_nsectors;
785 1.1 ad lp->d_ncylinders = sc->sc_ncylinders;
786 1.1 ad lp->d_secpercyl = lp->d_ntracks * lp->d_nsectors;
787 1.1 ad lp->d_type = DTYPE_LD;
788 1.21 itojun strlcpy(lp->d_typename, "unknown", sizeof(lp->d_typename));
789 1.21 itojun strlcpy(lp->d_packname, "fictitious", sizeof(lp->d_packname));
790 1.1 ad lp->d_secperunit = sc->sc_secperunit;
791 1.1 ad lp->d_rpm = 7200;
792 1.1 ad lp->d_interleave = 1;
793 1.1 ad lp->d_flags = 0;
794 1.1 ad
795 1.1 ad lp->d_partitions[RAW_PART].p_offset = 0;
796 1.1 ad lp->d_partitions[RAW_PART].p_size =
797 1.1 ad lp->d_secperunit * (lp->d_secsize / DEV_BSIZE);
798 1.1 ad lp->d_partitions[RAW_PART].p_fstype = FS_UNUSED;
799 1.1 ad lp->d_npartitions = RAW_PART + 1;
800 1.1 ad
801 1.1 ad lp->d_magic = DISKMAGIC;
802 1.1 ad lp->d_magic2 = DISKMAGIC;
803 1.1 ad lp->d_checksum = dkcksum(lp);
804 1.1 ad }
805 1.1 ad
806 1.1 ad /*
807 1.1 ad * Take a dump.
808 1.1 ad */
809 1.29 thorpej static int
810 1.46 christos lddump(dev_t dev, daddr_t blkno, void *vav, size_t size)
811 1.1 ad {
812 1.46 christos char *va = vav;
813 1.1 ad struct ld_softc *sc;
814 1.1 ad struct disklabel *lp;
815 1.1 ad int unit, part, nsects, sectoff, towrt, nblk, maxblkcnt, rv;
816 1.1 ad static int dumping;
817 1.1 ad
818 1.1 ad unit = DISKUNIT(dev);
819 1.1 ad if ((sc = device_lookup(&ld_cd, unit)) == NULL)
820 1.1 ad return (ENXIO);
821 1.1 ad if ((sc->sc_flags & LDF_ENABLED) == 0)
822 1.1 ad return (ENODEV);
823 1.3 ad if (sc->sc_dump == NULL)
824 1.3 ad return (ENXIO);
825 1.3 ad
826 1.3 ad /* Check if recursive dump; if so, punt. */
827 1.3 ad if (dumping)
828 1.3 ad return (EFAULT);
829 1.3 ad dumping = 1;
830 1.1 ad
831 1.1 ad /* Convert to disk sectors. Request must be a multiple of size. */
832 1.3 ad part = DISKPART(dev);
833 1.1 ad lp = sc->sc_dk.dk_label;
834 1.1 ad if ((size % lp->d_secsize) != 0)
835 1.1 ad return (EFAULT);
836 1.1 ad towrt = size / lp->d_secsize;
837 1.1 ad blkno = dbtob(blkno) / lp->d_secsize; /* blkno in DEV_BSIZE units */
838 1.1 ad
839 1.1 ad nsects = lp->d_partitions[part].p_size;
840 1.1 ad sectoff = lp->d_partitions[part].p_offset;
841 1.1 ad
842 1.1 ad /* Check transfer bounds against partition size. */
843 1.1 ad if ((blkno < 0) || ((blkno + towrt) > nsects))
844 1.1 ad return (EINVAL);
845 1.1 ad
846 1.1 ad /* Offset block number to start of partition. */
847 1.1 ad blkno += sectoff;
848 1.1 ad
849 1.1 ad /* Start dumping and return when done. */
850 1.3 ad maxblkcnt = sc->sc_maxxfer / sc->sc_secsize - 1;
851 1.1 ad while (towrt > 0) {
852 1.3 ad nblk = min(maxblkcnt, towrt);
853 1.1 ad
854 1.1 ad if ((rv = (*sc->sc_dump)(sc, va, blkno, nblk)) != 0)
855 1.1 ad return (rv);
856 1.1 ad
857 1.1 ad towrt -= nblk;
858 1.1 ad blkno += nblk;
859 1.1 ad va += nblk * sc->sc_secsize;
860 1.1 ad }
861 1.1 ad
862 1.1 ad dumping = 0;
863 1.1 ad return (0);
864 1.1 ad }
865 1.1 ad
866 1.1 ad /*
867 1.1 ad * Adjust the size of a transfer.
868 1.1 ad */
869 1.1 ad static void
870 1.1 ad ldminphys(struct buf *bp)
871 1.1 ad {
872 1.1 ad struct ld_softc *sc;
873 1.1 ad
874 1.1 ad sc = device_lookup(&ld_cd, DISKUNIT(bp->b_dev));
875 1.1 ad
876 1.1 ad if (bp->b_bcount > sc->sc_maxxfer)
877 1.1 ad bp->b_bcount = sc->sc_maxxfer;
878 1.1 ad minphys(bp);
879 1.1 ad }
880 1.43 riz
881 1.43 riz static void
882 1.43 riz ld_set_properties(struct ld_softc *ld)
883 1.43 riz {
884 1.43 riz prop_dictionary_t disk_info, odisk_info, geom;
885 1.43 riz
886 1.43 riz disk_info = prop_dictionary_create();
887 1.43 riz
888 1.43 riz geom = prop_dictionary_create();
889 1.43 riz
890 1.43 riz prop_dictionary_set_uint64(geom, "sectors-per-unit",
891 1.43 riz ld->sc_secperunit);
892 1.43 riz
893 1.43 riz prop_dictionary_set_uint32(geom, "sector-size",
894 1.43 riz ld->sc_secsize);
895 1.43 riz
896 1.43 riz prop_dictionary_set_uint16(geom, "sectors-per-track",
897 1.43 riz ld->sc_nsectors);
898 1.43 riz
899 1.43 riz prop_dictionary_set_uint16(geom, "tracks-per-cylinder",
900 1.43 riz ld->sc_nheads);
901 1.43 riz
902 1.43 riz prop_dictionary_set_uint64(geom, "cylinders-per-unit",
903 1.43 riz ld->sc_ncylinders);
904 1.43 riz
905 1.43 riz prop_dictionary_set(disk_info, "geometry", geom);
906 1.43 riz prop_object_release(geom);
907 1.43 riz
908 1.43 riz prop_dictionary_set(device_properties(&ld->sc_dv),
909 1.43 riz "disk-info", disk_info);
910 1.43 riz
911 1.43 riz /*
912 1.43 riz * Don't release disk_info here; we keep a reference to it.
913 1.43 riz * disk_detach() will release it when we go away.
914 1.43 riz */
915 1.43 riz
916 1.43 riz odisk_info = ld->sc_dk.dk_info;
917 1.43 riz ld->sc_dk.dk_info = disk_info;
918 1.43 riz if (odisk_info)
919 1.43 riz prop_object_release(odisk_info);
920 1.43 riz }
921 1.45 riz
922 1.45 riz static void
923 1.45 riz ld_config_interrupts (struct device *d)
924 1.45 riz {
925 1.45 riz struct ld_softc *sc = (struct ld_softc *)d;
926 1.45 riz dkwedge_discover(&sc->sc_dk);
927 1.45 riz }
928