dk.c revision 1.117 1 1.117 riastrad /* $NetBSD: dk.c,v 1.117 2022/08/22 00:19:53 riastradh Exp $ */
2 1.1 thorpej
3 1.1 thorpej /*-
4 1.27 ad * Copyright (c) 2004, 2005, 2006, 2007 The NetBSD Foundation, Inc.
5 1.1 thorpej * All rights reserved.
6 1.1 thorpej *
7 1.1 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.1 thorpej * by Jason R. Thorpe.
9 1.1 thorpej *
10 1.1 thorpej * Redistribution and use in source and binary forms, with or without
11 1.1 thorpej * modification, are permitted provided that the following conditions
12 1.1 thorpej * are met:
13 1.1 thorpej * 1. Redistributions of source code must retain the above copyright
14 1.1 thorpej * notice, this list of conditions and the following disclaimer.
15 1.1 thorpej * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 thorpej * notice, this list of conditions and the following disclaimer in the
17 1.1 thorpej * documentation and/or other materials provided with the distribution.
18 1.1 thorpej *
19 1.1 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.1 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.1 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.1 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.1 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.1 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.1 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.1 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.1 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.1 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.1 thorpej * POSSIBILITY OF SUCH DAMAGE.
30 1.1 thorpej */
31 1.1 thorpej
32 1.1 thorpej #include <sys/cdefs.h>
33 1.117 riastrad __KERNEL_RCSID(0, "$NetBSD: dk.c,v 1.117 2022/08/22 00:19:53 riastradh Exp $");
34 1.1 thorpej
35 1.50 pooka #ifdef _KERNEL_OPT
36 1.1 thorpej #include "opt_dkwedge.h"
37 1.50 pooka #endif
38 1.1 thorpej
39 1.1 thorpej #include <sys/param.h>
40 1.1 thorpej #include <sys/systm.h>
41 1.1 thorpej #include <sys/proc.h>
42 1.1 thorpej #include <sys/errno.h>
43 1.1 thorpej #include <sys/pool.h>
44 1.1 thorpej #include <sys/ioctl.h>
45 1.1 thorpej #include <sys/disklabel.h>
46 1.1 thorpej #include <sys/disk.h>
47 1.1 thorpej #include <sys/fcntl.h>
48 1.5 yamt #include <sys/buf.h>
49 1.5 yamt #include <sys/bufq.h>
50 1.1 thorpej #include <sys/vnode.h>
51 1.3 thorpej #include <sys/stat.h>
52 1.1 thorpej #include <sys/conf.h>
53 1.1 thorpej #include <sys/callout.h>
54 1.1 thorpej #include <sys/kernel.h>
55 1.1 thorpej #include <sys/malloc.h>
56 1.2 thorpej #include <sys/device.h>
57 1.15 elad #include <sys/kauth.h>
58 1.1 thorpej
59 1.1 thorpej #include <miscfs/specfs/specdev.h>
60 1.1 thorpej
61 1.1 thorpej MALLOC_DEFINE(M_DKWEDGE, "dkwedge", "Disk wedge structures");
62 1.1 thorpej
/*
 * Lifecycle of a wedge.  dkwedge_add() creates the softc LARVAL and
 * switches it to RUNNING once its disk is attached; dkwedge_detach()
 * marks it DYING and, just before freeing the softc, DEAD.
 */
typedef enum {
	DKW_STATE_LARVAL	= 0,
	DKW_STATE_RUNNING	= 1,
	DKW_STATE_DYING		= 2,
	DKW_STATE_DEAD		= 666
} dkwedge_state_t;
69 1.1 thorpej
70 1.1 thorpej struct dkwedge_softc {
71 1.65 chs device_t sc_dev; /* pointer to our pseudo-device */
72 1.2 thorpej struct cfdata sc_cfdata; /* our cfdata structure */
73 1.1 thorpej uint8_t sc_wname[128]; /* wedge name (Unicode, UTF-8) */
74 1.1 thorpej
75 1.1 thorpej dkwedge_state_t sc_state; /* state this wedge is in */
76 1.1 thorpej
77 1.1 thorpej struct disk *sc_parent; /* parent disk */
78 1.1 thorpej daddr_t sc_offset; /* LBA offset of wedge in parent */
79 1.1 thorpej uint64_t sc_size; /* size of wedge in blocks */
80 1.1 thorpej char sc_ptype[32]; /* partition type */
81 1.1 thorpej dev_t sc_pdev; /* cached parent's dev_t */
82 1.1 thorpej /* link on parent's wedge list */
83 1.1 thorpej LIST_ENTRY(dkwedge_softc) sc_plink;
84 1.1 thorpej
85 1.1 thorpej struct disk sc_dk; /* our own disk structure */
86 1.9 yamt struct bufq_state *sc_bufq; /* buffer queue */
87 1.1 thorpej struct callout sc_restart_ch; /* callout to restart I/O */
88 1.1 thorpej
89 1.92 mlelstv kmutex_t sc_iolock;
90 1.92 mlelstv kcondvar_t sc_dkdrn;
91 1.1 thorpej u_int sc_iopend; /* I/Os pending */
92 1.103 mlelstv int sc_mode; /* parent open mode */
93 1.1 thorpej };
94 1.1 thorpej
95 1.1 thorpej static void dkstart(struct dkwedge_softc *);
96 1.1 thorpej static void dkiodone(struct buf *);
97 1.1 thorpej static void dkrestart(void *);
98 1.52 jakllsch static void dkminphys(struct buf *);
99 1.1 thorpej
100 1.46 dyoung static int dklastclose(struct dkwedge_softc *);
101 1.74 mlelstv static int dkwedge_cleanup_parent(struct dkwedge_softc *, int);
102 1.47 dyoung static int dkwedge_detach(device_t, int);
103 1.74 mlelstv static void dkwedge_delall1(struct disk *, bool);
104 1.74 mlelstv static int dkwedge_del1(struct dkwedge_info *, int);
105 1.87 mlelstv static int dk_open_parent(dev_t, int, struct vnode **);
106 1.82 mlelstv static int dk_close_parent(struct vnode *, int);
107 1.46 dyoung
108 1.1 thorpej static dev_type_open(dkopen);
109 1.1 thorpej static dev_type_close(dkclose);
110 1.1 thorpej static dev_type_read(dkread);
111 1.1 thorpej static dev_type_write(dkwrite);
112 1.1 thorpej static dev_type_ioctl(dkioctl);
113 1.1 thorpej static dev_type_strategy(dkstrategy);
114 1.1 thorpej static dev_type_dump(dkdump);
115 1.1 thorpej static dev_type_size(dksize);
116 1.72 dholland static dev_type_discard(dkdiscard);
117 1.1 thorpej
118 1.1 thorpej const struct bdevsw dk_bdevsw = {
119 1.68 dholland .d_open = dkopen,
120 1.68 dholland .d_close = dkclose,
121 1.68 dholland .d_strategy = dkstrategy,
122 1.68 dholland .d_ioctl = dkioctl,
123 1.68 dholland .d_dump = dkdump,
124 1.68 dholland .d_psize = dksize,
125 1.72 dholland .d_discard = dkdiscard,
126 1.92 mlelstv .d_flag = D_DISK | D_MPSAFE
127 1.1 thorpej };
128 1.1 thorpej
129 1.1 thorpej const struct cdevsw dk_cdevsw = {
130 1.68 dholland .d_open = dkopen,
131 1.68 dholland .d_close = dkclose,
132 1.68 dholland .d_read = dkread,
133 1.68 dholland .d_write = dkwrite,
134 1.68 dholland .d_ioctl = dkioctl,
135 1.68 dholland .d_stop = nostop,
136 1.68 dholland .d_tty = notty,
137 1.68 dholland .d_poll = nopoll,
138 1.68 dholland .d_mmap = nommap,
139 1.68 dholland .d_kqfilter = nokqfilter,
140 1.72 dholland .d_discard = dkdiscard,
141 1.92 mlelstv .d_flag = D_DISK | D_MPSAFE
142 1.1 thorpej };
143 1.1 thorpej
144 1.1 thorpej static struct dkwedge_softc **dkwedges;
145 1.1 thorpej static u_int ndkwedges;
146 1.27 ad static krwlock_t dkwedges_lock;
147 1.1 thorpej
148 1.1 thorpej static LIST_HEAD(, dkwedge_discovery_method) dkwedge_discovery_methods;
149 1.27 ad static krwlock_t dkwedge_discovery_methods_lock;
150 1.1 thorpej
151 1.1 thorpej /*
152 1.2 thorpej * dkwedge_match:
153 1.2 thorpej *
154 1.2 thorpej * Autoconfiguration match function for pseudo-device glue.
155 1.2 thorpej */
156 1.2 thorpej static int
157 1.45 cegger dkwedge_match(device_t parent, cfdata_t match,
158 1.20 christos void *aux)
159 1.2 thorpej {
160 1.2 thorpej
161 1.2 thorpej /* Pseudo-device; always present. */
162 1.2 thorpej return (1);
163 1.2 thorpej }
164 1.2 thorpej
165 1.2 thorpej /*
166 1.2 thorpej * dkwedge_attach:
167 1.2 thorpej *
168 1.2 thorpej * Autoconfiguration attach function for pseudo-device glue.
169 1.2 thorpej */
170 1.2 thorpej static void
171 1.45 cegger dkwedge_attach(device_t parent, device_t self,
172 1.20 christos void *aux)
173 1.2 thorpej {
174 1.2 thorpej
175 1.31 jmcneill if (!pmf_device_register(self, NULL, NULL))
176 1.31 jmcneill aprint_error_dev(self, "couldn't establish power handler\n");
177 1.2 thorpej }
178 1.2 thorpej
179 1.2 thorpej CFDRIVER_DECL(dk, DV_DISK, NULL);
180 1.47 dyoung CFATTACH_DECL3_NEW(dk, 0,
181 1.47 dyoung dkwedge_match, dkwedge_attach, dkwedge_detach, NULL, NULL, NULL,
182 1.47 dyoung DVF_DETACH_SHUTDOWN);
183 1.2 thorpej
184 1.2 thorpej /*
185 1.1 thorpej * dkwedge_wait_drain:
186 1.1 thorpej *
187 1.1 thorpej * Wait for I/O on the wedge to drain.
188 1.1 thorpej */
189 1.1 thorpej static void
190 1.1 thorpej dkwedge_wait_drain(struct dkwedge_softc *sc)
191 1.1 thorpej {
192 1.1 thorpej
193 1.92 mlelstv mutex_enter(&sc->sc_iolock);
194 1.110 riastrad while (sc->sc_iopend != 0)
195 1.92 mlelstv cv_wait(&sc->sc_dkdrn, &sc->sc_iolock);
196 1.92 mlelstv mutex_exit(&sc->sc_iolock);
197 1.1 thorpej }
198 1.1 thorpej
199 1.1 thorpej /*
200 1.1 thorpej * dkwedge_compute_pdev:
201 1.1 thorpej *
202 1.1 thorpej * Compute the parent disk's dev_t.
203 1.1 thorpej */
204 1.1 thorpej static int
205 1.74 mlelstv dkwedge_compute_pdev(const char *pname, dev_t *pdevp, enum vtype type)
206 1.1 thorpej {
207 1.1 thorpej const char *name, *cp;
208 1.63 drochner devmajor_t pmaj;
209 1.63 drochner int punit;
210 1.1 thorpej char devname[16];
211 1.1 thorpej
212 1.1 thorpej name = pname;
213 1.74 mlelstv switch (type) {
214 1.74 mlelstv case VBLK:
215 1.74 mlelstv pmaj = devsw_name2blk(name, devname, sizeof(devname));
216 1.74 mlelstv break;
217 1.74 mlelstv case VCHR:
218 1.74 mlelstv pmaj = devsw_name2chr(name, devname, sizeof(devname));
219 1.74 mlelstv break;
220 1.74 mlelstv default:
221 1.75 mlelstv pmaj = NODEVMAJOR;
222 1.74 mlelstv break;
223 1.74 mlelstv }
224 1.75 mlelstv if (pmaj == NODEVMAJOR)
225 1.1 thorpej return (ENODEV);
226 1.6 perry
227 1.1 thorpej name += strlen(devname);
228 1.1 thorpej for (cp = name, punit = 0; *cp >= '0' && *cp <= '9'; cp++)
229 1.1 thorpej punit = (punit * 10) + (*cp - '0');
230 1.1 thorpej if (cp == name) {
231 1.1 thorpej /* Invalid parent disk name. */
232 1.1 thorpej return (ENODEV);
233 1.1 thorpej }
234 1.1 thorpej
235 1.1 thorpej *pdevp = MAKEDISKDEV(pmaj, punit, RAW_PART);
236 1.1 thorpej
237 1.1 thorpej return (0);
238 1.1 thorpej }
239 1.1 thorpej
240 1.1 thorpej /*
241 1.1 thorpej * dkwedge_array_expand:
242 1.1 thorpej *
243 1.1 thorpej * Expand the dkwedges array.
244 1.1 thorpej */
245 1.1 thorpej static void
246 1.1 thorpej dkwedge_array_expand(void)
247 1.1 thorpej {
248 1.1 thorpej int newcnt = ndkwedges + 16;
249 1.1 thorpej struct dkwedge_softc **newarray, **oldarray;
250 1.1 thorpej
251 1.1 thorpej newarray = malloc(newcnt * sizeof(*newarray), M_DKWEDGE,
252 1.1 thorpej M_WAITOK|M_ZERO);
253 1.1 thorpej if ((oldarray = dkwedges) != NULL)
254 1.1 thorpej memcpy(newarray, dkwedges, ndkwedges * sizeof(*newarray));
255 1.1 thorpej dkwedges = newarray;
256 1.1 thorpej ndkwedges = newcnt;
257 1.1 thorpej if (oldarray != NULL)
258 1.1 thorpej free(oldarray, M_DKWEDGE);
259 1.1 thorpej }
260 1.1 thorpej
261 1.48 haad static void
262 1.77 mlelstv dk_set_geometry(struct dkwedge_softc *sc, struct disk *pdk)
263 1.48 haad {
264 1.77 mlelstv struct disk *dk = &sc->sc_dk;
265 1.77 mlelstv struct disk_geom *dg = &dk->dk_geom;
266 1.48 haad
267 1.66 christos memset(dg, 0, sizeof(*dg));
268 1.48 haad
269 1.86 mlelstv dg->dg_secperunit = sc->sc_size;
270 1.77 mlelstv dg->dg_secsize = DEV_BSIZE << pdk->dk_blkshift;
271 1.76 mlelstv
272 1.76 mlelstv /* fake numbers, 1 cylinder is 1 MB with default sector size */
273 1.66 christos dg->dg_nsectors = 32;
274 1.66 christos dg->dg_ntracks = 64;
275 1.76 mlelstv dg->dg_ncylinders = dg->dg_secperunit / (dg->dg_nsectors * dg->dg_ntracks);
276 1.48 haad
277 1.77 mlelstv disk_set_info(sc->sc_dev, dk, NULL);
278 1.48 haad }
279 1.48 haad
280 1.1 thorpej /*
281 1.1 thorpej * dkwedge_add: [exported function]
282 1.1 thorpej *
283 1.1 thorpej * Add a disk wedge based on the provided information.
284 1.1 thorpej *
285 1.1 thorpej * The incoming dkw_devname[] is ignored, instead being
286 1.1 thorpej * filled in and returned to the caller.
287 1.1 thorpej */
288 1.1 thorpej int
289 1.1 thorpej dkwedge_add(struct dkwedge_info *dkw)
290 1.1 thorpej {
291 1.1 thorpej struct dkwedge_softc *sc, *lsc;
292 1.1 thorpej struct disk *pdk;
293 1.1 thorpej u_int unit;
294 1.1 thorpej int error;
295 1.1 thorpej dev_t pdev;
296 1.1 thorpej
297 1.1 thorpej dkw->dkw_parent[sizeof(dkw->dkw_parent) - 1] = '\0';
298 1.1 thorpej pdk = disk_find(dkw->dkw_parent);
299 1.1 thorpej if (pdk == NULL)
300 1.1 thorpej return (ENODEV);
301 1.1 thorpej
302 1.74 mlelstv error = dkwedge_compute_pdev(pdk->dk_name, &pdev, VBLK);
303 1.1 thorpej if (error)
304 1.1 thorpej return (error);
305 1.1 thorpej
306 1.1 thorpej if (dkw->dkw_offset < 0)
307 1.1 thorpej return (EINVAL);
308 1.1 thorpej
309 1.101 jmcneill /*
310 1.101 jmcneill * Check for an existing wedge at the same disk offset. Allow
311 1.101 jmcneill * updating a wedge if the only change is the size, and the new
312 1.101 jmcneill * size is larger than the old.
313 1.101 jmcneill */
314 1.101 jmcneill sc = NULL;
315 1.101 jmcneill mutex_enter(&pdk->dk_openlock);
316 1.101 jmcneill LIST_FOREACH(lsc, &pdk->dk_wedges, sc_plink) {
317 1.101 jmcneill if (lsc->sc_offset != dkw->dkw_offset)
318 1.101 jmcneill continue;
319 1.101 jmcneill if (strcmp(lsc->sc_wname, dkw->dkw_wname) != 0)
320 1.101 jmcneill break;
321 1.101 jmcneill if (strcmp(lsc->sc_ptype, dkw->dkw_ptype) != 0)
322 1.101 jmcneill break;
323 1.101 jmcneill if (lsc->sc_size > dkw->dkw_size)
324 1.101 jmcneill break;
325 1.101 jmcneill
326 1.101 jmcneill sc = lsc;
327 1.101 jmcneill sc->sc_size = dkw->dkw_size;
328 1.101 jmcneill dk_set_geometry(sc, pdk);
329 1.101 jmcneill
330 1.101 jmcneill break;
331 1.101 jmcneill }
332 1.101 jmcneill mutex_exit(&pdk->dk_openlock);
333 1.101 jmcneill
334 1.101 jmcneill if (sc != NULL)
335 1.101 jmcneill goto announce;
336 1.101 jmcneill
337 1.1 thorpej sc = malloc(sizeof(*sc), M_DKWEDGE, M_WAITOK|M_ZERO);
338 1.1 thorpej sc->sc_state = DKW_STATE_LARVAL;
339 1.1 thorpej sc->sc_parent = pdk;
340 1.1 thorpej sc->sc_pdev = pdev;
341 1.1 thorpej sc->sc_offset = dkw->dkw_offset;
342 1.1 thorpej sc->sc_size = dkw->dkw_size;
343 1.1 thorpej
344 1.1 thorpej memcpy(sc->sc_wname, dkw->dkw_wname, sizeof(sc->sc_wname));
345 1.1 thorpej sc->sc_wname[sizeof(sc->sc_wname) - 1] = '\0';
346 1.1 thorpej
347 1.1 thorpej memcpy(sc->sc_ptype, dkw->dkw_ptype, sizeof(sc->sc_ptype));
348 1.1 thorpej sc->sc_ptype[sizeof(sc->sc_ptype) - 1] = '\0';
349 1.1 thorpej
350 1.9 yamt bufq_alloc(&sc->sc_bufq, "fcfs", 0);
351 1.1 thorpej
352 1.26 ad callout_init(&sc->sc_restart_ch, 0);
353 1.1 thorpej callout_setfunc(&sc->sc_restart_ch, dkrestart, sc);
354 1.1 thorpej
355 1.92 mlelstv mutex_init(&sc->sc_iolock, MUTEX_DEFAULT, IPL_BIO);
356 1.92 mlelstv cv_init(&sc->sc_dkdrn, "dkdrn");
357 1.92 mlelstv
358 1.1 thorpej /*
359 1.1 thorpej * Wedge will be added; increment the wedge count for the parent.
360 1.107 andvar * Only allow this to happen if RAW_PART is the only thing open.
361 1.1 thorpej */
362 1.27 ad mutex_enter(&pdk->dk_openlock);
363 1.1 thorpej if (pdk->dk_openmask & ~(1 << RAW_PART))
364 1.1 thorpej error = EBUSY;
365 1.1 thorpej else {
366 1.1 thorpej /* Check for wedge overlap. */
367 1.1 thorpej LIST_FOREACH(lsc, &pdk->dk_wedges, sc_plink) {
368 1.1 thorpej daddr_t lastblk = sc->sc_offset + sc->sc_size - 1;
369 1.1 thorpej daddr_t llastblk = lsc->sc_offset + lsc->sc_size - 1;
370 1.1 thorpej
371 1.1 thorpej if (sc->sc_offset >= lsc->sc_offset &&
372 1.1 thorpej sc->sc_offset <= llastblk) {
373 1.63 drochner /* Overlaps the tail of the existing wedge. */
374 1.1 thorpej break;
375 1.1 thorpej }
376 1.1 thorpej if (lastblk >= lsc->sc_offset &&
377 1.1 thorpej lastblk <= llastblk) {
378 1.1 thorpej /* Overlaps the head of the existing wedge. */
379 1.1 thorpej break;
380 1.1 thorpej }
381 1.1 thorpej }
382 1.74 mlelstv if (lsc != NULL) {
383 1.74 mlelstv if (sc->sc_offset == lsc->sc_offset &&
384 1.74 mlelstv sc->sc_size == lsc->sc_size &&
385 1.74 mlelstv strcmp(sc->sc_wname, lsc->sc_wname) == 0)
386 1.74 mlelstv error = EEXIST;
387 1.74 mlelstv else
388 1.74 mlelstv error = EINVAL;
389 1.74 mlelstv } else {
390 1.1 thorpej pdk->dk_nwedges++;
391 1.1 thorpej LIST_INSERT_HEAD(&pdk->dk_wedges, sc, sc_plink);
392 1.1 thorpej }
393 1.1 thorpej }
394 1.27 ad mutex_exit(&pdk->dk_openlock);
395 1.1 thorpej if (error) {
396 1.93 mlelstv cv_destroy(&sc->sc_dkdrn);
397 1.93 mlelstv mutex_destroy(&sc->sc_iolock);
398 1.9 yamt bufq_free(sc->sc_bufq);
399 1.1 thorpej free(sc, M_DKWEDGE);
400 1.1 thorpej return (error);
401 1.1 thorpej }
402 1.1 thorpej
403 1.2 thorpej /* Fill in our cfdata for the pseudo-device glue. */
404 1.2 thorpej sc->sc_cfdata.cf_name = dk_cd.cd_name;
405 1.2 thorpej sc->sc_cfdata.cf_atname = dk_ca.ca_name;
406 1.2 thorpej /* sc->sc_cfdata.cf_unit set below */
407 1.8 nathanw sc->sc_cfdata.cf_fstate = FSTATE_STAR;
408 1.2 thorpej
409 1.1 thorpej /* Insert the larval wedge into the array. */
410 1.27 ad rw_enter(&dkwedges_lock, RW_WRITER);
411 1.1 thorpej for (error = 0;;) {
412 1.1 thorpej struct dkwedge_softc **scpp;
413 1.1 thorpej
414 1.1 thorpej /*
415 1.1 thorpej * Check for a duplicate wname while searching for
416 1.1 thorpej * a slot.
417 1.1 thorpej */
418 1.1 thorpej for (scpp = NULL, unit = 0; unit < ndkwedges; unit++) {
419 1.1 thorpej if (dkwedges[unit] == NULL) {
420 1.1 thorpej if (scpp == NULL) {
421 1.1 thorpej scpp = &dkwedges[unit];
422 1.2 thorpej sc->sc_cfdata.cf_unit = unit;
423 1.1 thorpej }
424 1.1 thorpej } else {
425 1.1 thorpej /* XXX Unicode. */
426 1.1 thorpej if (strcmp(dkwedges[unit]->sc_wname,
427 1.1 thorpej sc->sc_wname) == 0) {
428 1.1 thorpej error = EEXIST;
429 1.1 thorpej break;
430 1.1 thorpej }
431 1.1 thorpej }
432 1.1 thorpej }
433 1.1 thorpej if (error)
434 1.1 thorpej break;
435 1.1 thorpej KASSERT(unit == ndkwedges);
436 1.1 thorpej if (scpp == NULL)
437 1.1 thorpej dkwedge_array_expand();
438 1.1 thorpej else {
439 1.2 thorpej KASSERT(scpp == &dkwedges[sc->sc_cfdata.cf_unit]);
440 1.1 thorpej *scpp = sc;
441 1.1 thorpej break;
442 1.1 thorpej }
443 1.1 thorpej }
444 1.27 ad rw_exit(&dkwedges_lock);
445 1.1 thorpej if (error) {
446 1.27 ad mutex_enter(&pdk->dk_openlock);
447 1.1 thorpej pdk->dk_nwedges--;
448 1.1 thorpej LIST_REMOVE(sc, sc_plink);
449 1.27 ad mutex_exit(&pdk->dk_openlock);
450 1.1 thorpej
451 1.93 mlelstv cv_destroy(&sc->sc_dkdrn);
452 1.93 mlelstv mutex_destroy(&sc->sc_iolock);
453 1.9 yamt bufq_free(sc->sc_bufq);
454 1.1 thorpej free(sc, M_DKWEDGE);
455 1.1 thorpej return (error);
456 1.1 thorpej }
457 1.1 thorpej
458 1.2 thorpej /*
459 1.2 thorpej * Now that we know the unit #, attach a pseudo-device for
460 1.2 thorpej * this wedge instance. This will provide us with the
461 1.65 chs * device_t necessary for glue to other parts of the system.
462 1.2 thorpej *
463 1.2 thorpej * This should never fail, unless we're almost totally out of
464 1.2 thorpej * memory.
465 1.2 thorpej */
466 1.2 thorpej if ((sc->sc_dev = config_attach_pseudo(&sc->sc_cfdata)) == NULL) {
467 1.2 thorpej aprint_error("%s%u: unable to attach pseudo-device\n",
468 1.2 thorpej sc->sc_cfdata.cf_name, sc->sc_cfdata.cf_unit);
469 1.2 thorpej
470 1.27 ad rw_enter(&dkwedges_lock, RW_WRITER);
471 1.2 thorpej dkwedges[sc->sc_cfdata.cf_unit] = NULL;
472 1.27 ad rw_exit(&dkwedges_lock);
473 1.2 thorpej
474 1.27 ad mutex_enter(&pdk->dk_openlock);
475 1.2 thorpej pdk->dk_nwedges--;
476 1.2 thorpej LIST_REMOVE(sc, sc_plink);
477 1.27 ad mutex_exit(&pdk->dk_openlock);
478 1.2 thorpej
479 1.93 mlelstv cv_destroy(&sc->sc_dkdrn);
480 1.93 mlelstv mutex_destroy(&sc->sc_iolock);
481 1.9 yamt bufq_free(sc->sc_bufq);
482 1.2 thorpej free(sc, M_DKWEDGE);
483 1.2 thorpej return (ENOMEM);
484 1.2 thorpej }
485 1.1 thorpej
486 1.1 thorpej /*
487 1.1 thorpej * XXX Really ought to make the disk_attach() and the changing
488 1.1 thorpej * of state to RUNNING atomic.
489 1.1 thorpej */
490 1.1 thorpej
491 1.36 cegger disk_init(&sc->sc_dk, device_xname(sc->sc_dev), NULL);
492 1.77 mlelstv dk_set_geometry(sc, pdk);
493 1.1 thorpej disk_attach(&sc->sc_dk);
494 1.1 thorpej
495 1.1 thorpej /* Disk wedge is ready for use! */
496 1.1 thorpej sc->sc_state = DKW_STATE_RUNNING;
497 1.1 thorpej
498 1.101 jmcneill announce:
499 1.1 thorpej /* Announce our arrival. */
500 1.84 jmcneill aprint_normal(
501 1.84 jmcneill "%s at %s: \"%s\", %"PRIu64" blocks at %"PRId64", type: %s\n",
502 1.84 jmcneill device_xname(sc->sc_dev), pdk->dk_name,
503 1.84 jmcneill sc->sc_wname, /* XXX Unicode */
504 1.84 jmcneill sc->sc_size, sc->sc_offset,
505 1.84 jmcneill sc->sc_ptype[0] == '\0' ? "<unknown>" : sc->sc_ptype);
506 1.1 thorpej
507 1.112 martin /* Return the devname to the caller. */
508 1.112 martin strlcpy(dkw->dkw_devname, device_xname(sc->sc_dev),
509 1.112 martin sizeof(dkw->dkw_devname));
510 1.112 martin
511 1.1 thorpej return (0);
512 1.1 thorpej }
513 1.1 thorpej
514 1.1 thorpej /*
515 1.47 dyoung * dkwedge_find:
516 1.1 thorpej *
517 1.47 dyoung * Lookup a disk wedge based on the provided information.
518 1.1 thorpej * NOTE: We look up the wedge based on the wedge devname,
519 1.1 thorpej * not wname.
520 1.47 dyoung *
521 1.47 dyoung * Return NULL if the wedge is not found, otherwise return
522 1.47 dyoung * the wedge's softc. Assign the wedge's unit number to unitp
523 1.47 dyoung * if unitp is not NULL.
524 1.1 thorpej */
525 1.47 dyoung static struct dkwedge_softc *
526 1.47 dyoung dkwedge_find(struct dkwedge_info *dkw, u_int *unitp)
527 1.1 thorpej {
528 1.1 thorpej struct dkwedge_softc *sc = NULL;
529 1.1 thorpej u_int unit;
530 1.1 thorpej
531 1.1 thorpej /* Find our softc. */
532 1.1 thorpej dkw->dkw_devname[sizeof(dkw->dkw_devname) - 1] = '\0';
533 1.47 dyoung rw_enter(&dkwedges_lock, RW_READER);
534 1.1 thorpej for (unit = 0; unit < ndkwedges; unit++) {
535 1.1 thorpej if ((sc = dkwedges[unit]) != NULL &&
536 1.36 cegger strcmp(device_xname(sc->sc_dev), dkw->dkw_devname) == 0 &&
537 1.1 thorpej strcmp(sc->sc_parent->dk_name, dkw->dkw_parent) == 0) {
538 1.1 thorpej break;
539 1.1 thorpej }
540 1.1 thorpej }
541 1.27 ad rw_exit(&dkwedges_lock);
542 1.1 thorpej if (unit == ndkwedges)
543 1.47 dyoung return NULL;
544 1.47 dyoung
545 1.47 dyoung if (unitp != NULL)
546 1.47 dyoung *unitp = unit;
547 1.47 dyoung
548 1.47 dyoung return sc;
549 1.47 dyoung }
550 1.47 dyoung
/*
 * dkwedge_del:	[exported function]
 *
 *	Remove the wedge described by dkw.  The wedge is identified by
 *	its device name (dkw_devname) together with its parent, not by
 *	its wname.  No detach flags are passed on.
 */
int
dkwedge_del(struct dkwedge_info *dkw)
{
	const int noflags = 0;

	return dkwedge_del1(dkw, noflags);
}
563 1.74 mlelstv
564 1.74 mlelstv int
565 1.74 mlelstv dkwedge_del1(struct dkwedge_info *dkw, int flags)
566 1.74 mlelstv {
567 1.47 dyoung struct dkwedge_softc *sc = NULL;
568 1.47 dyoung
569 1.47 dyoung /* Find our softc. */
570 1.47 dyoung if ((sc = dkwedge_find(dkw, NULL)) == NULL)
571 1.1 thorpej return (ESRCH);
572 1.1 thorpej
573 1.74 mlelstv return config_detach(sc->sc_dev, flags);
574 1.47 dyoung }
575 1.47 dyoung
576 1.47 dyoung static int
577 1.74 mlelstv dkwedge_cleanup_parent(struct dkwedge_softc *sc, int flags)
578 1.47 dyoung {
579 1.47 dyoung struct disk *dk = &sc->sc_dk;
580 1.47 dyoung int rc;
581 1.47 dyoung
582 1.47 dyoung rc = 0;
583 1.47 dyoung mutex_enter(&dk->dk_openlock);
584 1.115 riastrad if (dk->dk_openmask == 0) {
585 1.91 mlelstv /* nothing to do */
586 1.115 riastrad } else if ((flags & DETACH_FORCE) == 0) {
587 1.47 dyoung rc = EBUSY;
588 1.90 mlelstv } else {
589 1.57 bouyer mutex_enter(&sc->sc_parent->dk_rawlock);
590 1.114 riastrad rc = dklastclose(sc);
591 1.114 riastrad mutex_exit(&sc->sc_parent->dk_rawlock);
592 1.57 bouyer }
593 1.115 riastrad mutex_exit(&sc->sc_dk.dk_openlock);
594 1.47 dyoung
595 1.47 dyoung return rc;
596 1.47 dyoung }
597 1.47 dyoung
598 1.47 dyoung /*
599 1.47 dyoung * dkwedge_detach:
600 1.47 dyoung *
601 1.47 dyoung * Autoconfiguration detach function for pseudo-device glue.
602 1.47 dyoung */
603 1.47 dyoung static int
604 1.47 dyoung dkwedge_detach(device_t self, int flags)
605 1.47 dyoung {
606 1.47 dyoung struct dkwedge_softc *sc = NULL;
607 1.47 dyoung u_int unit;
608 1.92 mlelstv int bmaj, cmaj, rc;
609 1.47 dyoung
610 1.47 dyoung rw_enter(&dkwedges_lock, RW_WRITER);
611 1.47 dyoung for (unit = 0; unit < ndkwedges; unit++) {
612 1.47 dyoung if ((sc = dkwedges[unit]) != NULL && sc->sc_dev == self)
613 1.47 dyoung break;
614 1.47 dyoung }
615 1.47 dyoung if (unit == ndkwedges)
616 1.47 dyoung rc = ENXIO;
617 1.74 mlelstv else if ((rc = dkwedge_cleanup_parent(sc, flags)) == 0) {
618 1.47 dyoung /* Mark the wedge as dying. */
619 1.47 dyoung sc->sc_state = DKW_STATE_DYING;
620 1.47 dyoung }
621 1.47 dyoung rw_exit(&dkwedges_lock);
622 1.47 dyoung
623 1.47 dyoung if (rc != 0)
624 1.47 dyoung return rc;
625 1.47 dyoung
626 1.47 dyoung pmf_device_deregister(self);
627 1.1 thorpej
628 1.1 thorpej /* Locate the wedge major numbers. */
629 1.1 thorpej bmaj = bdevsw_lookup_major(&dk_bdevsw);
630 1.1 thorpej cmaj = cdevsw_lookup_major(&dk_cdevsw);
631 1.1 thorpej
632 1.1 thorpej /* Kill any pending restart. */
633 1.1 thorpej callout_stop(&sc->sc_restart_ch);
634 1.1 thorpej
635 1.1 thorpej /*
636 1.1 thorpej * dkstart() will kill any queued buffers now that the
637 1.1 thorpej * state of the wedge is not RUNNING. Once we've done
638 1.1 thorpej * that, wait for any other pending I/O to complete.
639 1.1 thorpej */
640 1.1 thorpej dkstart(sc);
641 1.1 thorpej dkwedge_wait_drain(sc);
642 1.1 thorpej
643 1.1 thorpej /* Nuke the vnodes for any open instances. */
644 1.14 thorpej vdevgone(bmaj, unit, unit, VBLK);
645 1.14 thorpej vdevgone(cmaj, unit, unit, VCHR);
646 1.1 thorpej
647 1.1 thorpej /* Clean up the parent. */
648 1.74 mlelstv dkwedge_cleanup_parent(sc, flags | DETACH_FORCE);
649 1.1 thorpej
650 1.1 thorpej /* Announce our departure. */
651 1.36 cegger aprint_normal("%s at %s (%s) deleted\n", device_xname(sc->sc_dev),
652 1.1 thorpej sc->sc_parent->dk_name,
653 1.1 thorpej sc->sc_wname); /* XXX Unicode */
654 1.1 thorpej
655 1.27 ad mutex_enter(&sc->sc_parent->dk_openlock);
656 1.1 thorpej sc->sc_parent->dk_nwedges--;
657 1.1 thorpej LIST_REMOVE(sc, sc_plink);
658 1.27 ad mutex_exit(&sc->sc_parent->dk_openlock);
659 1.1 thorpej
660 1.1 thorpej /* Delete our buffer queue. */
661 1.9 yamt bufq_free(sc->sc_bufq);
662 1.1 thorpej
663 1.1 thorpej /* Detach from the disk list. */
664 1.1 thorpej disk_detach(&sc->sc_dk);
665 1.39 plunky disk_destroy(&sc->sc_dk);
666 1.1 thorpej
667 1.1 thorpej /* Poof. */
668 1.27 ad rw_enter(&dkwedges_lock, RW_WRITER);
669 1.1 thorpej dkwedges[unit] = NULL;
670 1.1 thorpej sc->sc_state = DKW_STATE_DEAD;
671 1.27 ad rw_exit(&dkwedges_lock);
672 1.1 thorpej
673 1.92 mlelstv mutex_destroy(&sc->sc_iolock);
674 1.92 mlelstv cv_destroy(&sc->sc_dkdrn);
675 1.92 mlelstv
676 1.1 thorpej free(sc, M_DKWEDGE);
677 1.1 thorpej
678 1.47 dyoung return 0;
679 1.1 thorpej }
680 1.1 thorpej
/*
 * dkwedge_delall:	[exported function]
 *
 *	Remove every wedge of the given disk, whether or not it is in
 *	use.  Used when a disk is being detached.
 */
void
dkwedge_delall(struct disk *pdk)
{
	const bool idleonly = false;

	dkwedge_delall1(pdk, idleonly);
}
692 1.74 mlelstv
693 1.74 mlelstv static void
694 1.74 mlelstv dkwedge_delall1(struct disk *pdk, bool idleonly)
695 1.74 mlelstv {
696 1.1 thorpej struct dkwedge_info dkw;
697 1.1 thorpej struct dkwedge_softc *sc;
698 1.74 mlelstv int flags;
699 1.74 mlelstv
700 1.74 mlelstv flags = DETACH_QUIET;
701 1.74 mlelstv if (!idleonly) flags |= DETACH_FORCE;
702 1.1 thorpej
703 1.1 thorpej for (;;) {
704 1.27 ad mutex_enter(&pdk->dk_openlock);
705 1.74 mlelstv LIST_FOREACH(sc, &pdk->dk_wedges, sc_plink) {
706 1.74 mlelstv if (!idleonly || sc->sc_dk.dk_openmask == 0)
707 1.74 mlelstv break;
708 1.74 mlelstv }
709 1.74 mlelstv if (sc == NULL) {
710 1.74 mlelstv KASSERT(idleonly || pdk->dk_nwedges == 0);
711 1.27 ad mutex_exit(&pdk->dk_openlock);
712 1.1 thorpej return;
713 1.1 thorpej }
714 1.94 maya strlcpy(dkw.dkw_parent, pdk->dk_name, sizeof(dkw.dkw_parent));
715 1.36 cegger strlcpy(dkw.dkw_devname, device_xname(sc->sc_dev),
716 1.36 cegger sizeof(dkw.dkw_devname));
717 1.27 ad mutex_exit(&pdk->dk_openlock);
718 1.74 mlelstv (void) dkwedge_del1(&dkw, flags);
719 1.1 thorpej }
720 1.1 thorpej }
721 1.1 thorpej
722 1.1 thorpej /*
723 1.1 thorpej * dkwedge_list: [exported function]
724 1.1 thorpej *
725 1.1 thorpej * List all of the wedges on a particular disk.
726 1.1 thorpej */
727 1.1 thorpej int
728 1.10 christos dkwedge_list(struct disk *pdk, struct dkwedge_list *dkwl, struct lwp *l)
729 1.1 thorpej {
730 1.1 thorpej struct uio uio;
731 1.1 thorpej struct iovec iov;
732 1.1 thorpej struct dkwedge_softc *sc;
733 1.1 thorpej struct dkwedge_info dkw;
734 1.1 thorpej int error = 0;
735 1.1 thorpej
736 1.1 thorpej iov.iov_base = dkwl->dkwl_buf;
737 1.1 thorpej iov.iov_len = dkwl->dkwl_bufsize;
738 1.1 thorpej
739 1.1 thorpej uio.uio_iov = &iov;
740 1.1 thorpej uio.uio_iovcnt = 1;
741 1.1 thorpej uio.uio_offset = 0;
742 1.1 thorpej uio.uio_resid = dkwl->dkwl_bufsize;
743 1.1 thorpej uio.uio_rw = UIO_READ;
744 1.51 pooka KASSERT(l == curlwp);
745 1.51 pooka uio.uio_vmspace = l->l_proc->p_vmspace;
746 1.1 thorpej
747 1.1 thorpej dkwl->dkwl_ncopied = 0;
748 1.1 thorpej
749 1.27 ad mutex_enter(&pdk->dk_openlock);
750 1.1 thorpej LIST_FOREACH(sc, &pdk->dk_wedges, sc_plink) {
751 1.1 thorpej if (uio.uio_resid < sizeof(dkw))
752 1.1 thorpej break;
753 1.1 thorpej
754 1.1 thorpej if (sc->sc_state != DKW_STATE_RUNNING)
755 1.1 thorpej continue;
756 1.1 thorpej
757 1.36 cegger strlcpy(dkw.dkw_devname, device_xname(sc->sc_dev),
758 1.36 cegger sizeof(dkw.dkw_devname));
759 1.1 thorpej memcpy(dkw.dkw_wname, sc->sc_wname, sizeof(dkw.dkw_wname));
760 1.1 thorpej dkw.dkw_wname[sizeof(dkw.dkw_wname) - 1] = '\0';
761 1.94 maya strlcpy(dkw.dkw_parent, sc->sc_parent->dk_name,
762 1.94 maya sizeof(dkw.dkw_parent));
763 1.1 thorpej dkw.dkw_offset = sc->sc_offset;
764 1.1 thorpej dkw.dkw_size = sc->sc_size;
765 1.94 maya strlcpy(dkw.dkw_ptype, sc->sc_ptype, sizeof(dkw.dkw_ptype));
766 1.1 thorpej
767 1.1 thorpej error = uiomove(&dkw, sizeof(dkw), &uio);
768 1.1 thorpej if (error)
769 1.1 thorpej break;
770 1.1 thorpej dkwl->dkwl_ncopied++;
771 1.1 thorpej }
772 1.1 thorpej dkwl->dkwl_nwedges = pdk->dk_nwedges;
773 1.27 ad mutex_exit(&pdk->dk_openlock);
774 1.1 thorpej
775 1.1 thorpej return (error);
776 1.1 thorpej }
777 1.1 thorpej
778 1.25 dyoung device_t
779 1.25 dyoung dkwedge_find_by_wname(const char *wname)
780 1.25 dyoung {
781 1.25 dyoung device_t dv = NULL;
782 1.25 dyoung struct dkwedge_softc *sc;
783 1.25 dyoung int i;
784 1.25 dyoung
785 1.27 ad rw_enter(&dkwedges_lock, RW_WRITER);
786 1.25 dyoung for (i = 0; i < ndkwedges; i++) {
787 1.25 dyoung if ((sc = dkwedges[i]) == NULL)
788 1.25 dyoung continue;
789 1.25 dyoung if (strcmp(sc->sc_wname, wname) == 0) {
790 1.25 dyoung if (dv != NULL) {
791 1.25 dyoung printf(
792 1.25 dyoung "WARNING: double match for wedge name %s "
793 1.25 dyoung "(%s, %s)\n", wname, device_xname(dv),
794 1.25 dyoung device_xname(sc->sc_dev));
795 1.25 dyoung continue;
796 1.25 dyoung }
797 1.25 dyoung dv = sc->sc_dev;
798 1.25 dyoung }
799 1.25 dyoung }
800 1.27 ad rw_exit(&dkwedges_lock);
801 1.25 dyoung return dv;
802 1.25 dyoung }
803 1.25 dyoung
804 1.89 christos device_t
805 1.89 christos dkwedge_find_by_parent(const char *name, size_t *i)
806 1.89 christos {
807 1.89 christos rw_enter(&dkwedges_lock, RW_WRITER);
808 1.89 christos for (; *i < (size_t)ndkwedges; (*i)++) {
809 1.89 christos struct dkwedge_softc *sc;
810 1.89 christos if ((sc = dkwedges[*i]) == NULL)
811 1.89 christos continue;
812 1.89 christos if (strcmp(sc->sc_parent->dk_name, name) != 0)
813 1.89 christos continue;
814 1.89 christos rw_exit(&dkwedges_lock);
815 1.89 christos return sc->sc_dev;
816 1.89 christos }
817 1.89 christos rw_exit(&dkwedges_lock);
818 1.89 christos return NULL;
819 1.89 christos }
820 1.89 christos
821 1.25 dyoung void
822 1.25 dyoung dkwedge_print_wnames(void)
823 1.25 dyoung {
824 1.25 dyoung struct dkwedge_softc *sc;
825 1.25 dyoung int i;
826 1.25 dyoung
827 1.27 ad rw_enter(&dkwedges_lock, RW_WRITER);
828 1.25 dyoung for (i = 0; i < ndkwedges; i++) {
829 1.25 dyoung if ((sc = dkwedges[i]) == NULL)
830 1.25 dyoung continue;
831 1.25 dyoung printf(" wedge:%s", sc->sc_wname);
832 1.25 dyoung }
833 1.27 ad rw_exit(&dkwedges_lock);
834 1.25 dyoung }
835 1.25 dyoung
836 1.1 thorpej /*
837 1.18 uebayasi * We need a dummy object to stuff into the dkwedge discovery method link
838 1.1 thorpej * set to ensure that there is always at least one object in the set.
839 1.1 thorpej */
840 1.1 thorpej static struct dkwedge_discovery_method dummy_discovery_method;
841 1.1 thorpej __link_set_add_bss(dkwedge_methods, dummy_discovery_method);
842 1.1 thorpej
843 1.1 thorpej /*
844 1.27 ad * dkwedge_init:
845 1.1 thorpej *
846 1.27 ad * Initialize the disk wedge subsystem.
847 1.1 thorpej */
848 1.27 ad void
849 1.27 ad dkwedge_init(void)
850 1.1 thorpej {
851 1.1 thorpej __link_set_decl(dkwedge_methods, struct dkwedge_discovery_method);
852 1.1 thorpej struct dkwedge_discovery_method * const *ddmp;
853 1.1 thorpej struct dkwedge_discovery_method *lddm, *ddm;
854 1.1 thorpej
855 1.27 ad rw_init(&dkwedges_lock);
856 1.27 ad rw_init(&dkwedge_discovery_methods_lock);
857 1.27 ad
858 1.27 ad if (config_cfdriver_attach(&dk_cd) != 0)
859 1.27 ad panic("dkwedge: unable to attach cfdriver");
860 1.27 ad if (config_cfattach_attach(dk_cd.cd_name, &dk_ca) != 0)
861 1.27 ad panic("dkwedge: unable to attach cfattach");
862 1.1 thorpej
863 1.27 ad rw_enter(&dkwedge_discovery_methods_lock, RW_WRITER);
864 1.1 thorpej
865 1.1 thorpej LIST_INIT(&dkwedge_discovery_methods);
866 1.1 thorpej
867 1.1 thorpej __link_set_foreach(ddmp, dkwedge_methods) {
868 1.1 thorpej ddm = *ddmp;
869 1.1 thorpej if (ddm == &dummy_discovery_method)
870 1.1 thorpej continue;
871 1.1 thorpej if (LIST_EMPTY(&dkwedge_discovery_methods)) {
872 1.1 thorpej LIST_INSERT_HEAD(&dkwedge_discovery_methods,
873 1.1 thorpej ddm, ddm_list);
874 1.1 thorpej continue;
875 1.1 thorpej }
876 1.1 thorpej LIST_FOREACH(lddm, &dkwedge_discovery_methods, ddm_list) {
877 1.1 thorpej if (ddm->ddm_priority == lddm->ddm_priority) {
878 1.1 thorpej aprint_error("dk-method-%s: method \"%s\" "
879 1.1 thorpej "already exists at priority %d\n",
880 1.1 thorpej ddm->ddm_name, lddm->ddm_name,
881 1.1 thorpej lddm->ddm_priority);
882 1.1 thorpej /* Not inserted. */
883 1.1 thorpej break;
884 1.1 thorpej }
885 1.1 thorpej if (ddm->ddm_priority < lddm->ddm_priority) {
886 1.1 thorpej /* Higher priority; insert before. */
887 1.1 thorpej LIST_INSERT_BEFORE(lddm, ddm, ddm_list);
888 1.1 thorpej break;
889 1.1 thorpej }
890 1.1 thorpej if (LIST_NEXT(lddm, ddm_list) == NULL) {
891 1.1 thorpej /* Last one; insert after. */
892 1.1 thorpej KASSERT(lddm->ddm_priority < ddm->ddm_priority);
893 1.1 thorpej LIST_INSERT_AFTER(lddm, ddm, ddm_list);
894 1.1 thorpej break;
895 1.1 thorpej }
896 1.1 thorpej }
897 1.1 thorpej }
898 1.1 thorpej
899 1.27 ad rw_exit(&dkwedge_discovery_methods_lock);
900 1.1 thorpej }
901 1.1 thorpej
/*
 * Wedge autodiscovery switch, consulted by dkwedge_discover().  It is
 * on by default only when the kernel is built with DKWEDGE_AUTODISCOVER.
 */
#ifndef DKWEDGE_AUTODISCOVER
int	dkwedge_autodiscover = 0;
#else
int	dkwedge_autodiscover = 1;
#endif
907 1.1 thorpej
908 1.1 thorpej /*
909 1.1 thorpej * dkwedge_discover: [exported function]
910 1.1 thorpej *
911 1.1 thorpej * Discover the wedges on a newly attached disk.
912 1.74 mlelstv * Remove all unused wedges on the disk first.
913 1.1 thorpej */
914 1.1 thorpej void
915 1.1 thorpej dkwedge_discover(struct disk *pdk)
916 1.1 thorpej {
917 1.1 thorpej struct dkwedge_discovery_method *ddm;
918 1.1 thorpej struct vnode *vp;
919 1.1 thorpej int error;
920 1.1 thorpej dev_t pdev;
921 1.1 thorpej
922 1.1 thorpej /*
923 1.1 thorpej * Require people playing with wedges to enable this explicitly.
924 1.1 thorpej */
925 1.1 thorpej if (dkwedge_autodiscover == 0)
926 1.1 thorpej return;
927 1.1 thorpej
928 1.27 ad rw_enter(&dkwedge_discovery_methods_lock, RW_READER);
929 1.1 thorpej
930 1.74 mlelstv /*
931 1.74 mlelstv * Use the character device for scanning, the block device
932 1.74 mlelstv * is busy if there are already wedges attached.
933 1.74 mlelstv */
934 1.74 mlelstv error = dkwedge_compute_pdev(pdk->dk_name, &pdev, VCHR);
935 1.1 thorpej if (error) {
936 1.1 thorpej aprint_error("%s: unable to compute pdev, error = %d\n",
937 1.1 thorpej pdk->dk_name, error);
938 1.1 thorpej goto out;
939 1.1 thorpej }
940 1.1 thorpej
941 1.74 mlelstv error = cdevvp(pdev, &vp);
942 1.1 thorpej if (error) {
943 1.1 thorpej aprint_error("%s: unable to find vnode for pdev, error = %d\n",
944 1.1 thorpej pdk->dk_name, error);
945 1.1 thorpej goto out;
946 1.1 thorpej }
947 1.1 thorpej
948 1.1 thorpej error = vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
949 1.1 thorpej if (error) {
950 1.1 thorpej aprint_error("%s: unable to lock vnode for pdev, error = %d\n",
951 1.1 thorpej pdk->dk_name, error);
952 1.1 thorpej vrele(vp);
953 1.1 thorpej goto out;
954 1.1 thorpej }
955 1.1 thorpej
956 1.62 jmcneill error = VOP_OPEN(vp, FREAD | FSILENT, NOCRED);
957 1.1 thorpej if (error) {
958 1.67 soren if (error != ENODEV)
959 1.67 soren aprint_error("%s: unable to open device, error = %d\n",
960 1.67 soren pdk->dk_name, error);
961 1.1 thorpej vput(vp);
962 1.1 thorpej goto out;
963 1.1 thorpej }
964 1.56 hannken VOP_UNLOCK(vp);
965 1.1 thorpej
966 1.1 thorpej /*
967 1.74 mlelstv * Remove unused wedges
968 1.74 mlelstv */
969 1.74 mlelstv dkwedge_delall1(pdk, true);
970 1.74 mlelstv
971 1.74 mlelstv /*
972 1.1 thorpej * For each supported partition map type, look to see if
973 1.1 thorpej * this map type exists. If so, parse it and add the
974 1.1 thorpej * corresponding wedges.
975 1.1 thorpej */
976 1.1 thorpej LIST_FOREACH(ddm, &dkwedge_discovery_methods, ddm_list) {
977 1.1 thorpej error = (*ddm->ddm_discover)(pdk, vp);
978 1.1 thorpej if (error == 0) {
979 1.1 thorpej /* Successfully created wedges; we're done. */
980 1.1 thorpej break;
981 1.1 thorpej }
982 1.1 thorpej }
983 1.1 thorpej
984 1.35 ad error = vn_close(vp, FREAD, NOCRED);
985 1.1 thorpej if (error) {
986 1.1 thorpej aprint_error("%s: unable to close device, error = %d\n",
987 1.1 thorpej pdk->dk_name, error);
988 1.1 thorpej /* We'll just assume the vnode has been cleaned up. */
989 1.1 thorpej }
990 1.75 mlelstv
991 1.1 thorpej out:
992 1.27 ad rw_exit(&dkwedge_discovery_methods_lock);
993 1.1 thorpej }
994 1.1 thorpej
995 1.1 thorpej /*
996 1.1 thorpej * dkwedge_read:
997 1.1 thorpej *
998 1.37 agc * Read some data from the specified disk, used for
999 1.1 thorpej * partition discovery.
1000 1.1 thorpej */
1001 1.1 thorpej int
1002 1.20 christos dkwedge_read(struct disk *pdk, struct vnode *vp, daddr_t blkno,
1003 1.19 christos void *tbuf, size_t len)
1004 1.1 thorpej {
1005 1.74 mlelstv buf_t *bp;
1006 1.81 mlelstv int error;
1007 1.82 mlelstv bool isopen;
1008 1.82 mlelstv dev_t bdev;
1009 1.83 pooka struct vnode *bdvp;
1010 1.74 mlelstv
1011 1.74 mlelstv /*
1012 1.74 mlelstv * The kernel cannot read from a character device vnode
1013 1.74 mlelstv * as physio() only handles user memory.
1014 1.74 mlelstv *
1015 1.82 mlelstv * If the block device has already been opened by a wedge
1016 1.82 mlelstv * use that vnode and temporarily bump the open counter.
1017 1.82 mlelstv *
1018 1.82 mlelstv * Otherwise try to open the block device.
1019 1.74 mlelstv */
1020 1.1 thorpej
1021 1.82 mlelstv bdev = devsw_chr2blk(vp->v_rdev);
1022 1.82 mlelstv
1023 1.82 mlelstv mutex_enter(&pdk->dk_rawlock);
1024 1.82 mlelstv if (pdk->dk_rawopens != 0) {
1025 1.82 mlelstv KASSERT(pdk->dk_rawvp != NULL);
1026 1.82 mlelstv isopen = true;
1027 1.82 mlelstv ++pdk->dk_rawopens;
1028 1.83 pooka bdvp = pdk->dk_rawvp;
1029 1.87 mlelstv error = 0;
1030 1.82 mlelstv } else {
1031 1.82 mlelstv isopen = false;
1032 1.87 mlelstv error = dk_open_parent(bdev, FREAD, &bdvp);
1033 1.82 mlelstv }
1034 1.82 mlelstv mutex_exit(&pdk->dk_rawlock);
1035 1.82 mlelstv
1036 1.87 mlelstv if (error)
1037 1.87 mlelstv return error;
1038 1.82 mlelstv
1039 1.83 pooka bp = getiobuf(bdvp, true);
1040 1.41 ad bp->b_flags = B_READ;
1041 1.74 mlelstv bp->b_cflags = BC_BUSY;
1042 1.82 mlelstv bp->b_dev = bdev;
1043 1.41 ad bp->b_data = tbuf;
1044 1.75 mlelstv bp->b_bufsize = bp->b_bcount = len;
1045 1.74 mlelstv bp->b_blkno = blkno;
1046 1.75 mlelstv bp->b_cylinder = 0;
1047 1.75 mlelstv bp->b_error = 0;
1048 1.74 mlelstv
1049 1.83 pooka VOP_STRATEGY(bdvp, bp);
1050 1.74 mlelstv error = biowait(bp);
1051 1.41 ad putiobuf(bp);
1052 1.1 thorpej
1053 1.82 mlelstv mutex_enter(&pdk->dk_rawlock);
1054 1.82 mlelstv if (isopen) {
1055 1.82 mlelstv --pdk->dk_rawopens;
1056 1.82 mlelstv } else {
1057 1.83 pooka dk_close_parent(bdvp, FREAD);
1058 1.82 mlelstv }
1059 1.82 mlelstv mutex_exit(&pdk->dk_rawlock);
1060 1.74 mlelstv
1061 1.74 mlelstv return error;
1062 1.1 thorpej }
1063 1.1 thorpej
1064 1.1 thorpej /*
1065 1.1 thorpej * dkwedge_lookup:
1066 1.1 thorpej *
1067 1.1 thorpej * Look up a dkwedge_softc based on the provided dev_t.
1068 1.1 thorpej */
1069 1.1 thorpej static struct dkwedge_softc *
1070 1.1 thorpej dkwedge_lookup(dev_t dev)
1071 1.1 thorpej {
1072 1.3 thorpej int unit = minor(dev);
1073 1.1 thorpej
1074 1.1 thorpej if (unit >= ndkwedges)
1075 1.1 thorpej return (NULL);
1076 1.1 thorpej
1077 1.1 thorpej KASSERT(dkwedges != NULL);
1078 1.1 thorpej
1079 1.1 thorpej return (dkwedges[unit]);
1080 1.1 thorpej }
1081 1.1 thorpej
1082 1.87 mlelstv static int
1083 1.87 mlelstv dk_open_parent(dev_t dev, int mode, struct vnode **vpp)
1084 1.82 mlelstv {
1085 1.82 mlelstv struct vnode *vp;
1086 1.82 mlelstv int error;
1087 1.82 mlelstv
1088 1.82 mlelstv error = bdevvp(dev, &vp);
1089 1.82 mlelstv if (error)
1090 1.87 mlelstv return error;
1091 1.82 mlelstv
1092 1.82 mlelstv error = vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
1093 1.82 mlelstv if (error) {
1094 1.82 mlelstv vrele(vp);
1095 1.87 mlelstv return error;
1096 1.82 mlelstv }
1097 1.82 mlelstv error = VOP_OPEN(vp, mode, NOCRED);
1098 1.82 mlelstv if (error) {
1099 1.82 mlelstv vput(vp);
1100 1.87 mlelstv return error;
1101 1.82 mlelstv }
1102 1.82 mlelstv
1103 1.82 mlelstv /* VOP_OPEN() doesn't do this for us. */
1104 1.82 mlelstv if (mode & FWRITE) {
1105 1.82 mlelstv mutex_enter(vp->v_interlock);
1106 1.82 mlelstv vp->v_writecount++;
1107 1.82 mlelstv mutex_exit(vp->v_interlock);
1108 1.82 mlelstv }
1109 1.82 mlelstv
1110 1.82 mlelstv VOP_UNLOCK(vp);
1111 1.82 mlelstv
1112 1.87 mlelstv *vpp = vp;
1113 1.87 mlelstv
1114 1.87 mlelstv return 0;
1115 1.82 mlelstv }
1116 1.82 mlelstv
1117 1.82 mlelstv static int
1118 1.82 mlelstv dk_close_parent(struct vnode *vp, int mode)
1119 1.82 mlelstv {
1120 1.82 mlelstv int error;
1121 1.82 mlelstv
1122 1.82 mlelstv error = vn_close(vp, mode, NOCRED);
1123 1.82 mlelstv return error;
1124 1.82 mlelstv }
1125 1.82 mlelstv
1126 1.1 thorpej /*
1127 1.1 thorpej * dkopen: [devsw entry point]
1128 1.1 thorpej *
1129 1.1 thorpej * Open a wedge.
1130 1.1 thorpej */
1131 1.1 thorpej static int
1132 1.20 christos dkopen(dev_t dev, int flags, int fmt, struct lwp *l)
1133 1.1 thorpej {
1134 1.1 thorpej struct dkwedge_softc *sc = dkwedge_lookup(dev);
1135 1.104 mlelstv struct dkwedge_softc *nsc;
1136 1.1 thorpej struct vnode *vp;
1137 1.14 thorpej int error = 0;
1138 1.103 mlelstv int mode;
1139 1.1 thorpej
1140 1.1 thorpej if (sc == NULL)
1141 1.1 thorpej return (ENODEV);
1142 1.1 thorpej if (sc->sc_state != DKW_STATE_RUNNING)
1143 1.1 thorpej return (ENXIO);
1144 1.1 thorpej
1145 1.1 thorpej /*
1146 1.1 thorpej * We go through a complicated little dance to only open the parent
1147 1.1 thorpej * vnode once per wedge, no matter how many times the wedge is
1148 1.1 thorpej * opened. The reason? We see one dkopen() per open call, but
1149 1.1 thorpej * only dkclose() on the last close.
1150 1.1 thorpej */
1151 1.27 ad mutex_enter(&sc->sc_dk.dk_openlock);
1152 1.27 ad mutex_enter(&sc->sc_parent->dk_rawlock);
1153 1.3 thorpej if (sc->sc_dk.dk_openmask == 0) {
1154 1.23 dyoung if (sc->sc_parent->dk_rawopens == 0) {
1155 1.1 thorpej KASSERT(sc->sc_parent->dk_rawvp == NULL);
1156 1.103 mlelstv /*
1157 1.103 mlelstv * Try open read-write. If this fails for EROFS
1158 1.103 mlelstv * and wedge is read-only, retry to open read-only.
1159 1.103 mlelstv */
1160 1.103 mlelstv mode = FREAD | FWRITE;
1161 1.103 mlelstv error = dk_open_parent(sc->sc_pdev, mode, &vp);
1162 1.103 mlelstv if (error == EROFS && (flags & FWRITE) == 0) {
1163 1.103 mlelstv mode &= ~FWRITE;
1164 1.103 mlelstv error = dk_open_parent(sc->sc_pdev, mode, &vp);
1165 1.103 mlelstv }
1166 1.87 mlelstv if (error)
1167 1.1 thorpej goto popen_fail;
1168 1.1 thorpej sc->sc_parent->dk_rawvp = vp;
1169 1.104 mlelstv } else {
1170 1.104 mlelstv /*
1171 1.104 mlelstv * Retrieve mode from an already opened wedge.
1172 1.104 mlelstv */
1173 1.104 mlelstv mode = 0;
1174 1.104 mlelstv LIST_FOREACH(nsc, &sc->sc_parent->dk_wedges, sc_plink) {
1175 1.104 mlelstv if (nsc == sc || nsc->sc_dk.dk_openmask == 0)
1176 1.104 mlelstv continue;
1177 1.104 mlelstv mode = nsc->sc_mode;
1178 1.104 mlelstv break;
1179 1.104 mlelstv }
1180 1.1 thorpej }
1181 1.104 mlelstv sc->sc_mode = mode;
1182 1.24 christos sc->sc_parent->dk_rawopens++;
1183 1.104 mlelstv }
1184 1.104 mlelstv KASSERT(sc->sc_mode != 0);
1185 1.104 mlelstv if (flags & ~sc->sc_mode & FWRITE) {
1186 1.103 mlelstv error = EROFS;
1187 1.103 mlelstv goto popen_fail;
1188 1.1 thorpej }
1189 1.17 dbj if (fmt == S_IFCHR)
1190 1.17 dbj sc->sc_dk.dk_copenmask |= 1;
1191 1.17 dbj else
1192 1.17 dbj sc->sc_dk.dk_bopenmask |= 1;
1193 1.17 dbj sc->sc_dk.dk_openmask =
1194 1.17 dbj sc->sc_dk.dk_copenmask | sc->sc_dk.dk_bopenmask;
1195 1.1 thorpej
1196 1.1 thorpej popen_fail:
1197 1.27 ad mutex_exit(&sc->sc_parent->dk_rawlock);
1198 1.27 ad mutex_exit(&sc->sc_dk.dk_openlock);
1199 1.1 thorpej return (error);
1200 1.1 thorpej }
1201 1.1 thorpej
1202 1.46 dyoung static int
1203 1.46 dyoung dklastclose(struct dkwedge_softc *sc)
1204 1.46 dyoung {
1205 1.98 yamaguch struct vnode *vp;
1206 1.104 mlelstv int error = 0, mode;
1207 1.104 mlelstv
1208 1.117 riastrad KASSERT(mutex_owned(&sc->sc_dk.dk_openlock));
1209 1.117 riastrad KASSERT(mutex_owned(&sc->sc_parent->dk_rawlock));
1210 1.117 riastrad
1211 1.104 mlelstv mode = sc->sc_mode;
1212 1.74 mlelstv
1213 1.98 yamaguch vp = NULL;
1214 1.74 mlelstv if (sc->sc_parent->dk_rawopens > 0) {
1215 1.98 yamaguch if (--sc->sc_parent->dk_rawopens == 0) {
1216 1.98 yamaguch KASSERT(sc->sc_parent->dk_rawvp != NULL);
1217 1.98 yamaguch vp = sc->sc_parent->dk_rawvp;
1218 1.98 yamaguch sc->sc_parent->dk_rawvp = NULL;
1219 1.105 mlelstv sc->sc_mode = 0;
1220 1.98 yamaguch }
1221 1.74 mlelstv }
1222 1.74 mlelstv
1223 1.98 yamaguch if (vp) {
1224 1.104 mlelstv dk_close_parent(vp, mode);
1225 1.74 mlelstv }
1226 1.74 mlelstv
1227 1.46 dyoung return error;
1228 1.46 dyoung }
1229 1.46 dyoung
1230 1.46 dyoung /*
1231 1.1 thorpej * dkclose: [devsw entry point]
1232 1.1 thorpej *
1233 1.1 thorpej * Close a wedge.
1234 1.1 thorpej */
1235 1.1 thorpej static int
1236 1.20 christos dkclose(dev_t dev, int flags, int fmt, struct lwp *l)
1237 1.1 thorpej {
1238 1.1 thorpej struct dkwedge_softc *sc = dkwedge_lookup(dev);
1239 1.1 thorpej int error = 0;
1240 1.1 thorpej
1241 1.59 christos if (sc == NULL)
1242 1.59 christos return (ENODEV);
1243 1.59 christos if (sc->sc_state != DKW_STATE_RUNNING)
1244 1.59 christos return (ENXIO);
1245 1.59 christos
1246 1.3 thorpej KASSERT(sc->sc_dk.dk_openmask != 0);
1247 1.1 thorpej
1248 1.27 ad mutex_enter(&sc->sc_dk.dk_openlock);
1249 1.1 thorpej
1250 1.3 thorpej if (fmt == S_IFCHR)
1251 1.3 thorpej sc->sc_dk.dk_copenmask &= ~1;
1252 1.3 thorpej else
1253 1.3 thorpej sc->sc_dk.dk_bopenmask &= ~1;
1254 1.3 thorpej sc->sc_dk.dk_openmask =
1255 1.3 thorpej sc->sc_dk.dk_copenmask | sc->sc_dk.dk_bopenmask;
1256 1.3 thorpej
1257 1.104 mlelstv if (sc->sc_dk.dk_openmask == 0) {
1258 1.116 riastrad mutex_enter(&sc->sc_parent->dk_rawlock);
1259 1.114 riastrad error = dklastclose(sc);
1260 1.116 riastrad mutex_exit(&sc->sc_parent->dk_rawlock);
1261 1.90 mlelstv }
1262 1.1 thorpej
1263 1.115 riastrad mutex_exit(&sc->sc_dk.dk_openlock);
1264 1.115 riastrad
1265 1.1 thorpej return (error);
1266 1.1 thorpej }
1267 1.1 thorpej
1268 1.1 thorpej /*
1269 1.1 thorpej * dkstragegy: [devsw entry point]
1270 1.1 thorpej *
1271 1.1 thorpej * Perform I/O based on the wedge I/O strategy.
1272 1.1 thorpej */
1273 1.1 thorpej static void
1274 1.1 thorpej dkstrategy(struct buf *bp)
1275 1.1 thorpej {
1276 1.1 thorpej struct dkwedge_softc *sc = dkwedge_lookup(bp->b_dev);
1277 1.54 mlelstv uint64_t p_size, p_offset;
1278 1.1 thorpej
1279 1.59 christos if (sc == NULL) {
1280 1.59 christos bp->b_error = ENODEV;
1281 1.59 christos goto done;
1282 1.59 christos }
1283 1.60 christos
1284 1.60 christos if (sc->sc_state != DKW_STATE_RUNNING ||
1285 1.60 christos sc->sc_parent->dk_rawvp == NULL) {
1286 1.1 thorpej bp->b_error = ENXIO;
1287 1.1 thorpej goto done;
1288 1.1 thorpej }
1289 1.1 thorpej
1290 1.1 thorpej /* If it's an empty transfer, wake up the top half now. */
1291 1.1 thorpej if (bp->b_bcount == 0)
1292 1.1 thorpej goto done;
1293 1.1 thorpej
1294 1.54 mlelstv p_offset = sc->sc_offset << sc->sc_parent->dk_blkshift;
1295 1.54 mlelstv p_size = sc->sc_size << sc->sc_parent->dk_blkshift;
1296 1.54 mlelstv
1297 1.1 thorpej /* Make sure it's in-range. */
1298 1.54 mlelstv if (bounds_check_with_mediasize(bp, DEV_BSIZE, p_size) <= 0)
1299 1.1 thorpej goto done;
1300 1.1 thorpej
1301 1.1 thorpej /* Translate it to the parent's raw LBA. */
1302 1.54 mlelstv bp->b_rawblkno = bp->b_blkno + p_offset;
1303 1.1 thorpej
1304 1.1 thorpej /* Place it in the queue and start I/O on the unit. */
1305 1.92 mlelstv mutex_enter(&sc->sc_iolock);
1306 1.1 thorpej sc->sc_iopend++;
1307 1.96 mlelstv disk_wait(&sc->sc_dk);
1308 1.43 yamt bufq_put(sc->sc_bufq, bp);
1309 1.92 mlelstv mutex_exit(&sc->sc_iolock);
1310 1.92 mlelstv
1311 1.1 thorpej dkstart(sc);
1312 1.1 thorpej return;
1313 1.1 thorpej
1314 1.1 thorpej done:
1315 1.1 thorpej bp->b_resid = bp->b_bcount;
1316 1.1 thorpej biodone(bp);
1317 1.1 thorpej }
1318 1.1 thorpej
1319 1.1 thorpej /*
1320 1.1 thorpej * dkstart:
1321 1.1 thorpej *
1322 1.1 thorpej * Start I/O that has been enqueued on the wedge.
1323 1.1 thorpej */
1324 1.1 thorpej static void
1325 1.1 thorpej dkstart(struct dkwedge_softc *sc)
1326 1.1 thorpej {
1327 1.32 ad struct vnode *vp;
1328 1.1 thorpej struct buf *bp, *nbp;
1329 1.1 thorpej
1330 1.92 mlelstv mutex_enter(&sc->sc_iolock);
1331 1.92 mlelstv
1332 1.1 thorpej /* Do as much work as has been enqueued. */
1333 1.43 yamt while ((bp = bufq_peek(sc->sc_bufq)) != NULL) {
1334 1.1 thorpej if (sc->sc_state != DKW_STATE_RUNNING) {
1335 1.43 yamt (void) bufq_get(sc->sc_bufq);
1336 1.110 riastrad if (--sc->sc_iopend == 0)
1337 1.92 mlelstv cv_broadcast(&sc->sc_dkdrn);
1338 1.92 mlelstv mutex_exit(&sc->sc_iolock);
1339 1.1 thorpej bp->b_error = ENXIO;
1340 1.1 thorpej bp->b_resid = bp->b_bcount;
1341 1.1 thorpej biodone(bp);
1342 1.92 mlelstv mutex_enter(&sc->sc_iolock);
1343 1.92 mlelstv continue;
1344 1.1 thorpej }
1345 1.1 thorpej
1346 1.92 mlelstv /* fetch an I/O buf with sc_iolock dropped */
1347 1.92 mlelstv mutex_exit(&sc->sc_iolock);
1348 1.32 ad nbp = getiobuf(sc->sc_parent->dk_rawvp, false);
1349 1.92 mlelstv mutex_enter(&sc->sc_iolock);
1350 1.1 thorpej if (nbp == NULL) {
1351 1.1 thorpej /*
1352 1.1 thorpej * No resources to run this request; leave the
1353 1.1 thorpej * buffer queued up, and schedule a timer to
1354 1.1 thorpej * restart the queue in 1/2 a second.
1355 1.1 thorpej */
1356 1.1 thorpej callout_schedule(&sc->sc_restart_ch, hz / 2);
1357 1.92 mlelstv break;
1358 1.92 mlelstv }
1359 1.92 mlelstv
1360 1.92 mlelstv /*
1361 1.92 mlelstv * fetch buf, this can fail if another thread
1362 1.92 mlelstv * has already processed the queue, it can also
1363 1.92 mlelstv * return a completely different buf.
1364 1.92 mlelstv */
1365 1.92 mlelstv bp = bufq_get(sc->sc_bufq);
1366 1.92 mlelstv if (bp == NULL) {
1367 1.92 mlelstv mutex_exit(&sc->sc_iolock);
1368 1.92 mlelstv putiobuf(nbp);
1369 1.92 mlelstv mutex_enter(&sc->sc_iolock);
1370 1.92 mlelstv continue;
1371 1.1 thorpej }
1372 1.1 thorpej
1373 1.92 mlelstv /* Instrumentation. */
1374 1.92 mlelstv disk_busy(&sc->sc_dk);
1375 1.92 mlelstv
1376 1.92 mlelstv /* release lock for VOP_STRATEGY */
1377 1.92 mlelstv mutex_exit(&sc->sc_iolock);
1378 1.1 thorpej
1379 1.1 thorpej nbp->b_data = bp->b_data;
1380 1.32 ad nbp->b_flags = bp->b_flags;
1381 1.32 ad nbp->b_oflags = bp->b_oflags;
1382 1.32 ad nbp->b_cflags = bp->b_cflags;
1383 1.1 thorpej nbp->b_iodone = dkiodone;
1384 1.1 thorpej nbp->b_proc = bp->b_proc;
1385 1.1 thorpej nbp->b_blkno = bp->b_rawblkno;
1386 1.1 thorpej nbp->b_dev = sc->sc_parent->dk_rawvp->v_rdev;
1387 1.1 thorpej nbp->b_bcount = bp->b_bcount;
1388 1.1 thorpej nbp->b_private = bp;
1389 1.1 thorpej BIO_COPYPRIO(nbp, bp);
1390 1.1 thorpej
1391 1.32 ad vp = nbp->b_vp;
1392 1.32 ad if ((nbp->b_flags & B_READ) == 0) {
1393 1.61 rmind mutex_enter(vp->v_interlock);
1394 1.32 ad vp->v_numoutput++;
1395 1.61 rmind mutex_exit(vp->v_interlock);
1396 1.32 ad }
1397 1.32 ad VOP_STRATEGY(vp, nbp);
1398 1.92 mlelstv
1399 1.92 mlelstv mutex_enter(&sc->sc_iolock);
1400 1.1 thorpej }
1401 1.92 mlelstv
1402 1.92 mlelstv mutex_exit(&sc->sc_iolock);
1403 1.1 thorpej }
1404 1.1 thorpej
1405 1.1 thorpej /*
1406 1.1 thorpej * dkiodone:
1407 1.1 thorpej *
1408 1.1 thorpej * I/O to a wedge has completed; alert the top half.
1409 1.1 thorpej */
1410 1.1 thorpej static void
1411 1.1 thorpej dkiodone(struct buf *bp)
1412 1.1 thorpej {
1413 1.1 thorpej struct buf *obp = bp->b_private;
1414 1.1 thorpej struct dkwedge_softc *sc = dkwedge_lookup(obp->b_dev);
1415 1.1 thorpej
1416 1.28 ad if (bp->b_error != 0)
1417 1.1 thorpej obp->b_error = bp->b_error;
1418 1.1 thorpej obp->b_resid = bp->b_resid;
1419 1.11 yamt putiobuf(bp);
1420 1.1 thorpej
1421 1.92 mlelstv mutex_enter(&sc->sc_iolock);
1422 1.110 riastrad if (--sc->sc_iopend == 0)
1423 1.92 mlelstv cv_broadcast(&sc->sc_dkdrn);
1424 1.1 thorpej
1425 1.1 thorpej disk_unbusy(&sc->sc_dk, obp->b_bcount - obp->b_resid,
1426 1.1 thorpej obp->b_flags & B_READ);
1427 1.92 mlelstv mutex_exit(&sc->sc_iolock);
1428 1.1 thorpej
1429 1.1 thorpej biodone(obp);
1430 1.1 thorpej
1431 1.1 thorpej /* Kick the queue in case there is more work we can do. */
1432 1.1 thorpej dkstart(sc);
1433 1.1 thorpej }
1434 1.1 thorpej
/*
 * dkrestart:
 *
 *	Callout handler that restarts the work queue after dkstart()
 *	stalled on a resource shortage.  v is the wedge's softc.
 */
static void
dkrestart(void *v)
{

	dkstart((struct dkwedge_softc *)v);
}
1448 1.1 thorpej
1449 1.1 thorpej /*
1450 1.52 jakllsch * dkminphys:
1451 1.52 jakllsch *
1452 1.52 jakllsch * Call parent's minphys function.
1453 1.52 jakllsch */
1454 1.52 jakllsch static void
1455 1.52 jakllsch dkminphys(struct buf *bp)
1456 1.52 jakllsch {
1457 1.52 jakllsch struct dkwedge_softc *sc = dkwedge_lookup(bp->b_dev);
1458 1.52 jakllsch dev_t dev;
1459 1.52 jakllsch
1460 1.52 jakllsch dev = bp->b_dev;
1461 1.52 jakllsch bp->b_dev = sc->sc_pdev;
1462 1.102 mlelstv if (sc->sc_parent->dk_driver && sc->sc_parent->dk_driver->d_minphys)
1463 1.102 mlelstv (*sc->sc_parent->dk_driver->d_minphys)(bp);
1464 1.102 mlelstv else
1465 1.102 mlelstv minphys(bp);
1466 1.52 jakllsch bp->b_dev = dev;
1467 1.52 jakllsch }
1468 1.52 jakllsch
1469 1.52 jakllsch /*
1470 1.1 thorpej * dkread: [devsw entry point]
1471 1.1 thorpej *
1472 1.1 thorpej * Read from a wedge.
1473 1.1 thorpej */
1474 1.1 thorpej static int
1475 1.20 christos dkread(dev_t dev, struct uio *uio, int flags)
1476 1.1 thorpej {
1477 1.1 thorpej struct dkwedge_softc *sc = dkwedge_lookup(dev);
1478 1.1 thorpej
1479 1.59 christos if (sc == NULL)
1480 1.59 christos return (ENODEV);
1481 1.1 thorpej if (sc->sc_state != DKW_STATE_RUNNING)
1482 1.1 thorpej return (ENXIO);
1483 1.6 perry
1484 1.52 jakllsch return (physio(dkstrategy, NULL, dev, B_READ, dkminphys, uio));
1485 1.1 thorpej }
1486 1.1 thorpej
1487 1.1 thorpej /*
1488 1.1 thorpej * dkwrite: [devsw entry point]
1489 1.1 thorpej *
1490 1.1 thorpej * Write to a wedge.
1491 1.1 thorpej */
1492 1.1 thorpej static int
1493 1.20 christos dkwrite(dev_t dev, struct uio *uio, int flags)
1494 1.1 thorpej {
1495 1.1 thorpej struct dkwedge_softc *sc = dkwedge_lookup(dev);
1496 1.1 thorpej
1497 1.59 christos if (sc == NULL)
1498 1.59 christos return (ENODEV);
1499 1.1 thorpej if (sc->sc_state != DKW_STATE_RUNNING)
1500 1.1 thorpej return (ENXIO);
1501 1.6 perry
1502 1.52 jakllsch return (physio(dkstrategy, NULL, dev, B_WRITE, dkminphys, uio));
1503 1.1 thorpej }
1504 1.1 thorpej
1505 1.1 thorpej /*
1506 1.1 thorpej * dkioctl: [devsw entry point]
1507 1.1 thorpej *
1508 1.1 thorpej * Perform an ioctl request on a wedge.
1509 1.1 thorpej */
1510 1.1 thorpej static int
1511 1.22 christos dkioctl(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
1512 1.1 thorpej {
1513 1.1 thorpej struct dkwedge_softc *sc = dkwedge_lookup(dev);
1514 1.1 thorpej int error = 0;
1515 1.1 thorpej
1516 1.59 christos if (sc == NULL)
1517 1.59 christos return (ENODEV);
1518 1.1 thorpej if (sc->sc_state != DKW_STATE_RUNNING)
1519 1.1 thorpej return (ENXIO);
1520 1.60 christos if (sc->sc_parent->dk_rawvp == NULL)
1521 1.60 christos return (ENXIO);
1522 1.1 thorpej
1523 1.78 christos /*
1524 1.79 christos * We pass NODEV instead of our device to indicate we don't
1525 1.78 christos * want to handle disklabel ioctls
1526 1.78 christos */
1527 1.79 christos error = disk_ioctl(&sc->sc_dk, NODEV, cmd, data, flag, l);
1528 1.48 haad if (error != EPASSTHROUGH)
1529 1.48 haad return (error);
1530 1.48 haad
1531 1.48 haad error = 0;
1532 1.109 simonb
1533 1.1 thorpej switch (cmd) {
1534 1.95 jdolecek case DIOCGSTRATEGY:
1535 1.95 jdolecek case DIOCGCACHE:
1536 1.4 thorpej case DIOCCACHESYNC:
1537 1.95 jdolecek error = VOP_IOCTL(sc->sc_parent->dk_rawvp, cmd, data, flag,
1538 1.30 pooka l != NULL ? l->l_cred : NOCRED);
1539 1.4 thorpej break;
1540 1.1 thorpej case DIOCGWEDGEINFO:
1541 1.1 thorpej {
1542 1.48 haad struct dkwedge_info *dkw = (void *) data;
1543 1.1 thorpej
1544 1.36 cegger strlcpy(dkw->dkw_devname, device_xname(sc->sc_dev),
1545 1.36 cegger sizeof(dkw->dkw_devname));
1546 1.1 thorpej memcpy(dkw->dkw_wname, sc->sc_wname, sizeof(dkw->dkw_wname));
1547 1.1 thorpej dkw->dkw_wname[sizeof(dkw->dkw_wname) - 1] = '\0';
1548 1.94 maya strlcpy(dkw->dkw_parent, sc->sc_parent->dk_name,
1549 1.94 maya sizeof(dkw->dkw_parent));
1550 1.1 thorpej dkw->dkw_offset = sc->sc_offset;
1551 1.1 thorpej dkw->dkw_size = sc->sc_size;
1552 1.94 maya strlcpy(dkw->dkw_ptype, sc->sc_ptype, sizeof(dkw->dkw_ptype));
1553 1.1 thorpej
1554 1.1 thorpej break;
1555 1.1 thorpej }
1556 1.100 riastrad case DIOCGSECTORALIGN:
1557 1.100 riastrad {
1558 1.100 riastrad struct disk_sectoralign *dsa = data;
1559 1.100 riastrad uint32_t r;
1560 1.100 riastrad
1561 1.100 riastrad error = VOP_IOCTL(sc->sc_parent->dk_rawvp, cmd, dsa, flag,
1562 1.100 riastrad l != NULL ? l->l_cred : NOCRED);
1563 1.100 riastrad if (error)
1564 1.100 riastrad break;
1565 1.1 thorpej
1566 1.100 riastrad r = sc->sc_offset % dsa->dsa_alignment;
1567 1.100 riastrad if (r < dsa->dsa_firstaligned)
1568 1.100 riastrad dsa->dsa_firstaligned = dsa->dsa_firstaligned - r;
1569 1.100 riastrad else
1570 1.100 riastrad dsa->dsa_firstaligned = (dsa->dsa_firstaligned +
1571 1.100 riastrad dsa->dsa_alignment) - r;
1572 1.100 riastrad break;
1573 1.100 riastrad }
1574 1.1 thorpej default:
1575 1.1 thorpej error = ENOTTY;
1576 1.1 thorpej }
1577 1.1 thorpej
1578 1.1 thorpej return (error);
1579 1.1 thorpej }
1580 1.1 thorpej
1581 1.1 thorpej /*
1582 1.72 dholland * dkdiscard: [devsw entry point]
1583 1.72 dholland *
1584 1.72 dholland * Perform a discard-range request on a wedge.
1585 1.72 dholland */
1586 1.72 dholland static int
1587 1.72 dholland dkdiscard(dev_t dev, off_t pos, off_t len)
1588 1.72 dholland {
1589 1.72 dholland struct dkwedge_softc *sc = dkwedge_lookup(dev);
1590 1.73 riastrad unsigned shift;
1591 1.73 riastrad off_t offset, maxlen;
1592 1.111 hannken int error;
1593 1.72 dholland
1594 1.72 dholland if (sc == NULL)
1595 1.72 dholland return (ENODEV);
1596 1.72 dholland if (sc->sc_state != DKW_STATE_RUNNING)
1597 1.72 dholland return (ENXIO);
1598 1.72 dholland if (sc->sc_parent->dk_rawvp == NULL)
1599 1.72 dholland return (ENXIO);
1600 1.72 dholland
1601 1.73 riastrad shift = (sc->sc_parent->dk_blkshift + DEV_BSHIFT);
1602 1.73 riastrad KASSERT(__type_fit(off_t, sc->sc_size));
1603 1.73 riastrad KASSERT(__type_fit(off_t, sc->sc_offset));
1604 1.73 riastrad KASSERT(0 <= sc->sc_offset);
1605 1.73 riastrad KASSERT(sc->sc_size <= (__type_max(off_t) >> shift));
1606 1.73 riastrad KASSERT(sc->sc_offset <= ((__type_max(off_t) >> shift) - sc->sc_size));
1607 1.73 riastrad offset = ((off_t)sc->sc_offset << shift);
1608 1.73 riastrad maxlen = ((off_t)sc->sc_size << shift);
1609 1.73 riastrad
1610 1.73 riastrad if (len > maxlen)
1611 1.73 riastrad return (EINVAL);
1612 1.73 riastrad if (pos > (maxlen - len))
1613 1.73 riastrad return (EINVAL);
1614 1.73 riastrad
1615 1.73 riastrad pos += offset;
1616 1.111 hannken
1617 1.111 hannken vn_lock(sc->sc_parent->dk_rawvp, LK_EXCLUSIVE | LK_RETRY);
1618 1.111 hannken error = VOP_FDISCARD(sc->sc_parent->dk_rawvp, pos, len);
1619 1.111 hannken VOP_UNLOCK(sc->sc_parent->dk_rawvp);
1620 1.111 hannken
1621 1.111 hannken return error;
1622 1.72 dholland }
1623 1.72 dholland
1624 1.72 dholland /*
1625 1.1 thorpej * dksize: [devsw entry point]
1626 1.1 thorpej *
1627 1.1 thorpej * Query the size of a wedge for the purpose of performing a dump
1628 1.1 thorpej * or for swapping to.
1629 1.1 thorpej */
1630 1.1 thorpej static int
1631 1.1 thorpej dksize(dev_t dev)
1632 1.1 thorpej {
1633 1.13 thorpej struct dkwedge_softc *sc = dkwedge_lookup(dev);
1634 1.106 mlelstv uint64_t p_size;
1635 1.13 thorpej int rv = -1;
1636 1.13 thorpej
1637 1.13 thorpej if (sc == NULL)
1638 1.13 thorpej return (-1);
1639 1.13 thorpej if (sc->sc_state != DKW_STATE_RUNNING)
1640 1.55 mlelstv return (-1);
1641 1.13 thorpej
1642 1.27 ad mutex_enter(&sc->sc_dk.dk_openlock);
1643 1.27 ad mutex_enter(&sc->sc_parent->dk_rawlock);
1644 1.1 thorpej
1645 1.13 thorpej /* Our content type is static, no need to open the device. */
1646 1.13 thorpej
1647 1.106 mlelstv p_size = sc->sc_size << sc->sc_parent->dk_blkshift;
1648 1.13 thorpej if (strcmp(sc->sc_ptype, DKW_PTYPE_SWAP) == 0) {
1649 1.13 thorpej /* Saturate if we are larger than INT_MAX. */
1650 1.106 mlelstv if (p_size > INT_MAX)
1651 1.13 thorpej rv = INT_MAX;
1652 1.13 thorpej else
1653 1.106 mlelstv rv = (int) p_size;
1654 1.13 thorpej }
1655 1.13 thorpej
1656 1.27 ad mutex_exit(&sc->sc_parent->dk_rawlock);
1657 1.27 ad mutex_exit(&sc->sc_dk.dk_openlock);
1658 1.13 thorpej
1659 1.13 thorpej return (rv);
1660 1.1 thorpej }
1661 1.1 thorpej
1662 1.1 thorpej /*
1663 1.1 thorpej * dkdump: [devsw entry point]
1664 1.1 thorpej *
1665 1.1 thorpej * Perform a crash dump to a wedge.
1666 1.1 thorpej */
1667 1.1 thorpej static int
1668 1.23 dyoung dkdump(dev_t dev, daddr_t blkno, void *va, size_t size)
1669 1.1 thorpej {
1670 1.23 dyoung struct dkwedge_softc *sc = dkwedge_lookup(dev);
1671 1.23 dyoung const struct bdevsw *bdev;
1672 1.106 mlelstv uint64_t p_size, p_offset;
1673 1.23 dyoung int rv = 0;
1674 1.23 dyoung
1675 1.23 dyoung if (sc == NULL)
1676 1.59 christos return (ENODEV);
1677 1.23 dyoung if (sc->sc_state != DKW_STATE_RUNNING)
1678 1.23 dyoung return (ENXIO);
1679 1.23 dyoung
1680 1.27 ad mutex_enter(&sc->sc_dk.dk_openlock);
1681 1.27 ad mutex_enter(&sc->sc_parent->dk_rawlock);
1682 1.23 dyoung
1683 1.23 dyoung /* Our content type is static, no need to open the device. */
1684 1.23 dyoung
1685 1.88 mlelstv if (strcmp(sc->sc_ptype, DKW_PTYPE_SWAP) != 0 &&
1686 1.99 riastrad strcmp(sc->sc_ptype, DKW_PTYPE_RAID) != 0 &&
1687 1.99 riastrad strcmp(sc->sc_ptype, DKW_PTYPE_CGD) != 0) {
1688 1.23 dyoung rv = ENXIO;
1689 1.23 dyoung goto out;
1690 1.23 dyoung }
1691 1.23 dyoung if (size % DEV_BSIZE != 0) {
1692 1.23 dyoung rv = EINVAL;
1693 1.23 dyoung goto out;
1694 1.23 dyoung }
1695 1.106 mlelstv
1696 1.106 mlelstv p_offset = sc->sc_offset << sc->sc_parent->dk_blkshift;
1697 1.106 mlelstv p_size = sc->sc_size << sc->sc_parent->dk_blkshift;
1698 1.106 mlelstv
1699 1.106 mlelstv if (blkno < 0 || blkno + size / DEV_BSIZE > p_size) {
1700 1.23 dyoung printf("%s: blkno (%" PRIu64 ") + size / DEV_BSIZE (%zu) > "
1701 1.106 mlelstv "p_size (%" PRIu64 ")\n", __func__, blkno,
1702 1.106 mlelstv size / DEV_BSIZE, p_size);
1703 1.23 dyoung rv = EINVAL;
1704 1.23 dyoung goto out;
1705 1.23 dyoung }
1706 1.23 dyoung
1707 1.23 dyoung bdev = bdevsw_lookup(sc->sc_pdev);
1708 1.106 mlelstv rv = (*bdev->d_dump)(sc->sc_pdev, blkno + p_offset, va, size);
1709 1.23 dyoung
1710 1.23 dyoung out:
1711 1.27 ad mutex_exit(&sc->sc_parent->dk_rawlock);
1712 1.27 ad mutex_exit(&sc->sc_dk.dk_openlock);
1713 1.1 thorpej
1714 1.23 dyoung return rv;
1715 1.1 thorpej }
1716 1.49 pooka
1717 1.49 pooka /*
1718 1.49 pooka * config glue
1719 1.49 pooka */
1720 1.49 pooka
1721 1.64 mlelstv /*
1722 1.64 mlelstv * dkwedge_find_partition
1723 1.64 mlelstv *
1724 1.64 mlelstv * Find wedge corresponding to the specified parent name
1725 1.64 mlelstv * and offset/length.
1726 1.64 mlelstv */
1727 1.64 mlelstv device_t
1728 1.64 mlelstv dkwedge_find_partition(device_t parent, daddr_t startblk, uint64_t nblks)
1729 1.49 pooka {
1730 1.64 mlelstv struct dkwedge_softc *sc;
1731 1.64 mlelstv int i;
1732 1.64 mlelstv device_t wedge = NULL;
1733 1.49 pooka
1734 1.64 mlelstv rw_enter(&dkwedges_lock, RW_READER);
1735 1.64 mlelstv for (i = 0; i < ndkwedges; i++) {
1736 1.64 mlelstv if ((sc = dkwedges[i]) == NULL)
1737 1.64 mlelstv continue;
1738 1.64 mlelstv if (strcmp(sc->sc_parent->dk_name, device_xname(parent)) == 0 &&
1739 1.64 mlelstv sc->sc_offset == startblk &&
1740 1.64 mlelstv sc->sc_size == nblks) {
1741 1.64 mlelstv if (wedge) {
1742 1.64 mlelstv printf("WARNING: double match for boot wedge "
1743 1.64 mlelstv "(%s, %s)\n",
1744 1.64 mlelstv device_xname(wedge),
1745 1.64 mlelstv device_xname(sc->sc_dev));
1746 1.64 mlelstv continue;
1747 1.64 mlelstv }
1748 1.64 mlelstv wedge = sc->sc_dev;
1749 1.64 mlelstv }
1750 1.49 pooka }
1751 1.64 mlelstv rw_exit(&dkwedges_lock);
1752 1.49 pooka
1753 1.64 mlelstv return wedge;
1754 1.64 mlelstv }
1755 1.49 pooka
1756 1.69 christos const char *
1757 1.69 christos dkwedge_get_parent_name(dev_t dev)
1758 1.69 christos {
1759 1.69 christos /* XXX: perhaps do this in lookup? */
1760 1.69 christos int bmaj = bdevsw_lookup_major(&dk_bdevsw);
1761 1.69 christos int cmaj = cdevsw_lookup_major(&dk_cdevsw);
1762 1.69 christos if (major(dev) != bmaj && major(dev) != cmaj)
1763 1.69 christos return NULL;
1764 1.69 christos struct dkwedge_softc *sc = dkwedge_lookup(dev);
1765 1.69 christos if (sc == NULL)
1766 1.69 christos return NULL;
1767 1.69 christos return sc->sc_parent->dk_name;
1768 1.69 christos }
1769