ccd.c revision 1.150 1 1.150 dholland /* $NetBSD: ccd.c,v 1.150 2014/07/25 08:02:19 dholland Exp $ */
2 1.11 thorpej
3 1.28 thorpej /*-
4 1.133 ad * Copyright (c) 1996, 1997, 1998, 1999, 2007, 2009 The NetBSD Foundation, Inc.
5 1.11 thorpej * All rights reserved.
6 1.11 thorpej *
7 1.28 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.133 ad * by Jason R. Thorpe, and by Andrew Doran.
9 1.28 thorpej *
10 1.11 thorpej * Redistribution and use in source and binary forms, with or without
11 1.11 thorpej * modification, are permitted provided that the following conditions
12 1.11 thorpej * are met:
13 1.11 thorpej * 1. Redistributions of source code must retain the above copyright
14 1.11 thorpej * notice, this list of conditions and the following disclaimer.
15 1.11 thorpej * 2. Redistributions in binary form must reproduce the above copyright
16 1.11 thorpej * notice, this list of conditions and the following disclaimer in the
17 1.11 thorpej * documentation and/or other materials provided with the distribution.
18 1.11 thorpej *
19 1.28 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.28 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.28 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.45 jtc * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.45 jtc * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.28 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.28 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.28 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.28 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.28 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.28 thorpej * POSSIBILITY OF SUCH DAMAGE.
30 1.11 thorpej */
31 1.2 cgd
32 1.1 hpeyerl /*
33 1.138 rmind * Copyright (c) 1988 University of Utah.
34 1.3 hpeyerl * Copyright (c) 1990, 1993
35 1.3 hpeyerl * The Regents of the University of California. All rights reserved.
36 1.1 hpeyerl *
37 1.1 hpeyerl * This code is derived from software contributed to Berkeley by
38 1.1 hpeyerl * the Systems Programming Group of the University of Utah Computer
39 1.1 hpeyerl * Science Department.
40 1.1 hpeyerl *
41 1.1 hpeyerl * Redistribution and use in source and binary forms, with or without
42 1.1 hpeyerl * modification, are permitted provided that the following conditions
43 1.1 hpeyerl * are met:
44 1.1 hpeyerl * 1. Redistributions of source code must retain the above copyright
45 1.1 hpeyerl * notice, this list of conditions and the following disclaimer.
46 1.1 hpeyerl * 2. Redistributions in binary form must reproduce the above copyright
47 1.1 hpeyerl * notice, this list of conditions and the following disclaimer in the
48 1.1 hpeyerl * documentation and/or other materials provided with the distribution.
49 1.91 agc * 3. Neither the name of the University nor the names of its contributors
50 1.91 agc * may be used to endorse or promote products derived from this software
51 1.91 agc * without specific prior written permission.
52 1.91 agc *
53 1.91 agc * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
54 1.91 agc * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
55 1.91 agc * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
56 1.91 agc * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
57 1.91 agc * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
58 1.91 agc * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
59 1.91 agc * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
60 1.91 agc * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
61 1.91 agc * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
62 1.91 agc * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
63 1.91 agc * SUCH DAMAGE.
64 1.91 agc *
65 1.91 agc * from: Utah $Hdr: cd.c 1.6 90/11/28$
66 1.91 agc *
67 1.91 agc * @(#)cd.c 8.2 (Berkeley) 11/16/93
68 1.91 agc */
69 1.91 agc
70 1.91 agc /*
71 1.1 hpeyerl * "Concatenated" disk driver.
72 1.11 thorpej *
73 1.133 ad * Notes on concurrency:
74 1.133 ad *
75 1.133 ad * => sc_dvlock serializes access to the device nodes, excluding block I/O.
76 1.133 ad *
77 1.133 ad * => sc_iolock serializes access to (sc_flags & CCDF_INITED), disk stats,
78 1.133 ad * sc_stop, sc_bufq and b_resid from master buffers.
79 1.133 ad *
80 1.133 ad * => a combination of CCDF_INITED, sc_inflight, and sc_iolock is used to
81 1.133 ad * serialize I/O and configuration changes.
82 1.133 ad *
83 1.133 ad * => the in-core disk label does not change while the device is open.
84 1.133 ad *
85 1.133 ad * On memory consumption: ccd fans out I/O requests and so needs to
86 1.133 ad * allocate memory. If the system is desperately low on memory, we
87 1.133 ad * single thread I/O.
88 1.1 hpeyerl */
89 1.74 lukem
90 1.74 lukem #include <sys/cdefs.h>
91 1.150 dholland __KERNEL_RCSID(0, "$NetBSD: ccd.c,v 1.150 2014/07/25 08:02:19 dholland Exp $");
92 1.1 hpeyerl
93 1.1 hpeyerl #include <sys/param.h>
94 1.1 hpeyerl #include <sys/systm.h>
95 1.133 ad #include <sys/kernel.h>
96 1.3 hpeyerl #include <sys/proc.h>
97 1.1 hpeyerl #include <sys/errno.h>
98 1.1 hpeyerl #include <sys/buf.h>
99 1.133 ad #include <sys/kmem.h>
100 1.63 thorpej #include <sys/pool.h>
101 1.140 jruoho #include <sys/module.h>
102 1.11 thorpej #include <sys/namei.h>
103 1.3 hpeyerl #include <sys/stat.h>
104 1.3 hpeyerl #include <sys/ioctl.h>
105 1.3 hpeyerl #include <sys/disklabel.h>
106 1.11 thorpej #include <sys/device.h>
107 1.11 thorpej #include <sys/disk.h>
108 1.11 thorpej #include <sys/syslog.h>
109 1.3 hpeyerl #include <sys/fcntl.h>
110 1.11 thorpej #include <sys/vnode.h>
111 1.31 christos #include <sys/conf.h>
112 1.117 ad #include <sys/mutex.h>
113 1.56 thorpej #include <sys/queue.h>
114 1.110 elad #include <sys/kauth.h>
115 1.133 ad #include <sys/kthread.h>
116 1.133 ad #include <sys/bufq.h>
117 1.144 christos #include <sys/sysctl.h>
118 1.1 hpeyerl
119 1.135 uebayasi #include <uvm/uvm_extern.h>
120 1.135 uebayasi
121 1.1 hpeyerl #include <dev/ccdvar.h>
122 1.113 christos #include <dev/dkvar.h>
123 1.1 hpeyerl
124 1.149 hannken #include <miscfs/specfs/specdev.h> /* for v_rdev */
125 1.149 hannken
/* Building with CCDDEBUG turns on the DEBUG-only code in this file. */
#if defined(CCDDEBUG) && !defined(DEBUG)
#define	DEBUG
#endif

#ifdef DEBUG
/*
 * Bits tested against ccddebug to enable groups of diagnostic printf()s.
 */
#define	CCDB_FOLLOW	0x01	/* function entry/progress traces */
#define	CCDB_INIT	0x02	/* ccdinit() and ccdinterleave() */
#define	CCDB_IO		0x04	/* component buffer construction */
#define	CCDB_LABEL	0x08
#define	CCDB_VNODE	0x10
int ccddebug = 0x00;		/* nothing enabled by default */
#endif

/* The ccd unit number encoded in a dev_t. */
#define	ccdunit(x)	DISKUNIT(x)
140 1.6 cgd
141 1.6 cgd struct ccdbuf {
142 1.6 cgd struct buf cb_buf; /* new I/O buf */
143 1.6 cgd struct buf *cb_obp; /* ptr. to original I/O buf */
144 1.59 thorpej struct ccd_softc *cb_sc; /* pointer to ccd softc */
145 1.6 cgd int cb_comp; /* target component */
146 1.56 thorpej SIMPLEQ_ENTRY(ccdbuf) cb_q; /* fifo of component buffers */
147 1.38 thorpej };
148 1.24 thorpej
149 1.63 thorpej /* component buffer pool */
150 1.133 ad static pool_cache_t ccd_cache;
151 1.63 thorpej
152 1.133 ad #define CCD_GETBUF() pool_cache_get(ccd_cache, PR_WAITOK)
153 1.133 ad #define CCD_PUTBUF(cbp) pool_cache_put(ccd_cache, cbp)
154 1.1 hpeyerl
155 1.11 thorpej #define CCDLABELDEV(dev) \
156 1.11 thorpej (MAKEDISKDEV(major((dev)), ccdunit((dev)), RAW_PART))
157 1.1 hpeyerl
158 1.11 thorpej /* called by main() at boot time */
159 1.97 thorpej void ccdattach(int);
160 1.11 thorpej
161 1.11 thorpej /* called by biodone() at interrupt time */
162 1.97 thorpej static void ccdiodone(struct buf *);
163 1.11 thorpej
164 1.97 thorpej static void ccdinterleave(struct ccd_softc *);
165 1.97 thorpej static int ccdinit(struct ccd_softc *, char **, struct vnode **,
166 1.107 christos struct lwp *);
167 1.97 thorpej static struct ccdbuf *ccdbuffer(struct ccd_softc *, struct buf *,
168 1.118 christos daddr_t, void *, long);
169 1.97 thorpej static void ccdgetdefaultlabel(struct ccd_softc *, struct disklabel *);
170 1.97 thorpej static void ccdgetdisklabel(dev_t);
171 1.97 thorpej static void ccdmakedisklabel(struct ccd_softc *);
172 1.133 ad static void ccdstart(struct ccd_softc *);
173 1.133 ad static void ccdthread(void *);
174 1.97 thorpej
175 1.97 thorpej static dev_type_open(ccdopen);
176 1.97 thorpej static dev_type_close(ccdclose);
177 1.97 thorpej static dev_type_read(ccdread);
178 1.97 thorpej static dev_type_write(ccdwrite);
179 1.97 thorpej static dev_type_ioctl(ccdioctl);
180 1.97 thorpej static dev_type_strategy(ccdstrategy);
181 1.97 thorpej static dev_type_size(ccdsize);
182 1.78 gehenna
183 1.78 gehenna const struct bdevsw ccd_bdevsw = {
184 1.133 ad .d_open = ccdopen,
185 1.133 ad .d_close = ccdclose,
186 1.133 ad .d_strategy = ccdstrategy,
187 1.133 ad .d_ioctl = ccdioctl,
188 1.133 ad .d_dump = nodump,
189 1.133 ad .d_psize = ccdsize,
190 1.150 dholland .d_discard = nodiscard,
191 1.133 ad .d_flag = D_DISK | D_MPSAFE
192 1.78 gehenna };
193 1.78 gehenna
194 1.78 gehenna const struct cdevsw ccd_cdevsw = {
195 1.133 ad .d_open = ccdopen,
196 1.133 ad .d_close = ccdclose,
197 1.133 ad .d_read = ccdread,
198 1.133 ad .d_write = ccdwrite,
199 1.133 ad .d_ioctl = ccdioctl,
200 1.133 ad .d_stop = nostop,
201 1.133 ad .d_tty = notty,
202 1.133 ad .d_poll = nopoll,
203 1.133 ad .d_mmap = nommap,
204 1.133 ad .d_kqfilter = nokqfilter,
205 1.133 ad .d_flag = D_DISK | D_MPSAFE
206 1.78 gehenna };
207 1.3 hpeyerl
208 1.11 thorpej #ifdef DEBUG
209 1.97 thorpej static void printiinfo(struct ccdiinfo *);
210 1.11 thorpej #endif
211 1.11 thorpej
212 1.144 christos static LIST_HEAD(, ccd_softc) ccds = LIST_HEAD_INITIALIZER(ccds);
213 1.144 christos static kmutex_t ccd_lock;
214 1.144 christos
215 1.144 christos static struct ccd_softc *
216 1.144 christos ccdcreate(int unit) {
217 1.144 christos struct ccd_softc *sc = kmem_zalloc(sizeof(*sc), KM_SLEEP);
218 1.144 christos if (sc == NULL) {
219 1.144 christos #ifdef DIAGNOSTIC
220 1.144 christos printf("%s: out of memory\n", __func__);
221 1.144 christos #endif
222 1.144 christos return NULL;
223 1.144 christos }
224 1.144 christos /* Initialize per-softc structures. */
225 1.144 christos snprintf(sc->sc_xname, sizeof(sc->sc_xname), "ccd%d", unit);
226 1.144 christos mutex_init(&sc->sc_dvlock, MUTEX_DEFAULT, IPL_NONE);
227 1.144 christos sc->sc_iolock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NONE);
228 1.144 christos cv_init(&sc->sc_stop, "ccdstop");
229 1.144 christos cv_init(&sc->sc_push, "ccdthr");
230 1.144 christos disk_init(&sc->sc_dkdev, sc->sc_xname, NULL); /* XXX */
231 1.144 christos return sc;
232 1.144 christos }
233 1.144 christos
234 1.144 christos static void
235 1.144 christos ccddestroy(struct ccd_softc *sc) {
236 1.144 christos mutex_obj_free(sc->sc_iolock);
237 1.148 joerg mutex_exit(&sc->sc_dvlock);
238 1.144 christos mutex_destroy(&sc->sc_dvlock);
239 1.144 christos cv_destroy(&sc->sc_stop);
240 1.144 christos cv_destroy(&sc->sc_push);
241 1.144 christos disk_destroy(&sc->sc_dkdev);
242 1.144 christos kmem_free(sc, sizeof(*sc));
243 1.144 christos }
244 1.144 christos
245 1.144 christos static struct ccd_softc *
246 1.144 christos ccdget(int unit) {
247 1.144 christos struct ccd_softc *sc;
248 1.144 christos if (unit < 0) {
249 1.144 christos #ifdef DIAGNOSTIC
250 1.144 christos panic("%s: unit %d!", __func__, unit);
251 1.144 christos #endif
252 1.144 christos return NULL;
253 1.144 christos }
254 1.144 christos mutex_enter(&ccd_lock);
255 1.144 christos LIST_FOREACH(sc, &ccds, sc_link) {
256 1.144 christos if (sc->sc_unit == unit) {
257 1.144 christos mutex_exit(&ccd_lock);
258 1.144 christos return sc;
259 1.144 christos }
260 1.144 christos }
261 1.144 christos mutex_exit(&ccd_lock);
262 1.144 christos if ((sc = ccdcreate(unit)) == NULL)
263 1.144 christos return NULL;
264 1.144 christos mutex_enter(&ccd_lock);
265 1.144 christos LIST_INSERT_HEAD(&ccds, sc, sc_link);
266 1.144 christos mutex_exit(&ccd_lock);
267 1.144 christos return sc;
268 1.144 christos }
269 1.144 christos
270 1.144 christos static void
271 1.144 christos ccdput(struct ccd_softc *sc) {
272 1.144 christos mutex_enter(&ccd_lock);
273 1.144 christos LIST_REMOVE(sc, sc_link);
274 1.144 christos mutex_exit(&ccd_lock);
275 1.144 christos ccddestroy(sc);
276 1.144 christos }
277 1.1 hpeyerl
278 1.3 hpeyerl /*
279 1.11 thorpej * Called by main() during pseudo-device attachment. All we need
280 1.11 thorpej * to do is allocate enough space for devices to be configured later.
281 1.1 hpeyerl */
282 1.1 hpeyerl void
283 1.97 thorpej ccdattach(int num)
284 1.3 hpeyerl {
285 1.144 christos mutex_init(&ccd_lock, MUTEX_DEFAULT, IPL_NONE);
286 1.57 thorpej
287 1.63 thorpej /* Initialize the component buffer pool. */
288 1.133 ad ccd_cache = pool_cache_init(sizeof(struct ccdbuf), 0,
289 1.133 ad 0, 0, "ccdbuf", NULL, IPL_BIO, NULL, NULL, NULL);
290 1.1 hpeyerl }
291 1.1 hpeyerl
292 1.11 thorpej static int
293 1.97 thorpej ccdinit(struct ccd_softc *cs, char **cpaths, struct vnode **vpp,
294 1.107 christos struct lwp *l)
295 1.1 hpeyerl {
296 1.68 augustss struct ccdcinfo *ci = NULL;
297 1.68 augustss int ix;
298 1.11 thorpej struct ccdgeom *ccg = &cs->sc_geom;
299 1.111 christos char *tmppath;
300 1.67 enami int error, path_alloced;
301 1.143 christos uint64_t psize, minsize;
302 1.143 christos unsigned secsize, maxsecsize;
303 1.1 hpeyerl
304 1.1 hpeyerl #ifdef DEBUG
305 1.3 hpeyerl if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
306 1.59 thorpej printf("%s: ccdinit\n", cs->sc_xname);
307 1.1 hpeyerl #endif
308 1.11 thorpej
309 1.11 thorpej /* Allocate space for the component info. */
310 1.133 ad cs->sc_cinfo = kmem_alloc(cs->sc_nccdisks * sizeof(*cs->sc_cinfo),
311 1.133 ad KM_SLEEP);
312 1.133 ad tmppath = kmem_alloc(MAXPATHLEN, KM_SLEEP);
313 1.111 christos
314 1.57 thorpej cs->sc_size = 0;
315 1.57 thorpej
316 1.1 hpeyerl /*
317 1.1 hpeyerl * Verify that each component piece exists and record
318 1.1 hpeyerl * relevant information about it.
319 1.1 hpeyerl */
320 1.11 thorpej maxsecsize = 0;
321 1.1 hpeyerl minsize = 0;
322 1.67 enami for (ix = 0, path_alloced = 0; ix < cs->sc_nccdisks; ix++) {
323 1.1 hpeyerl ci = &cs->sc_cinfo[ix];
324 1.57 thorpej ci->ci_vp = vpp[ix];
325 1.11 thorpej
326 1.11 thorpej /*
327 1.11 thorpej * Copy in the pathname of the component.
328 1.11 thorpej */
329 1.141 joerg memset(tmppath, 0, MAXPATHLEN); /* sanity */
330 1.29 christos error = copyinstr(cpaths[ix], tmppath,
331 1.29 christos MAXPATHLEN, &ci->ci_pathlen);
332 1.133 ad if (ci->ci_pathlen == 0)
333 1.133 ad error = EINVAL;
334 1.29 christos if (error) {
335 1.11 thorpej #ifdef DEBUG
336 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
337 1.35 christos printf("%s: can't copy path, error = %d\n",
338 1.23 thorpej cs->sc_xname, error);
339 1.11 thorpej #endif
340 1.67 enami goto out;
341 1.11 thorpej }
342 1.133 ad ci->ci_path = kmem_alloc(ci->ci_pathlen, KM_SLEEP);
343 1.72 thorpej memcpy(ci->ci_path, tmppath, ci->ci_pathlen);
344 1.67 enami path_alloced++;
345 1.11 thorpej
346 1.11 thorpej /*
347 1.11 thorpej * XXX: Cache the component's dev_t.
348 1.11 thorpej */
349 1.149 hannken ci->ci_dev = vpp[ix]->v_rdev;
350 1.11 thorpej
351 1.3 hpeyerl /*
352 1.11 thorpej * Get partition information for the component.
353 1.3 hpeyerl */
354 1.143 christos error = getdisksize(vpp[ix], &psize, &secsize);
355 1.29 christos if (error) {
356 1.11 thorpej #ifdef DEBUG
357 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
358 1.143 christos printf("%s: %s: disksize failed, error = %d\n",
359 1.23 thorpej cs->sc_xname, ci->ci_path, error);
360 1.11 thorpej #endif
361 1.67 enami goto out;
362 1.11 thorpej }
363 1.69 enami
364 1.11 thorpej /*
365 1.11 thorpej * Calculate the size, truncating to an interleave
366 1.11 thorpej * boundary if necessary.
367 1.11 thorpej */
368 1.143 christos maxsecsize = secsize > maxsecsize ? secsize : maxsecsize;
369 1.1 hpeyerl if (cs->sc_ileave > 1)
370 1.143 christos psize -= psize % cs->sc_ileave;
371 1.11 thorpej
372 1.143 christos if (psize == 0) {
373 1.11 thorpej #ifdef DEBUG
374 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
375 1.35 christos printf("%s: %s: size == 0\n",
376 1.23 thorpej cs->sc_xname, ci->ci_path);
377 1.11 thorpej #endif
378 1.67 enami error = ENODEV;
379 1.67 enami goto out;
380 1.3 hpeyerl }
381 1.11 thorpej
382 1.143 christos if (minsize == 0 || psize < minsize)
383 1.143 christos minsize = psize;
384 1.143 christos ci->ci_size = psize;
385 1.143 christos cs->sc_size += psize;
386 1.1 hpeyerl }
387 1.11 thorpej
388 1.11 thorpej /*
389 1.11 thorpej * Don't allow the interleave to be smaller than
390 1.11 thorpej * the biggest component sector.
391 1.11 thorpej */
392 1.11 thorpej if ((cs->sc_ileave > 0) &&
393 1.11 thorpej (cs->sc_ileave < (maxsecsize / DEV_BSIZE))) {
394 1.11 thorpej #ifdef DEBUG
395 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
396 1.35 christos printf("%s: interleave must be at least %d\n",
397 1.23 thorpej cs->sc_xname, (maxsecsize / DEV_BSIZE));
398 1.11 thorpej #endif
399 1.67 enami error = EINVAL;
400 1.67 enami goto out;
401 1.11 thorpej }
402 1.11 thorpej
403 1.1 hpeyerl /*
404 1.1 hpeyerl * If uniform interleave is desired set all sizes to that of
405 1.1 hpeyerl * the smallest component.
406 1.1 hpeyerl */
407 1.57 thorpej if (cs->sc_flags & CCDF_UNIFORM) {
408 1.1 hpeyerl for (ci = cs->sc_cinfo;
409 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
410 1.1 hpeyerl ci->ci_size = minsize;
411 1.24 thorpej
412 1.53 thorpej cs->sc_size = cs->sc_nccdisks * minsize;
413 1.1 hpeyerl }
414 1.11 thorpej
415 1.11 thorpej /*
416 1.11 thorpej * Construct the interleave table.
417 1.11 thorpej */
418 1.57 thorpej ccdinterleave(cs);
419 1.11 thorpej
420 1.1 hpeyerl /*
421 1.11 thorpej * Create pseudo-geometry based on 1MB cylinders. It's
422 1.11 thorpej * pretty close.
423 1.1 hpeyerl */
424 1.11 thorpej ccg->ccg_secsize = DEV_BSIZE;
425 1.19 thorpej ccg->ccg_ntracks = 1;
426 1.11 thorpej ccg->ccg_nsectors = 1024 * (1024 / ccg->ccg_secsize);
427 1.11 thorpej ccg->ccg_ncylinders = cs->sc_size / ccg->ccg_nsectors;
428 1.11 thorpej
429 1.133 ad /*
430 1.133 ad * Create thread to handle deferred I/O.
431 1.133 ad */
432 1.133 ad cs->sc_zap = false;
433 1.133 ad error = kthread_create(PRI_BIO, KTHREAD_MPSAFE, NULL, ccdthread,
434 1.133 ad cs, &cs->sc_thread, "%s", cs->sc_xname);
435 1.133 ad if (error) {
436 1.133 ad printf("ccdinit: can't create thread: %d\n", error);
437 1.133 ad goto out;
438 1.133 ad }
439 1.133 ad
440 1.133 ad /*
441 1.133 ad * Only now that everything is set up can we enable the device.
442 1.133 ad */
443 1.133 ad mutex_enter(cs->sc_iolock);
444 1.11 thorpej cs->sc_flags |= CCDF_INITED;
445 1.133 ad mutex_exit(cs->sc_iolock);
446 1.133 ad kmem_free(tmppath, MAXPATHLEN);
447 1.11 thorpej return (0);
448 1.67 enami
449 1.67 enami out:
450 1.133 ad for (ix = 0; ix < path_alloced; ix++) {
451 1.133 ad kmem_free(cs->sc_cinfo[ix].ci_path,
452 1.133 ad cs->sc_cinfo[ix].ci_pathlen);
453 1.133 ad }
454 1.133 ad kmem_free(cs->sc_cinfo, cs->sc_nccdisks * sizeof(struct ccdcinfo));
455 1.133 ad kmem_free(tmppath, MAXPATHLEN);
456 1.67 enami return (error);
457 1.1 hpeyerl }
458 1.1 hpeyerl
459 1.11 thorpej static void
460 1.97 thorpej ccdinterleave(struct ccd_softc *cs)
461 1.1 hpeyerl {
462 1.68 augustss struct ccdcinfo *ci, *smallci;
463 1.68 augustss struct ccdiinfo *ii;
464 1.68 augustss daddr_t bn, lbn;
465 1.68 augustss int ix;
466 1.1 hpeyerl u_long size;
467 1.1 hpeyerl
468 1.1 hpeyerl #ifdef DEBUG
469 1.3 hpeyerl if (ccddebug & CCDB_INIT)
470 1.35 christos printf("ccdinterleave(%p): ileave %d\n", cs, cs->sc_ileave);
471 1.1 hpeyerl #endif
472 1.1 hpeyerl /*
473 1.1 hpeyerl * Allocate an interleave table.
474 1.1 hpeyerl * Chances are this is too big, but we don't care.
475 1.1 hpeyerl */
476 1.1 hpeyerl size = (cs->sc_nccdisks + 1) * sizeof(struct ccdiinfo);
477 1.133 ad cs->sc_itable = kmem_zalloc(size, KM_SLEEP);
478 1.11 thorpej
479 1.1 hpeyerl /*
480 1.1 hpeyerl * Trivial case: no interleave (actually interleave of disk size).
481 1.11 thorpej * Each table entry represents a single component in its entirety.
482 1.1 hpeyerl */
483 1.1 hpeyerl if (cs->sc_ileave == 0) {
484 1.1 hpeyerl bn = 0;
485 1.1 hpeyerl ii = cs->sc_itable;
486 1.11 thorpej
487 1.1 hpeyerl for (ix = 0; ix < cs->sc_nccdisks; ix++) {
488 1.19 thorpej /* Allocate space for ii_index. */
489 1.133 ad ii->ii_indexsz = sizeof(int);
490 1.133 ad ii->ii_index = kmem_alloc(ii->ii_indexsz, KM_SLEEP);
491 1.1 hpeyerl ii->ii_ndisk = 1;
492 1.1 hpeyerl ii->ii_startblk = bn;
493 1.1 hpeyerl ii->ii_startoff = 0;
494 1.1 hpeyerl ii->ii_index[0] = ix;
495 1.1 hpeyerl bn += cs->sc_cinfo[ix].ci_size;
496 1.1 hpeyerl ii++;
497 1.1 hpeyerl }
498 1.1 hpeyerl ii->ii_ndisk = 0;
499 1.1 hpeyerl #ifdef DEBUG
500 1.3 hpeyerl if (ccddebug & CCDB_INIT)
501 1.1 hpeyerl printiinfo(cs->sc_itable);
502 1.1 hpeyerl #endif
503 1.11 thorpej return;
504 1.1 hpeyerl }
505 1.11 thorpej
506 1.1 hpeyerl /*
507 1.1 hpeyerl * The following isn't fast or pretty; it doesn't have to be.
508 1.1 hpeyerl */
509 1.1 hpeyerl size = 0;
510 1.1 hpeyerl bn = lbn = 0;
511 1.1 hpeyerl for (ii = cs->sc_itable; ; ii++) {
512 1.11 thorpej /* Allocate space for ii_index. */
513 1.133 ad ii->ii_indexsz = sizeof(int) * cs->sc_nccdisks;
514 1.133 ad ii->ii_index = kmem_alloc(ii->ii_indexsz, KM_SLEEP);
515 1.11 thorpej
516 1.1 hpeyerl /*
517 1.1 hpeyerl * Locate the smallest of the remaining components
518 1.1 hpeyerl */
519 1.1 hpeyerl smallci = NULL;
520 1.1 hpeyerl for (ci = cs->sc_cinfo;
521 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
522 1.1 hpeyerl if (ci->ci_size > size &&
523 1.1 hpeyerl (smallci == NULL ||
524 1.1 hpeyerl ci->ci_size < smallci->ci_size))
525 1.1 hpeyerl smallci = ci;
526 1.11 thorpej
527 1.1 hpeyerl /*
528 1.1 hpeyerl * Nobody left, all done
529 1.1 hpeyerl */
530 1.1 hpeyerl if (smallci == NULL) {
531 1.1 hpeyerl ii->ii_ndisk = 0;
532 1.1 hpeyerl break;
533 1.1 hpeyerl }
534 1.11 thorpej
535 1.1 hpeyerl /*
536 1.1 hpeyerl * Record starting logical block and component offset
537 1.1 hpeyerl */
538 1.1 hpeyerl ii->ii_startblk = bn / cs->sc_ileave;
539 1.1 hpeyerl ii->ii_startoff = lbn;
540 1.11 thorpej
541 1.1 hpeyerl /*
542 1.1 hpeyerl * Determine how many disks take part in this interleave
543 1.1 hpeyerl * and record their indices.
544 1.1 hpeyerl */
545 1.1 hpeyerl ix = 0;
546 1.1 hpeyerl for (ci = cs->sc_cinfo;
547 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
548 1.1 hpeyerl if (ci->ci_size >= smallci->ci_size)
549 1.1 hpeyerl ii->ii_index[ix++] = ci - cs->sc_cinfo;
550 1.1 hpeyerl ii->ii_ndisk = ix;
551 1.1 hpeyerl bn += ix * (smallci->ci_size - size);
552 1.1 hpeyerl lbn = smallci->ci_size / cs->sc_ileave;
553 1.1 hpeyerl size = smallci->ci_size;
554 1.1 hpeyerl }
555 1.1 hpeyerl #ifdef DEBUG
556 1.3 hpeyerl if (ccddebug & CCDB_INIT)
557 1.1 hpeyerl printiinfo(cs->sc_itable);
558 1.1 hpeyerl #endif
559 1.1 hpeyerl }
560 1.1 hpeyerl
561 1.11 thorpej /* ARGSUSED */
562 1.97 thorpej static int
563 1.116 christos ccdopen(dev_t dev, int flags, int fmt, struct lwp *l)
564 1.1 hpeyerl {
565 1.1 hpeyerl int unit = ccdunit(dev);
566 1.11 thorpej struct ccd_softc *cs;
567 1.11 thorpej struct disklabel *lp;
568 1.15 thorpej int error = 0, part, pmask;
569 1.1 hpeyerl
570 1.1 hpeyerl #ifdef DEBUG
571 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
572 1.131 cegger printf("ccdopen(0x%"PRIx64", 0x%x)\n", dev, flags);
573 1.1 hpeyerl #endif
574 1.144 christos if ((cs = ccdget(unit)) == NULL)
575 1.144 christos return ENXIO;
576 1.15 thorpej
577 1.133 ad mutex_enter(&cs->sc_dvlock);
578 1.15 thorpej
579 1.23 thorpej lp = cs->sc_dkdev.dk_label;
580 1.11 thorpej
581 1.11 thorpej part = DISKPART(dev);
582 1.11 thorpej pmask = (1 << part);
583 1.11 thorpej
584 1.15 thorpej /*
585 1.15 thorpej * If we're initialized, check to see if there are any other
586 1.15 thorpej * open partitions. If not, then it's safe to update
587 1.87 thorpej * the in-core disklabel. Only read the disklabel if it is
588 1.87 thorpej * not already valid.
589 1.15 thorpej */
590 1.87 thorpej if ((cs->sc_flags & (CCDF_INITED|CCDF_VLABEL)) == CCDF_INITED &&
591 1.87 thorpej cs->sc_dkdev.dk_openmask == 0)
592 1.15 thorpej ccdgetdisklabel(dev);
593 1.15 thorpej
594 1.11 thorpej /* Check that the partition exists. */
595 1.27 thorpej if (part != RAW_PART) {
596 1.27 thorpej if (((cs->sc_flags & CCDF_INITED) == 0) ||
597 1.37 thorpej ((part >= lp->d_npartitions) ||
598 1.27 thorpej (lp->d_partitions[part].p_fstype == FS_UNUSED))) {
599 1.27 thorpej error = ENXIO;
600 1.27 thorpej goto done;
601 1.27 thorpej }
602 1.15 thorpej }
603 1.11 thorpej
604 1.11 thorpej /* Prevent our unit from being unconfigured while open. */
605 1.11 thorpej switch (fmt) {
606 1.11 thorpej case S_IFCHR:
607 1.11 thorpej cs->sc_dkdev.dk_copenmask |= pmask;
608 1.11 thorpej break;
609 1.11 thorpej
610 1.11 thorpej case S_IFBLK:
611 1.11 thorpej cs->sc_dkdev.dk_bopenmask |= pmask;
612 1.11 thorpej break;
613 1.11 thorpej }
614 1.11 thorpej cs->sc_dkdev.dk_openmask =
615 1.11 thorpej cs->sc_dkdev.dk_copenmask | cs->sc_dkdev.dk_bopenmask;
616 1.11 thorpej
617 1.15 thorpej done:
618 1.133 ad mutex_exit(&cs->sc_dvlock);
619 1.33 thorpej return (error);
620 1.7 cgd }
621 1.7 cgd
622 1.11 thorpej /* ARGSUSED */
623 1.97 thorpej static int
624 1.116 christos ccdclose(dev_t dev, int flags, int fmt, struct lwp *l)
625 1.7 cgd {
626 1.11 thorpej int unit = ccdunit(dev);
627 1.11 thorpej struct ccd_softc *cs;
628 1.117 ad int part;
629 1.11 thorpej
630 1.7 cgd #ifdef DEBUG
631 1.7 cgd if (ccddebug & CCDB_FOLLOW)
632 1.131 cegger printf("ccdclose(0x%"PRIx64", 0x%x)\n", dev, flags);
633 1.7 cgd #endif
634 1.11 thorpej
635 1.144 christos if ((cs = ccdget(unit)) == NULL)
636 1.144 christos return ENXIO;
637 1.15 thorpej
638 1.133 ad mutex_enter(&cs->sc_dvlock);
639 1.15 thorpej
640 1.11 thorpej part = DISKPART(dev);
641 1.11 thorpej
642 1.11 thorpej /* ...that much closer to allowing unconfiguration... */
643 1.11 thorpej switch (fmt) {
644 1.11 thorpej case S_IFCHR:
645 1.11 thorpej cs->sc_dkdev.dk_copenmask &= ~(1 << part);
646 1.11 thorpej break;
647 1.11 thorpej
648 1.11 thorpej case S_IFBLK:
649 1.11 thorpej cs->sc_dkdev.dk_bopenmask &= ~(1 << part);
650 1.11 thorpej break;
651 1.11 thorpej }
652 1.11 thorpej cs->sc_dkdev.dk_openmask =
653 1.11 thorpej cs->sc_dkdev.dk_copenmask | cs->sc_dkdev.dk_bopenmask;
654 1.11 thorpej
655 1.87 thorpej if (cs->sc_dkdev.dk_openmask == 0) {
656 1.87 thorpej if ((cs->sc_flags & CCDF_KLABEL) == 0)
657 1.87 thorpej cs->sc_flags &= ~CCDF_VLABEL;
658 1.87 thorpej }
659 1.87 thorpej
660 1.133 ad mutex_exit(&cs->sc_dvlock);
661 1.7 cgd return (0);
662 1.1 hpeyerl }
663 1.1 hpeyerl
664 1.133 ad static bool
665 1.133 ad ccdbackoff(struct ccd_softc *cs)
666 1.133 ad {
667 1.133 ad
668 1.133 ad /* XXX Arbitrary, should be a uvm call. */
669 1.133 ad return uvmexp.free < (uvmexp.freemin >> 1) &&
670 1.133 ad disk_isbusy(&cs->sc_dkdev);
671 1.133 ad }
672 1.133 ad
673 1.133 ad static void
674 1.133 ad ccdthread(void *cookie)
675 1.133 ad {
676 1.133 ad struct ccd_softc *cs;
677 1.133 ad
678 1.133 ad cs = cookie;
679 1.133 ad
680 1.133 ad #ifdef DEBUG
681 1.133 ad if (ccddebug & CCDB_FOLLOW)
682 1.133 ad printf("ccdthread: hello\n");
683 1.133 ad #endif
684 1.133 ad
685 1.133 ad mutex_enter(cs->sc_iolock);
686 1.133 ad while (__predict_true(!cs->sc_zap)) {
687 1.133 ad if (bufq_peek(cs->sc_bufq) == NULL) {
688 1.133 ad /* Nothing to do. */
689 1.133 ad cv_wait(&cs->sc_push, cs->sc_iolock);
690 1.133 ad continue;
691 1.133 ad }
692 1.133 ad if (ccdbackoff(cs)) {
693 1.133 ad /* Wait for memory to become available. */
694 1.133 ad (void)cv_timedwait(&cs->sc_push, cs->sc_iolock, 1);
695 1.133 ad continue;
696 1.133 ad }
697 1.133 ad #ifdef DEBUG
698 1.133 ad if (ccddebug & CCDB_FOLLOW)
699 1.133 ad printf("ccdthread: dispatching I/O\n");
700 1.133 ad #endif
701 1.133 ad ccdstart(cs);
702 1.133 ad mutex_enter(cs->sc_iolock);
703 1.133 ad }
704 1.133 ad cs->sc_thread = NULL;
705 1.133 ad mutex_exit(cs->sc_iolock);
706 1.133 ad #ifdef DEBUG
707 1.133 ad if (ccddebug & CCDB_FOLLOW)
708 1.133 ad printf("ccdthread: goodbye\n");
709 1.133 ad #endif
710 1.133 ad kthread_exit(0);
711 1.133 ad }
712 1.133 ad
713 1.97 thorpej static void
714 1.97 thorpej ccdstrategy(struct buf *bp)
715 1.1 hpeyerl {
716 1.68 augustss int unit = ccdunit(bp->b_dev);
717 1.144 christos struct ccd_softc *cs;
718 1.144 christos if ((cs = ccdget(unit)) == NULL)
719 1.144 christos return;
720 1.133 ad
721 1.133 ad /* Must be open or reading label. */
722 1.133 ad KASSERT(cs->sc_dkdev.dk_openmask != 0 ||
723 1.133 ad (cs->sc_flags & CCDF_RLABEL) != 0);
724 1.133 ad
725 1.133 ad mutex_enter(cs->sc_iolock);
726 1.133 ad /* Synchronize with device init/uninit. */
727 1.133 ad if (__predict_false((cs->sc_flags & CCDF_INITED) == 0)) {
728 1.133 ad mutex_exit(cs->sc_iolock);
729 1.133 ad #ifdef DEBUG
730 1.133 ad if (ccddebug & CCDB_FOLLOW)
731 1.133 ad printf("ccdstrategy: unit %d: not inited\n", unit);
732 1.133 ad #endif
733 1.133 ad bp->b_error = ENXIO;
734 1.133 ad bp->b_resid = bp->b_bcount;
735 1.133 ad biodone(bp);
736 1.133 ad return;
737 1.133 ad }
738 1.133 ad
739 1.133 ad /* Defer to thread if system is low on memory. */
740 1.133 ad bufq_put(cs->sc_bufq, bp);
741 1.133 ad if (__predict_false(ccdbackoff(cs))) {
742 1.133 ad mutex_exit(cs->sc_iolock);
743 1.133 ad #ifdef DEBUG
744 1.133 ad if (ccddebug & CCDB_FOLLOW)
745 1.133 ad printf("ccdstrategy: holding off on I/O\n");
746 1.133 ad #endif
747 1.133 ad return;
748 1.133 ad }
749 1.133 ad ccdstart(cs);
750 1.133 ad }
751 1.133 ad
752 1.133 ad static void
753 1.133 ad ccdstart(struct ccd_softc *cs)
754 1.133 ad {
755 1.88 thorpej daddr_t blkno;
756 1.11 thorpej int wlabel;
757 1.15 thorpej struct disklabel *lp;
758 1.133 ad long bcount, rcount;
759 1.133 ad struct ccdbuf *cbp;
760 1.133 ad char *addr;
761 1.133 ad daddr_t bn;
762 1.133 ad vnode_t *vp;
763 1.133 ad buf_t *bp;
764 1.133 ad
765 1.133 ad KASSERT(mutex_owned(cs->sc_iolock));
766 1.133 ad
767 1.133 ad disk_busy(&cs->sc_dkdev);
768 1.133 ad bp = bufq_get(cs->sc_bufq);
769 1.133 ad KASSERT(bp != NULL);
770 1.1 hpeyerl
771 1.1 hpeyerl #ifdef DEBUG
772 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
773 1.133 ad printf("ccdstart(%s, %p)\n", cs->sc_xname, bp);
774 1.59 thorpej #endif
775 1.11 thorpej
776 1.11 thorpej /* If it's a nil transfer, wake up the top half now. */
777 1.11 thorpej if (bp->b_bcount == 0)
778 1.11 thorpej goto done;
779 1.11 thorpej
780 1.23 thorpej lp = cs->sc_dkdev.dk_label;
781 1.15 thorpej
782 1.11 thorpej /*
783 1.17 thorpej * Do bounds checking and adjust transfer. If there's an
784 1.88 thorpej * error, the bounds check will flag that for us. Convert
785 1.88 thorpej * the partition relative block number to an absolute.
786 1.11 thorpej */
787 1.88 thorpej blkno = bp->b_blkno;
788 1.11 thorpej wlabel = cs->sc_flags & (CCDF_WLABEL|CCDF_LABELLING);
789 1.88 thorpej if (DISKPART(bp->b_dev) != RAW_PART) {
790 1.86 thorpej if (bounds_check_with_label(&cs->sc_dkdev, bp, wlabel) <= 0)
791 1.1 hpeyerl goto done;
792 1.88 thorpej blkno += lp->d_partitions[DISKPART(bp->b_dev)].p_offset;
793 1.88 thorpej }
794 1.133 ad mutex_exit(cs->sc_iolock);
795 1.88 thorpej bp->b_rawblkno = blkno;
796 1.11 thorpej
797 1.133 ad /* Allocate the component buffers and start I/O! */
798 1.133 ad bp->b_resid = bp->b_bcount;
799 1.133 ad bn = bp->b_rawblkno;
800 1.133 ad addr = bp->b_data;
801 1.133 ad for (bcount = bp->b_bcount; bcount > 0; bcount -= rcount) {
802 1.133 ad cbp = ccdbuffer(cs, bp, bn, addr, bcount);
803 1.133 ad rcount = cbp->cb_buf.b_bcount;
804 1.133 ad bn += btodb(rcount);
805 1.133 ad addr += rcount;
806 1.133 ad vp = cbp->cb_buf.b_vp;
807 1.133 ad if ((cbp->cb_buf.b_flags & B_READ) == 0) {
808 1.139 rmind mutex_enter(vp->v_interlock);
809 1.133 ad vp->v_numoutput++;
810 1.139 rmind mutex_exit(vp->v_interlock);
811 1.133 ad }
812 1.133 ad (void)VOP_STRATEGY(vp, &cbp->cb_buf);
813 1.133 ad }
814 1.1 hpeyerl return;
815 1.88 thorpej
816 1.88 thorpej done:
817 1.133 ad disk_unbusy(&cs->sc_dkdev, 0, 0);
818 1.133 ad cv_broadcast(&cs->sc_stop);
819 1.133 ad cv_broadcast(&cs->sc_push);
820 1.133 ad mutex_exit(cs->sc_iolock);
821 1.88 thorpej bp->b_resid = bp->b_bcount;
822 1.1 hpeyerl biodone(bp);
823 1.1 hpeyerl }
824 1.1 hpeyerl
825 1.1 hpeyerl /*
826 1.1 hpeyerl * Build a component buffer header.
827 1.1 hpeyerl */
828 1.55 thorpej static struct ccdbuf *
829 1.118 christos ccdbuffer(struct ccd_softc *cs, struct buf *bp, daddr_t bn, void *addr,
830 1.97 thorpej long bcount)
831 1.1 hpeyerl {
832 1.68 augustss struct ccdcinfo *ci;
833 1.68 augustss struct ccdbuf *cbp;
834 1.68 augustss daddr_t cbn, cboff;
835 1.68 augustss u_int64_t cbc;
836 1.36 thorpej int ccdisk;
837 1.1 hpeyerl
838 1.1 hpeyerl #ifdef DEBUG
839 1.3 hpeyerl if (ccddebug & CCDB_IO)
840 1.81 kleink printf("ccdbuffer(%p, %p, %" PRId64 ", %p, %ld)\n",
841 1.1 hpeyerl cs, bp, bn, addr, bcount);
842 1.1 hpeyerl #endif
843 1.1 hpeyerl /*
844 1.1 hpeyerl * Determine which component bn falls in.
845 1.1 hpeyerl */
846 1.1 hpeyerl cbn = bn;
847 1.1 hpeyerl cboff = 0;
848 1.11 thorpej
849 1.1 hpeyerl /*
850 1.1 hpeyerl * Serially concatenated
851 1.1 hpeyerl */
852 1.1 hpeyerl if (cs->sc_ileave == 0) {
853 1.68 augustss daddr_t sblk;
854 1.1 hpeyerl
855 1.1 hpeyerl sblk = 0;
856 1.36 thorpej for (ccdisk = 0, ci = &cs->sc_cinfo[ccdisk];
857 1.36 thorpej cbn >= sblk + ci->ci_size;
858 1.36 thorpej ccdisk++, ci = &cs->sc_cinfo[ccdisk])
859 1.1 hpeyerl sblk += ci->ci_size;
860 1.1 hpeyerl cbn -= sblk;
861 1.1 hpeyerl }
862 1.1 hpeyerl /*
863 1.1 hpeyerl * Interleaved
864 1.1 hpeyerl */
865 1.1 hpeyerl else {
866 1.68 augustss struct ccdiinfo *ii;
867 1.36 thorpej int off;
868 1.1 hpeyerl
869 1.1 hpeyerl cboff = cbn % cs->sc_ileave;
870 1.1 hpeyerl cbn /= cs->sc_ileave;
871 1.1 hpeyerl for (ii = cs->sc_itable; ii->ii_ndisk; ii++)
872 1.1 hpeyerl if (ii->ii_startblk > cbn)
873 1.1 hpeyerl break;
874 1.1 hpeyerl ii--;
875 1.1 hpeyerl off = cbn - ii->ii_startblk;
876 1.1 hpeyerl if (ii->ii_ndisk == 1) {
877 1.1 hpeyerl ccdisk = ii->ii_index[0];
878 1.1 hpeyerl cbn = ii->ii_startoff + off;
879 1.1 hpeyerl } else {
880 1.53 thorpej ccdisk = ii->ii_index[off % ii->ii_ndisk];
881 1.53 thorpej cbn = ii->ii_startoff + off / ii->ii_ndisk;
882 1.1 hpeyerl }
883 1.1 hpeyerl cbn *= cs->sc_ileave;
884 1.1 hpeyerl ci = &cs->sc_cinfo[ccdisk];
885 1.1 hpeyerl }
886 1.11 thorpej
887 1.1 hpeyerl /*
888 1.1 hpeyerl * Fill in the component buf structure.
889 1.1 hpeyerl */
890 1.63 thorpej cbp = CCD_GETBUF();
891 1.133 ad KASSERT(cbp != NULL);
892 1.126 ad buf_init(&cbp->cb_buf);
893 1.126 ad cbp->cb_buf.b_flags = bp->b_flags;
894 1.126 ad cbp->cb_buf.b_oflags = bp->b_oflags;
895 1.126 ad cbp->cb_buf.b_cflags = bp->b_cflags;
896 1.29 christos cbp->cb_buf.b_iodone = ccdiodone;
897 1.6 cgd cbp->cb_buf.b_proc = bp->b_proc;
898 1.95 hannken cbp->cb_buf.b_dev = ci->ci_dev;
899 1.6 cgd cbp->cb_buf.b_blkno = cbn + cboff;
900 1.6 cgd cbp->cb_buf.b_data = addr;
901 1.11 thorpej cbp->cb_buf.b_vp = ci->ci_vp;
902 1.139 rmind cbp->cb_buf.b_objlock = ci->ci_vp->v_interlock;
903 1.1 hpeyerl if (cs->sc_ileave == 0)
904 1.50 thorpej cbc = dbtob((u_int64_t)(ci->ci_size - cbn));
905 1.1 hpeyerl else
906 1.50 thorpej cbc = dbtob((u_int64_t)(cs->sc_ileave - cboff));
907 1.50 thorpej cbp->cb_buf.b_bcount = cbc < bcount ? cbc : bcount;
908 1.6 cgd
909 1.1 hpeyerl /*
910 1.6 cgd * context for ccdiodone
911 1.1 hpeyerl */
912 1.6 cgd cbp->cb_obp = bp;
913 1.59 thorpej cbp->cb_sc = cs;
914 1.36 thorpej cbp->cb_comp = ccdisk;
915 1.6 cgd
916 1.94 yamt BIO_COPYPRIO(&cbp->cb_buf, bp);
917 1.94 yamt
918 1.1 hpeyerl #ifdef DEBUG
919 1.3 hpeyerl if (ccddebug & CCDB_IO)
920 1.131 cegger printf(" dev 0x%"PRIx64"(u%lu): cbp %p bn %" PRId64 " addr %p"
921 1.99 yamt " bcnt %d\n",
922 1.62 mjacob ci->ci_dev, (unsigned long) (ci-cs->sc_cinfo), cbp,
923 1.62 mjacob cbp->cb_buf.b_blkno, cbp->cb_buf.b_data,
924 1.62 mjacob cbp->cb_buf.b_bcount);
925 1.1 hpeyerl #endif
926 1.55 thorpej
927 1.55 thorpej return (cbp);
928 1.1 hpeyerl }
929 1.1 hpeyerl
930 1.1 hpeyerl /*
931 1.11 thorpej * Called at interrupt time.
932 1.1 hpeyerl * Mark the component as done and if all components are done,
933 1.1 hpeyerl * take a ccd interrupt.
934 1.1 hpeyerl */
935 1.97 thorpej static void
936 1.97 thorpej ccdiodone(struct buf *vbp)
937 1.1 hpeyerl {
938 1.29 christos struct ccdbuf *cbp = (struct ccdbuf *) vbp;
939 1.59 thorpej struct buf *bp = cbp->cb_obp;
940 1.59 thorpej struct ccd_softc *cs = cbp->cb_sc;
941 1.133 ad int count;
942 1.1 hpeyerl
943 1.1 hpeyerl #ifdef DEBUG
944 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
945 1.35 christos printf("ccdiodone(%p)\n", cbp);
946 1.3 hpeyerl if (ccddebug & CCDB_IO) {
947 1.99 yamt printf("ccdiodone: bp %p bcount %d resid %d\n",
948 1.53 thorpej bp, bp->b_bcount, bp->b_resid);
949 1.131 cegger printf(" dev 0x%"PRIx64"(u%d), cbp %p bn %" PRId64 " addr %p"
950 1.99 yamt " bcnt %d\n",
951 1.6 cgd cbp->cb_buf.b_dev, cbp->cb_comp, cbp,
952 1.6 cgd cbp->cb_buf.b_blkno, cbp->cb_buf.b_data,
953 1.6 cgd cbp->cb_buf.b_bcount);
954 1.1 hpeyerl }
955 1.1 hpeyerl #endif
956 1.1 hpeyerl
957 1.122 ad if (cbp->cb_buf.b_error != 0) {
958 1.122 ad bp->b_error = cbp->cb_buf.b_error;
959 1.53 thorpej printf("%s: error %d on component %d\n",
960 1.53 thorpej cs->sc_xname, bp->b_error, cbp->cb_comp);
961 1.1 hpeyerl }
962 1.6 cgd count = cbp->cb_buf.b_bcount;
963 1.126 ad buf_destroy(&cbp->cb_buf);
964 1.63 thorpej CCD_PUTBUF(cbp);
965 1.1 hpeyerl
966 1.1 hpeyerl /*
967 1.1 hpeyerl * If all done, "interrupt".
968 1.53 thorpej */
969 1.133 ad mutex_enter(cs->sc_iolock);
970 1.53 thorpej bp->b_resid -= count;
971 1.53 thorpej if (bp->b_resid < 0)
972 1.53 thorpej panic("ccdiodone: count");
973 1.133 ad if (bp->b_resid == 0) {
974 1.133 ad /*
975 1.133 ad * Request is done for better or worse, wakeup the top half.
976 1.133 ad */
977 1.133 ad if (bp->b_error != 0)
978 1.133 ad bp->b_resid = bp->b_bcount;
979 1.133 ad disk_unbusy(&cs->sc_dkdev, (bp->b_bcount - bp->b_resid),
980 1.133 ad (bp->b_flags & B_READ));
981 1.133 ad if (!disk_isbusy(&cs->sc_dkdev)) {
982 1.133 ad if (bufq_peek(cs->sc_bufq) != NULL) {
983 1.133 ad cv_broadcast(&cs->sc_push);
984 1.133 ad }
985 1.133 ad cv_broadcast(&cs->sc_stop);
986 1.133 ad }
987 1.133 ad mutex_exit(cs->sc_iolock);
988 1.133 ad biodone(bp);
989 1.133 ad } else
990 1.133 ad mutex_exit(cs->sc_iolock);
991 1.1 hpeyerl }
992 1.1 hpeyerl
993 1.11 thorpej /* ARGSUSED */
994 1.97 thorpej static int
995 1.116 christos ccdread(dev_t dev, struct uio *uio, int flags)
996 1.3 hpeyerl {
997 1.11 thorpej int unit = ccdunit(dev);
998 1.11 thorpej struct ccd_softc *cs;
999 1.3 hpeyerl
1000 1.3 hpeyerl #ifdef DEBUG
1001 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
1002 1.131 cegger printf("ccdread(0x%"PRIx64", %p)\n", dev, uio);
1003 1.3 hpeyerl #endif
1004 1.144 christos if ((cs = ccdget(unit)) == NULL)
1005 1.144 christos return 0;
1006 1.11 thorpej
1007 1.133 ad /* Unlocked advisory check, ccdstrategy check is synchronous. */
1008 1.11 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1009 1.11 thorpej return (ENXIO);
1010 1.11 thorpej
1011 1.10 mycroft return (physio(ccdstrategy, NULL, dev, B_READ, minphys, uio));
1012 1.3 hpeyerl }
1013 1.3 hpeyerl
1014 1.11 thorpej /* ARGSUSED */
1015 1.97 thorpej static int
1016 1.116 christos ccdwrite(dev_t dev, struct uio *uio, int flags)
1017 1.3 hpeyerl {
1018 1.11 thorpej int unit = ccdunit(dev);
1019 1.11 thorpej struct ccd_softc *cs;
1020 1.3 hpeyerl
1021 1.3 hpeyerl #ifdef DEBUG
1022 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
1023 1.131 cegger printf("ccdwrite(0x%"PRIx64", %p)\n", dev, uio);
1024 1.3 hpeyerl #endif
1025 1.144 christos if ((cs = ccdget(unit)) == NULL)
1026 1.144 christos return ENOENT;
1027 1.11 thorpej
1028 1.133 ad /* Unlocked advisory check, ccdstrategy check is synchronous. */
1029 1.11 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1030 1.11 thorpej return (ENXIO);
1031 1.11 thorpej
1032 1.10 mycroft return (physio(ccdstrategy, NULL, dev, B_WRITE, minphys, uio));
1033 1.3 hpeyerl }
1034 1.3 hpeyerl
1035 1.97 thorpej static int
1036 1.118 christos ccdioctl(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
1037 1.1 hpeyerl {
1038 1.11 thorpej int unit = ccdunit(dev);
1039 1.133 ad int i, j, lookedup = 0, error = 0;
1040 1.39 mycroft int part, pmask;
1041 1.11 thorpej struct ccd_softc *cs;
1042 1.11 thorpej struct ccd_ioctl *ccio = (struct ccd_ioctl *)data;
1043 1.110 elad kauth_cred_t uc;
1044 1.11 thorpej char **cpp;
1045 1.136 dholland struct pathbuf *pb;
1046 1.11 thorpej struct vnode **vpp;
1047 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1048 1.70 fvdl struct disklabel newlabel;
1049 1.70 fvdl #endif
1050 1.11 thorpej
1051 1.144 christos if ((cs = ccdget(unit)) == NULL)
1052 1.144 christos return ENOENT;
1053 1.133 ad uc = kauth_cred_get();
1054 1.109 jld
1055 1.41 thorpej /* Must be open for writes for these commands... */
1056 1.41 thorpej switch (cmd) {
1057 1.41 thorpej case CCDIOCSET:
1058 1.41 thorpej case CCDIOCCLR:
1059 1.41 thorpej case DIOCSDINFO:
1060 1.41 thorpej case DIOCWDINFO:
1061 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1062 1.70 fvdl case ODIOCSDINFO:
1063 1.70 fvdl case ODIOCWDINFO:
1064 1.70 fvdl #endif
1065 1.87 thorpej case DIOCKLABEL:
1066 1.41 thorpej case DIOCWLABEL:
1067 1.41 thorpej if ((flag & FWRITE) == 0)
1068 1.41 thorpej return (EBADF);
1069 1.41 thorpej }
1070 1.41 thorpej
1071 1.133 ad mutex_enter(&cs->sc_dvlock);
1072 1.57 thorpej
1073 1.41 thorpej /* Must be initialized for these... */
1074 1.41 thorpej switch (cmd) {
1075 1.41 thorpej case CCDIOCCLR:
1076 1.42 kleink case DIOCGDINFO:
1077 1.100 thorpej case DIOCCACHESYNC:
1078 1.42 kleink case DIOCSDINFO:
1079 1.42 kleink case DIOCWDINFO:
1080 1.42 kleink case DIOCGPART:
1081 1.41 thorpej case DIOCWLABEL:
1082 1.87 thorpej case DIOCKLABEL:
1083 1.44 thorpej case DIOCGDEFLABEL:
1084 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1085 1.70 fvdl case ODIOCGDINFO:
1086 1.70 fvdl case ODIOCSDINFO:
1087 1.70 fvdl case ODIOCWDINFO:
1088 1.70 fvdl case ODIOCGDEFLABEL:
1089 1.70 fvdl #endif
1090 1.57 thorpej if ((cs->sc_flags & CCDF_INITED) == 0) {
1091 1.57 thorpej error = ENXIO;
1092 1.57 thorpej goto out;
1093 1.57 thorpej }
1094 1.41 thorpej }
1095 1.41 thorpej
1096 1.11 thorpej switch (cmd) {
1097 1.11 thorpej case CCDIOCSET:
1098 1.57 thorpej if (cs->sc_flags & CCDF_INITED) {
1099 1.57 thorpej error = EBUSY;
1100 1.57 thorpej goto out;
1101 1.57 thorpej }
1102 1.54 thorpej
1103 1.54 thorpej /* Validate the flags. */
1104 1.57 thorpej if ((ccio->ccio_flags & CCDF_USERMASK) != ccio->ccio_flags) {
1105 1.57 thorpej error = EINVAL;
1106 1.57 thorpej goto out;
1107 1.57 thorpej }
1108 1.15 thorpej
1109 1.133 ad if (ccio->ccio_ndisks > CCD_MAXNDISKS ||
1110 1.133 ad ccio->ccio_ndisks == 0) {
1111 1.73 jdolecek error = EINVAL;
1112 1.73 jdolecek goto out;
1113 1.73 jdolecek }
1114 1.102 perry
1115 1.11 thorpej /* Fill in some important bits. */
1116 1.57 thorpej cs->sc_ileave = ccio->ccio_ileave;
1117 1.57 thorpej cs->sc_nccdisks = ccio->ccio_ndisks;
1118 1.57 thorpej cs->sc_flags = ccio->ccio_flags & CCDF_USERMASK;
1119 1.11 thorpej
1120 1.11 thorpej /*
1121 1.11 thorpej * Allocate space for and copy in the array of
1122 1.11 thorpej * componet pathnames and device numbers.
1123 1.11 thorpej */
1124 1.133 ad cpp = kmem_alloc(ccio->ccio_ndisks * sizeof(*cpp), KM_SLEEP);
1125 1.133 ad vpp = kmem_alloc(ccio->ccio_ndisks * sizeof(*vpp), KM_SLEEP);
1126 1.84 dsl error = copyin(ccio->ccio_disks, cpp,
1127 1.133 ad ccio->ccio_ndisks * sizeof(*cpp));
1128 1.11 thorpej if (error) {
1129 1.133 ad kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1130 1.133 ad kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1131 1.57 thorpej goto out;
1132 1.11 thorpej }
1133 1.11 thorpej
1134 1.11 thorpej #ifdef DEBUG
1135 1.11 thorpej if (ccddebug & CCDB_INIT)
1136 1.11 thorpej for (i = 0; i < ccio->ccio_ndisks; ++i)
1137 1.104 christos printf("ccdioctl: component %d: %p\n",
1138 1.11 thorpej i, cpp[i]);
1139 1.11 thorpej #endif
1140 1.11 thorpej
1141 1.11 thorpej for (i = 0; i < ccio->ccio_ndisks; ++i) {
1142 1.11 thorpej #ifdef DEBUG
1143 1.11 thorpej if (ccddebug & CCDB_INIT)
1144 1.35 christos printf("ccdioctl: lookedup = %d\n", lookedup);
1145 1.11 thorpej #endif
1146 1.136 dholland error = pathbuf_copyin(cpp[i], &pb);
1147 1.137 dholland if (error == 0) {
1148 1.137 dholland error = dk_lookup(pb, l, &vpp[i]);
1149 1.136 dholland }
1150 1.136 dholland pathbuf_destroy(pb);
1151 1.136 dholland if (error != 0) {
1152 1.11 thorpej for (j = 0; j < lookedup; ++j)
1153 1.12 thorpej (void)vn_close(vpp[j], FREAD|FWRITE,
1154 1.128 ad uc);
1155 1.133 ad kmem_free(vpp, ccio->ccio_ndisks *
1156 1.133 ad sizeof(*vpp));
1157 1.133 ad kmem_free(cpp, ccio->ccio_ndisks *
1158 1.133 ad sizeof(*cpp));
1159 1.57 thorpej goto out;
1160 1.11 thorpej }
1161 1.11 thorpej ++lookedup;
1162 1.11 thorpej }
1163 1.11 thorpej
1164 1.133 ad /* Attach the disk. */
1165 1.133 ad disk_attach(&cs->sc_dkdev);
1166 1.133 ad bufq_alloc(&cs->sc_bufq, "fcfs", 0);
1167 1.133 ad
1168 1.11 thorpej /*
1169 1.11 thorpej * Initialize the ccd. Fills in the softc for us.
1170 1.11 thorpej */
1171 1.107 christos if ((error = ccdinit(cs, cpp, vpp, l)) != 0) {
1172 1.11 thorpej for (j = 0; j < lookedup; ++j)
1173 1.18 thorpej (void)vn_close(vpp[j], FREAD|FWRITE,
1174 1.128 ad uc);
1175 1.133 ad kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1176 1.133 ad kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1177 1.133 ad disk_detach(&cs->sc_dkdev);
1178 1.133 ad bufq_free(cs->sc_bufq);
1179 1.57 thorpej goto out;
1180 1.11 thorpej }
1181 1.11 thorpej
1182 1.57 thorpej /* We can free the temporary variables now. */
1183 1.133 ad kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1184 1.133 ad kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1185 1.57 thorpej
1186 1.11 thorpej /*
1187 1.11 thorpej * The ccd has been successfully initialized, so
1188 1.23 thorpej * we can place it into the array. Don't try to
1189 1.23 thorpej * read the disklabel until the disk has been attached,
1190 1.23 thorpej * because space for the disklabel is allocated
1191 1.23 thorpej * in disk_attach();
1192 1.11 thorpej */
1193 1.11 thorpej ccio->ccio_unit = unit;
1194 1.11 thorpej ccio->ccio_size = cs->sc_size;
1195 1.23 thorpej
1196 1.23 thorpej /* Try and read the disklabel. */
1197 1.11 thorpej ccdgetdisklabel(dev);
1198 1.11 thorpej break;
1199 1.11 thorpej
1200 1.11 thorpej case CCDIOCCLR:
1201 1.11 thorpej /*
1202 1.11 thorpej * Don't unconfigure if any other partitions are open
1203 1.11 thorpej * or if both the character and block flavors of this
1204 1.11 thorpej * partition are open.
1205 1.11 thorpej */
1206 1.11 thorpej part = DISKPART(dev);
1207 1.11 thorpej pmask = (1 << part);
1208 1.11 thorpej if ((cs->sc_dkdev.dk_openmask & ~pmask) ||
1209 1.11 thorpej ((cs->sc_dkdev.dk_bopenmask & pmask) &&
1210 1.15 thorpej (cs->sc_dkdev.dk_copenmask & pmask))) {
1211 1.57 thorpej error = EBUSY;
1212 1.57 thorpej goto out;
1213 1.15 thorpej }
1214 1.88 thorpej
1215 1.133 ad /* Stop new I/O, wait for in-flight I/O to complete. */
1216 1.133 ad mutex_enter(cs->sc_iolock);
1217 1.133 ad cs->sc_flags &= ~(CCDF_INITED|CCDF_VLABEL);
1218 1.133 ad cs->sc_zap = true;
1219 1.133 ad while (disk_isbusy(&cs->sc_dkdev) ||
1220 1.133 ad bufq_peek(cs->sc_bufq) != NULL ||
1221 1.133 ad cs->sc_thread != NULL) {
1222 1.133 ad cv_broadcast(&cs->sc_push);
1223 1.133 ad (void)cv_timedwait(&cs->sc_stop, cs->sc_iolock, hz);
1224 1.133 ad }
1225 1.133 ad mutex_exit(cs->sc_iolock);
1226 1.11 thorpej
1227 1.11 thorpej /*
1228 1.11 thorpej * Free ccd_softc information and clear entry.
1229 1.11 thorpej */
1230 1.22 thorpej
1231 1.22 thorpej /* Close the components and free their pathnames. */
1232 1.11 thorpej for (i = 0; i < cs->sc_nccdisks; ++i) {
1233 1.11 thorpej /*
1234 1.11 thorpej * XXX: this close could potentially fail and
1235 1.11 thorpej * cause Bad Things. Maybe we need to force
1236 1.11 thorpej * the close to happen?
1237 1.11 thorpej */
1238 1.11 thorpej #ifdef DEBUG
1239 1.11 thorpej if (ccddebug & CCDB_VNODE)
1240 1.11 thorpej vprint("CCDIOCCLR: vnode info",
1241 1.11 thorpej cs->sc_cinfo[i].ci_vp);
1242 1.11 thorpej #endif
1243 1.11 thorpej (void)vn_close(cs->sc_cinfo[i].ci_vp, FREAD|FWRITE,
1244 1.128 ad uc);
1245 1.133 ad kmem_free(cs->sc_cinfo[i].ci_path,
1246 1.133 ad cs->sc_cinfo[i].ci_pathlen);
1247 1.38 thorpej }
1248 1.38 thorpej
1249 1.22 thorpej /* Free interleave index. */
1250 1.133 ad for (i = 0; cs->sc_itable[i].ii_ndisk; ++i) {
1251 1.133 ad kmem_free(cs->sc_itable[i].ii_index,
1252 1.133 ad cs->sc_itable[i].ii_indexsz);
1253 1.133 ad }
1254 1.22 thorpej
1255 1.22 thorpej /* Free component info and interleave table. */
1256 1.133 ad kmem_free(cs->sc_cinfo, cs->sc_nccdisks *
1257 1.133 ad sizeof(struct ccdcinfo));
1258 1.133 ad kmem_free(cs->sc_itable, (cs->sc_nccdisks + 1) *
1259 1.133 ad sizeof(struct ccdiinfo));
1260 1.15 thorpej
1261 1.23 thorpej /* Detatch the disk. */
1262 1.123 ad disk_detach(&cs->sc_dkdev);
1263 1.133 ad bufq_free(cs->sc_bufq);
1264 1.144 christos ccdput(cs);
1265 1.148 joerg /* Don't break, otherwise cs is read again. */
1266 1.148 joerg return 0;
1267 1.11 thorpej
1268 1.11 thorpej case DIOCGDINFO:
1269 1.23 thorpej *(struct disklabel *)data = *(cs->sc_dkdev.dk_label);
1270 1.11 thorpej break;
1271 1.133 ad
1272 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1273 1.70 fvdl case ODIOCGDINFO:
1274 1.70 fvdl newlabel = *(cs->sc_dkdev.dk_label);
1275 1.70 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
1276 1.71 fvdl return ENOTTY;
1277 1.70 fvdl memcpy(data, &newlabel, sizeof (struct olddisklabel));
1278 1.70 fvdl break;
1279 1.70 fvdl #endif
1280 1.11 thorpej
1281 1.11 thorpej case DIOCGPART:
1282 1.23 thorpej ((struct partinfo *)data)->disklab = cs->sc_dkdev.dk_label;
1283 1.11 thorpej ((struct partinfo *)data)->part =
1284 1.23 thorpej &cs->sc_dkdev.dk_label->d_partitions[DISKPART(dev)];
1285 1.11 thorpej break;
1286 1.11 thorpej
1287 1.100 thorpej case DIOCCACHESYNC:
1288 1.100 thorpej /*
1289 1.100 thorpej * XXX Do we really need to care about having a writable
1290 1.100 thorpej * file descriptor here?
1291 1.100 thorpej */
1292 1.100 thorpej if ((flag & FWRITE) == 0)
1293 1.100 thorpej return (EBADF);
1294 1.100 thorpej
1295 1.100 thorpej /*
1296 1.100 thorpej * We pass this call down to all components and report
1297 1.100 thorpej * the first error we encounter.
1298 1.100 thorpej */
1299 1.100 thorpej for (error = 0, i = 0; i < cs->sc_nccdisks; i++) {
1300 1.100 thorpej j = VOP_IOCTL(cs->sc_cinfo[i].ci_vp, cmd, data,
1301 1.124 pooka flag, uc);
1302 1.100 thorpej if (j != 0 && error == 0)
1303 1.100 thorpej error = j;
1304 1.100 thorpej }
1305 1.100 thorpej break;
1306 1.100 thorpej
1307 1.11 thorpej case DIOCWDINFO:
1308 1.11 thorpej case DIOCSDINFO:
1309 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1310 1.70 fvdl case ODIOCWDINFO:
1311 1.70 fvdl case ODIOCSDINFO:
1312 1.70 fvdl #endif
1313 1.70 fvdl {
1314 1.70 fvdl struct disklabel *lp;
1315 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1316 1.70 fvdl if (cmd == ODIOCSDINFO || cmd == ODIOCWDINFO) {
1317 1.70 fvdl memset(&newlabel, 0, sizeof newlabel);
1318 1.70 fvdl memcpy(&newlabel, data, sizeof (struct olddisklabel));
1319 1.70 fvdl lp = &newlabel;
1320 1.70 fvdl } else
1321 1.70 fvdl #endif
1322 1.70 fvdl lp = (struct disklabel *)data;
1323 1.70 fvdl
1324 1.11 thorpej cs->sc_flags |= CCDF_LABELLING;
1325 1.11 thorpej
1326 1.23 thorpej error = setdisklabel(cs->sc_dkdev.dk_label,
1327 1.70 fvdl lp, 0, cs->sc_dkdev.dk_cpulabel);
1328 1.11 thorpej if (error == 0) {
1329 1.70 fvdl if (cmd == DIOCWDINFO
1330 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1331 1.70 fvdl || cmd == ODIOCWDINFO
1332 1.70 fvdl #endif
1333 1.70 fvdl )
1334 1.11 thorpej error = writedisklabel(CCDLABELDEV(dev),
1335 1.23 thorpej ccdstrategy, cs->sc_dkdev.dk_label,
1336 1.23 thorpej cs->sc_dkdev.dk_cpulabel);
1337 1.11 thorpej }
1338 1.11 thorpej
1339 1.11 thorpej cs->sc_flags &= ~CCDF_LABELLING;
1340 1.11 thorpej break;
1341 1.70 fvdl }
1342 1.11 thorpej
1343 1.87 thorpej case DIOCKLABEL:
1344 1.87 thorpej if (*(int *)data != 0)
1345 1.87 thorpej cs->sc_flags |= CCDF_KLABEL;
1346 1.87 thorpej else
1347 1.87 thorpej cs->sc_flags &= ~CCDF_KLABEL;
1348 1.87 thorpej break;
1349 1.87 thorpej
1350 1.11 thorpej case DIOCWLABEL:
1351 1.11 thorpej if (*(int *)data != 0)
1352 1.11 thorpej cs->sc_flags |= CCDF_WLABEL;
1353 1.11 thorpej else
1354 1.11 thorpej cs->sc_flags &= ~CCDF_WLABEL;
1355 1.11 thorpej break;
1356 1.11 thorpej
1357 1.44 thorpej case DIOCGDEFLABEL:
1358 1.44 thorpej ccdgetdefaultlabel(cs, (struct disklabel *)data);
1359 1.44 thorpej break;
1360 1.70 fvdl
1361 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1362 1.70 fvdl case ODIOCGDEFLABEL:
1363 1.70 fvdl ccdgetdefaultlabel(cs, &newlabel);
1364 1.70 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
1365 1.71 fvdl return ENOTTY;
1366 1.70 fvdl memcpy(data, &newlabel, sizeof (struct olddisklabel));
1367 1.70 fvdl break;
1368 1.70 fvdl #endif
1369 1.44 thorpej
1370 1.11 thorpej default:
1371 1.57 thorpej error = ENOTTY;
1372 1.11 thorpej }
1373 1.11 thorpej
1374 1.57 thorpej out:
1375 1.133 ad mutex_exit(&cs->sc_dvlock);
1376 1.57 thorpej return (error);
1377 1.1 hpeyerl }
1378 1.1 hpeyerl
1379 1.97 thorpej static int
1380 1.97 thorpej ccdsize(dev_t dev)
1381 1.1 hpeyerl {
1382 1.11 thorpej struct ccd_softc *cs;
1383 1.40 thorpej struct disklabel *lp;
1384 1.40 thorpej int part, unit, omask, size;
1385 1.40 thorpej
1386 1.40 thorpej unit = ccdunit(dev);
1387 1.144 christos if ((cs = ccdget(unit)) == NULL)
1388 1.144 christos return -1;
1389 1.11 thorpej
1390 1.40 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1391 1.11 thorpej return (-1);
1392 1.11 thorpej
1393 1.11 thorpej part = DISKPART(dev);
1394 1.40 thorpej omask = cs->sc_dkdev.dk_openmask & (1 << part);
1395 1.40 thorpej lp = cs->sc_dkdev.dk_label;
1396 1.11 thorpej
1397 1.107 christos if (omask == 0 && ccdopen(dev, 0, S_IFBLK, curlwp))
1398 1.11 thorpej return (-1);
1399 1.11 thorpej
1400 1.40 thorpej if (lp->d_partitions[part].p_fstype != FS_SWAP)
1401 1.11 thorpej size = -1;
1402 1.11 thorpej else
1403 1.40 thorpej size = lp->d_partitions[part].p_size *
1404 1.40 thorpej (lp->d_secsize / DEV_BSIZE);
1405 1.11 thorpej
1406 1.107 christos if (omask == 0 && ccdclose(dev, 0, S_IFBLK, curlwp))
1407 1.11 thorpej return (-1);
1408 1.1 hpeyerl
1409 1.11 thorpej return (size);
1410 1.1 hpeyerl }
1411 1.1 hpeyerl
1412 1.11 thorpej static void
1413 1.97 thorpej ccdgetdefaultlabel(struct ccd_softc *cs, struct disklabel *lp)
1414 1.11 thorpej {
1415 1.11 thorpej struct ccdgeom *ccg = &cs->sc_geom;
1416 1.11 thorpej
1417 1.72 thorpej memset(lp, 0, sizeof(*lp));
1418 1.11 thorpej
1419 1.11 thorpej lp->d_secperunit = cs->sc_size;
1420 1.11 thorpej lp->d_secsize = ccg->ccg_secsize;
1421 1.11 thorpej lp->d_nsectors = ccg->ccg_nsectors;
1422 1.11 thorpej lp->d_ntracks = ccg->ccg_ntracks;
1423 1.11 thorpej lp->d_ncylinders = ccg->ccg_ncylinders;
1424 1.19 thorpej lp->d_secpercyl = lp->d_ntracks * lp->d_nsectors;
1425 1.11 thorpej
1426 1.11 thorpej strncpy(lp->d_typename, "ccd", sizeof(lp->d_typename));
1427 1.11 thorpej lp->d_type = DTYPE_CCD;
1428 1.11 thorpej strncpy(lp->d_packname, "fictitious", sizeof(lp->d_packname));
1429 1.11 thorpej lp->d_rpm = 3600;
1430 1.11 thorpej lp->d_interleave = 1;
1431 1.11 thorpej lp->d_flags = 0;
1432 1.11 thorpej
1433 1.11 thorpej lp->d_partitions[RAW_PART].p_offset = 0;
1434 1.11 thorpej lp->d_partitions[RAW_PART].p_size = cs->sc_size;
1435 1.11 thorpej lp->d_partitions[RAW_PART].p_fstype = FS_UNUSED;
1436 1.11 thorpej lp->d_npartitions = RAW_PART + 1;
1437 1.11 thorpej
1438 1.11 thorpej lp->d_magic = DISKMAGIC;
1439 1.11 thorpej lp->d_magic2 = DISKMAGIC;
1440 1.23 thorpej lp->d_checksum = dkcksum(cs->sc_dkdev.dk_label);
1441 1.44 thorpej }
1442 1.44 thorpej
1443 1.44 thorpej /*
1444 1.44 thorpej * Read the disklabel from the ccd. If one is not present, fake one
1445 1.44 thorpej * up.
1446 1.44 thorpej */
1447 1.44 thorpej static void
1448 1.97 thorpej ccdgetdisklabel(dev_t dev)
1449 1.44 thorpej {
1450 1.44 thorpej int unit = ccdunit(dev);
1451 1.144 christos struct ccd_softc *cs;
1452 1.85 dsl const char *errstring;
1453 1.144 christos struct disklabel *lp;
1454 1.144 christos struct cpu_disklabel *clp;
1455 1.44 thorpej
1456 1.144 christos if ((cs = ccdget(unit)) == NULL)
1457 1.144 christos return;
1458 1.144 christos lp = cs->sc_dkdev.dk_label;
1459 1.144 christos clp = cs->sc_dkdev.dk_cpulabel;
1460 1.133 ad KASSERT(mutex_owned(&cs->sc_dvlock));
1461 1.133 ad
1462 1.72 thorpej memset(clp, 0, sizeof(*clp));
1463 1.44 thorpej
1464 1.44 thorpej ccdgetdefaultlabel(cs, lp);
1465 1.11 thorpej
1466 1.11 thorpej /*
1467 1.11 thorpej * Call the generic disklabel extraction routine.
1468 1.11 thorpej */
1469 1.133 ad cs->sc_flags |= CCDF_RLABEL;
1470 1.92 lukem if ((cs->sc_flags & CCDF_NOLABEL) != 0)
1471 1.92 lukem errstring = "CCDF_NOLABEL set; ignoring on-disk label";
1472 1.92 lukem else
1473 1.92 lukem errstring = readdisklabel(CCDLABELDEV(dev), ccdstrategy,
1474 1.92 lukem cs->sc_dkdev.dk_label, cs->sc_dkdev.dk_cpulabel);
1475 1.29 christos if (errstring)
1476 1.11 thorpej ccdmakedisklabel(cs);
1477 1.47 enami else {
1478 1.47 enami int i;
1479 1.47 enami struct partition *pp;
1480 1.47 enami
1481 1.47 enami /*
1482 1.47 enami * Sanity check whether the found disklabel is valid.
1483 1.47 enami *
1484 1.47 enami * This is necessary since total size of ccd may vary
1485 1.47 enami * when an interleave is changed even though exactly
1486 1.47 enami * same componets are used, and old disklabel may used
1487 1.47 enami * if that is found.
1488 1.47 enami */
1489 1.47 enami if (lp->d_secperunit != cs->sc_size)
1490 1.47 enami printf("WARNING: %s: "
1491 1.47 enami "total sector size in disklabel (%d) != "
1492 1.60 thorpej "the size of ccd (%lu)\n", cs->sc_xname,
1493 1.60 thorpej lp->d_secperunit, (u_long)cs->sc_size);
1494 1.47 enami for (i = 0; i < lp->d_npartitions; i++) {
1495 1.47 enami pp = &lp->d_partitions[i];
1496 1.47 enami if (pp->p_offset + pp->p_size > cs->sc_size)
1497 1.48 enami printf("WARNING: %s: end of partition `%c' "
1498 1.60 thorpej "exceeds the size of ccd (%lu)\n",
1499 1.60 thorpej cs->sc_xname, 'a' + i, (u_long)cs->sc_size);
1500 1.47 enami }
1501 1.47 enami }
1502 1.11 thorpej
1503 1.11 thorpej #ifdef DEBUG
1504 1.11 thorpej /* It's actually extremely common to have unlabeled ccds. */
1505 1.11 thorpej if (ccddebug & CCDB_LABEL)
1506 1.11 thorpej if (errstring != NULL)
1507 1.35 christos printf("%s: %s\n", cs->sc_xname, errstring);
1508 1.11 thorpej #endif
1509 1.87 thorpej
1510 1.87 thorpej /* In-core label now valid. */
1511 1.133 ad cs->sc_flags = (cs->sc_flags | CCDF_VLABEL) & ~CCDF_RLABEL;
1512 1.11 thorpej }
1513 1.11 thorpej
1514 1.11 thorpej /*
1515 1.11 thorpej * Take care of things one might want to take care of in the event
1516 1.11 thorpej * that a disklabel isn't present.
1517 1.11 thorpej */
1518 1.11 thorpej static void
1519 1.97 thorpej ccdmakedisklabel(struct ccd_softc *cs)
1520 1.11 thorpej {
1521 1.23 thorpej struct disklabel *lp = cs->sc_dkdev.dk_label;
1522 1.11 thorpej
1523 1.11 thorpej /*
1524 1.11 thorpej * For historical reasons, if there's no disklabel present
1525 1.11 thorpej * the raw partition must be marked FS_BSDFFS.
1526 1.11 thorpej */
1527 1.11 thorpej lp->d_partitions[RAW_PART].p_fstype = FS_BSDFFS;
1528 1.11 thorpej
1529 1.11 thorpej strncpy(lp->d_packname, "default label", sizeof(lp->d_packname));
1530 1.44 thorpej
1531 1.44 thorpej lp->d_checksum = dkcksum(lp);
1532 1.11 thorpej }
1533 1.11 thorpej
#ifdef DEBUG
/*
 * Debug helper: print every entry of an interleave table, stopping at
 * the terminating entry whose ii_ndisk is zero.
 */
static void
printiinfo(struct ccdiinfo *ii)
{
	int entry = 0;

	while (ii->ii_ndisk) {
		int d;

		printf(" itab[%d]: #dk %d sblk %" PRId64 " soff %" PRId64,
		    entry, ii->ii_ndisk, ii->ii_startblk, ii->ii_startoff);
		for (d = 0; d < ii->ii_ndisk; d++)
			printf(" %d", ii->ii_index[d]);
		printf("\n");

		entry++;
		ii++;
	}
}
#endif
1549 1.134 haad
1550 1.146 pgoyette MODULE(MODULE_CLASS_DRIVER, ccd, "dk_subr");
1551 1.134 haad
1552 1.134 haad static int
1553 1.134 haad ccd_modcmd(modcmd_t cmd, void *arg)
1554 1.134 haad {
1555 1.145 martin int error = 0;
1556 1.145 martin #ifdef _MODULE
1557 1.145 martin int bmajor = -1, cmajor = -1;
1558 1.145 martin #endif
1559 1.140 jruoho
1560 1.140 jruoho
1561 1.134 haad switch (cmd) {
1562 1.134 haad case MODULE_CMD_INIT:
1563 1.140 jruoho #ifdef _MODULE
1564 1.134 haad ccdattach(4);
1565 1.140 jruoho
1566 1.134 haad return devsw_attach("ccd", &ccd_bdevsw, &bmajor,
1567 1.134 haad &ccd_cdevsw, &cmajor);
1568 1.140 jruoho #endif
1569 1.134 haad break;
1570 1.134 haad
1571 1.134 haad case MODULE_CMD_FINI:
1572 1.140 jruoho #ifdef _MODULE
1573 1.134 haad return devsw_detach(&ccd_bdevsw, &ccd_cdevsw);
1574 1.140 jruoho #endif
1575 1.134 haad break;
1576 1.134 haad
1577 1.134 haad case MODULE_CMD_STAT:
1578 1.134 haad return ENOTTY;
1579 1.134 haad
1580 1.134 haad default:
1581 1.134 haad return ENOTTY;
1582 1.134 haad }
1583 1.134 haad
1584 1.134 haad return error;
1585 1.134 haad }
1586 1.144 christos
1587 1.144 christos static int
1588 1.144 christos ccd_units_sysctl(SYSCTLFN_ARGS)
1589 1.144 christos {
1590 1.144 christos struct sysctlnode node;
1591 1.144 christos struct ccd_softc *sc;
1592 1.144 christos int error, i, nccd, *units;
1593 1.144 christos size_t size;
1594 1.144 christos
1595 1.144 christos nccd = 0;
1596 1.144 christos mutex_enter(&ccd_lock);
1597 1.144 christos LIST_FOREACH(sc, &ccds, sc_link)
1598 1.144 christos nccd++;
1599 1.144 christos mutex_exit(&ccd_lock);
1600 1.144 christos
1601 1.144 christos if (nccd != 0) {
1602 1.144 christos size = nccd * sizeof(*units);
1603 1.144 christos units = kmem_zalloc(size, KM_SLEEP);
1604 1.144 christos if (units == NULL)
1605 1.144 christos return ENOMEM;
1606 1.144 christos
1607 1.144 christos i = 0;
1608 1.144 christos mutex_enter(&ccd_lock);
1609 1.144 christos LIST_FOREACH(sc, &ccds, sc_link) {
1610 1.144 christos if (i >= nccd)
1611 1.144 christos break;
1612 1.144 christos units[i] = sc->sc_unit;
1613 1.144 christos }
1614 1.144 christos mutex_exit(&ccd_lock);
1615 1.144 christos } else {
1616 1.144 christos units = NULL;
1617 1.144 christos size = 0;
1618 1.144 christos }
1619 1.144 christos
1620 1.144 christos node = *rnode;
1621 1.144 christos node.sysctl_data = units;
1622 1.144 christos node.sysctl_size = size;
1623 1.144 christos
1624 1.144 christos error = sysctl_lookup(SYSCTLFN_CALL(&node));
1625 1.144 christos if (units)
1626 1.144 christos kmem_free(units, size);
1627 1.144 christos return error;
1628 1.144 christos }
1629 1.144 christos
1630 1.144 christos static int
1631 1.144 christos ccd_info_sysctl(SYSCTLFN_ARGS)
1632 1.144 christos {
1633 1.144 christos struct sysctlnode node;
1634 1.144 christos struct ccddiskinfo ccd;
1635 1.144 christos struct ccd_softc *sc;
1636 1.144 christos int unit;
1637 1.144 christos
1638 1.144 christos if (newp == NULL || newlen != sizeof(int))
1639 1.144 christos return EINVAL;
1640 1.144 christos
1641 1.144 christos unit = *(const int *)newp;
1642 1.144 christos newp = NULL;
1643 1.144 christos newlen = 0;
1644 1.144 christos ccd.ccd_ndisks = ~0;
1645 1.144 christos mutex_enter(&ccd_lock);
1646 1.144 christos LIST_FOREACH(sc, &ccds, sc_link) {
1647 1.144 christos if (sc->sc_unit == unit) {
1648 1.144 christos ccd.ccd_ileave = sc->sc_ileave;
1649 1.144 christos ccd.ccd_size = sc->sc_size;
1650 1.144 christos ccd.ccd_ndisks = sc->sc_nccdisks;
1651 1.144 christos ccd.ccd_flags = sc->sc_flags;
1652 1.144 christos break;
1653 1.144 christos }
1654 1.144 christos }
1655 1.144 christos mutex_exit(&ccd_lock);
1656 1.144 christos
1657 1.144 christos if (ccd.ccd_ndisks == ~0)
1658 1.144 christos return ENOENT;
1659 1.144 christos
1660 1.144 christos node = *rnode;
1661 1.144 christos node.sysctl_data = &ccd;
1662 1.144 christos node.sysctl_size = sizeof(ccd);
1663 1.144 christos
1664 1.144 christos return sysctl_lookup(SYSCTLFN_CALL(&node));
1665 1.144 christos }
1666 1.144 christos
1667 1.144 christos static int
1668 1.144 christos ccd_components_sysctl(SYSCTLFN_ARGS)
1669 1.144 christos {
1670 1.144 christos struct sysctlnode node;
1671 1.144 christos int error, unit;
1672 1.144 christos size_t size;
1673 1.144 christos char *names, *p, *ep;
1674 1.144 christos struct ccd_softc *sc;
1675 1.144 christos
1676 1.144 christos if (newp == NULL || newlen != sizeof(int))
1677 1.144 christos return EINVAL;
1678 1.144 christos
1679 1.144 christos size = 0;
1680 1.144 christos unit = *(const int *)newp;
1681 1.144 christos newp = NULL;
1682 1.144 christos newlen = 0;
1683 1.144 christos mutex_enter(&ccd_lock);
1684 1.144 christos LIST_FOREACH(sc, &ccds, sc_link)
1685 1.144 christos if (sc->sc_unit == unit) {
1686 1.144 christos for (size_t i = 0; i < sc->sc_nccdisks; i++)
1687 1.144 christos size += strlen(sc->sc_cinfo[i].ci_path) + 1;
1688 1.144 christos break;
1689 1.144 christos }
1690 1.144 christos mutex_exit(&ccd_lock);
1691 1.144 christos
1692 1.144 christos if (size == 0)
1693 1.144 christos return ENOENT;
1694 1.144 christos names = kmem_zalloc(size, KM_SLEEP);
1695 1.144 christos if (names == NULL)
1696 1.144 christos return ENOMEM;
1697 1.144 christos
1698 1.144 christos p = names;
1699 1.144 christos ep = names + size;
1700 1.144 christos mutex_enter(&ccd_lock);
1701 1.144 christos LIST_FOREACH(sc, &ccds, sc_link)
1702 1.144 christos if (sc->sc_unit == unit) {
1703 1.144 christos for (size_t i = 0; i < sc->sc_nccdisks; i++) {
1704 1.144 christos char *d = sc->sc_cinfo[i].ci_path;
1705 1.144 christos while (p < ep && (*p++ = *d++) != '\0')
1706 1.144 christos continue;
1707 1.144 christos }
1708 1.144 christos break;
1709 1.144 christos }
1710 1.144 christos mutex_exit(&ccd_lock);
1711 1.144 christos
1712 1.144 christos node = *rnode;
1713 1.144 christos node.sysctl_data = names;
1714 1.144 christos node.sysctl_size = ep - names;
1715 1.144 christos
1716 1.144 christos error = sysctl_lookup(SYSCTLFN_CALL(&node));
1717 1.144 christos kmem_free(names, size);
1718 1.144 christos return error;
1719 1.144 christos }
1720 1.144 christos
1721 1.144 christos SYSCTL_SETUP(sysctl_kern_ccd_setup, "sysctl kern.ccd subtree setup")
1722 1.144 christos {
1723 1.144 christos const struct sysctlnode *node = NULL;
1724 1.144 christos
1725 1.144 christos sysctl_createv(clog, 0, NULL, &node,
1726 1.144 christos CTLFLAG_PERMANENT,
1727 1.144 christos CTLTYPE_NODE, "ccd",
1728 1.144 christos SYSCTL_DESCR("ConCatenated Disk state"),
1729 1.144 christos NULL, 0, NULL, 0,
1730 1.144 christos CTL_KERN, CTL_CREATE, CTL_EOL);
1731 1.144 christos
1732 1.144 christos if (node == NULL)
1733 1.144 christos return;
1734 1.144 christos
1735 1.144 christos sysctl_createv(clog, 0, &node, NULL,
1736 1.144 christos CTLFLAG_PERMANENT | CTLFLAG_READONLY,
1737 1.144 christos CTLTYPE_STRUCT, "units",
1738 1.144 christos SYSCTL_DESCR("List of ccd unit numbers"),
1739 1.144 christos ccd_units_sysctl, 0, NULL, 0,
1740 1.144 christos CTL_CREATE, CTL_EOL);
1741 1.144 christos sysctl_createv(clog, 0, &node, NULL,
1742 1.144 christos CTLFLAG_PERMANENT | CTLFLAG_READWRITE,
1743 1.144 christos CTLTYPE_STRUCT, "info",
1744 1.144 christos SYSCTL_DESCR("Information about a CCD unit"),
1745 1.144 christos ccd_info_sysctl, 0, NULL, 0,
1746 1.144 christos CTL_CREATE, CTL_EOL);
1747 1.144 christos sysctl_createv(clog, 0, &node, NULL,
1748 1.144 christos CTLFLAG_PERMANENT | CTLFLAG_READWRITE,
1749 1.144 christos CTLTYPE_STRUCT, "components",
1750 1.144 christos SYSCTL_DESCR("Information about CCD components"),
1751 1.144 christos ccd_components_sysctl, 0, NULL, 0,
1752 1.144 christos CTL_CREATE, CTL_EOL);
1753 1.144 christos }
1754