ccd.c revision 1.149 1 1.149 hannken /* $NetBSD: ccd.c,v 1.149 2014/06/14 07:39:00 hannken Exp $ */
2 1.11 thorpej
3 1.28 thorpej /*-
4 1.133 ad * Copyright (c) 1996, 1997, 1998, 1999, 2007, 2009 The NetBSD Foundation, Inc.
5 1.11 thorpej * All rights reserved.
6 1.11 thorpej *
7 1.28 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.133 ad * by Jason R. Thorpe, and by Andrew Doran.
9 1.28 thorpej *
10 1.11 thorpej * Redistribution and use in source and binary forms, with or without
11 1.11 thorpej * modification, are permitted provided that the following conditions
12 1.11 thorpej * are met:
13 1.11 thorpej * 1. Redistributions of source code must retain the above copyright
14 1.11 thorpej * notice, this list of conditions and the following disclaimer.
15 1.11 thorpej * 2. Redistributions in binary form must reproduce the above copyright
16 1.11 thorpej * notice, this list of conditions and the following disclaimer in the
17 1.11 thorpej * documentation and/or other materials provided with the distribution.
18 1.11 thorpej *
19 1.28 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.28 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.28 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.45 jtc * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.45 jtc * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.28 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.28 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.28 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.28 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.28 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.28 thorpej * POSSIBILITY OF SUCH DAMAGE.
30 1.11 thorpej */
31 1.2 cgd
32 1.1 hpeyerl /*
33 1.138 rmind * Copyright (c) 1988 University of Utah.
34 1.3 hpeyerl * Copyright (c) 1990, 1993
35 1.3 hpeyerl * The Regents of the University of California. All rights reserved.
36 1.1 hpeyerl *
37 1.1 hpeyerl * This code is derived from software contributed to Berkeley by
38 1.1 hpeyerl * the Systems Programming Group of the University of Utah Computer
39 1.1 hpeyerl * Science Department.
40 1.1 hpeyerl *
41 1.1 hpeyerl * Redistribution and use in source and binary forms, with or without
42 1.1 hpeyerl * modification, are permitted provided that the following conditions
43 1.1 hpeyerl * are met:
44 1.1 hpeyerl * 1. Redistributions of source code must retain the above copyright
45 1.1 hpeyerl * notice, this list of conditions and the following disclaimer.
46 1.1 hpeyerl * 2. Redistributions in binary form must reproduce the above copyright
47 1.1 hpeyerl * notice, this list of conditions and the following disclaimer in the
48 1.1 hpeyerl * documentation and/or other materials provided with the distribution.
49 1.91 agc * 3. Neither the name of the University nor the names of its contributors
50 1.91 agc * may be used to endorse or promote products derived from this software
51 1.91 agc * without specific prior written permission.
52 1.91 agc *
53 1.91 agc * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
54 1.91 agc * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
55 1.91 agc * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
56 1.91 agc * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
57 1.91 agc * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
58 1.91 agc * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
59 1.91 agc * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
60 1.91 agc * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
61 1.91 agc * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
62 1.91 agc * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
63 1.91 agc * SUCH DAMAGE.
64 1.91 agc *
65 1.91 agc * from: Utah $Hdr: cd.c 1.6 90/11/28$
66 1.91 agc *
67 1.91 agc * @(#)cd.c 8.2 (Berkeley) 11/16/93
68 1.91 agc */
69 1.91 agc
70 1.91 agc /*
71 1.1 hpeyerl * "Concatenated" disk driver.
72 1.11 thorpej *
73 1.133 ad * Notes on concurrency:
74 1.133 ad *
75 1.133 ad * => sc_dvlock serializes access to the device nodes, excluding block I/O.
76 1.133 ad *
77 1.133 ad * => sc_iolock serializes access to (sc_flags & CCDF_INITED), disk stats,
78 1.133 ad * sc_stop, sc_bufq and b_resid from master buffers.
79 1.133 ad *
80 1.133 ad * => a combination of CCDF_INITED, sc_inflight, and sc_iolock is used to
81 1.133 ad * serialize I/O and configuration changes.
82 1.133 ad *
83 1.133 ad * => the in-core disk label does not change while the device is open.
84 1.133 ad *
85 1.133 ad * On memory consumption: ccd fans out I/O requests and so needs to
86 1.133 ad * allocate memory. If the system is desperately low on memory, we
87 1.133 ad * single thread I/O.
88 1.1 hpeyerl */
89 1.74 lukem
90 1.74 lukem #include <sys/cdefs.h>
91 1.149 hannken __KERNEL_RCSID(0, "$NetBSD: ccd.c,v 1.149 2014/06/14 07:39:00 hannken Exp $");
92 1.1 hpeyerl
93 1.1 hpeyerl #include <sys/param.h>
94 1.1 hpeyerl #include <sys/systm.h>
95 1.133 ad #include <sys/kernel.h>
96 1.3 hpeyerl #include <sys/proc.h>
97 1.1 hpeyerl #include <sys/errno.h>
98 1.1 hpeyerl #include <sys/buf.h>
99 1.133 ad #include <sys/kmem.h>
100 1.63 thorpej #include <sys/pool.h>
101 1.140 jruoho #include <sys/module.h>
102 1.11 thorpej #include <sys/namei.h>
103 1.3 hpeyerl #include <sys/stat.h>
104 1.3 hpeyerl #include <sys/ioctl.h>
105 1.3 hpeyerl #include <sys/disklabel.h>
106 1.11 thorpej #include <sys/device.h>
107 1.11 thorpej #include <sys/disk.h>
108 1.11 thorpej #include <sys/syslog.h>
109 1.3 hpeyerl #include <sys/fcntl.h>
110 1.11 thorpej #include <sys/vnode.h>
111 1.31 christos #include <sys/conf.h>
112 1.117 ad #include <sys/mutex.h>
113 1.56 thorpej #include <sys/queue.h>
114 1.110 elad #include <sys/kauth.h>
115 1.133 ad #include <sys/kthread.h>
116 1.133 ad #include <sys/bufq.h>
117 1.144 christos #include <sys/sysctl.h>
118 1.1 hpeyerl
119 1.135 uebayasi #include <uvm/uvm_extern.h>
120 1.135 uebayasi
121 1.1 hpeyerl #include <dev/ccdvar.h>
122 1.113 christos #include <dev/dkvar.h>
123 1.1 hpeyerl
124 1.149 hannken #include <miscfs/specfs/specdev.h> /* for v_rdev */
125 1.149 hannken
/* CCDDEBUG is the driver-local switch; it turns on the generic DEBUG too. */
#if defined(CCDDEBUG) && !defined(DEBUG)
#define DEBUG
#endif

#ifdef DEBUG
/* Bits tested against ccddebug to select which debug messages are printed. */
#define CCDB_FOLLOW	0x01
#define CCDB_INIT	0x02
#define CCDB_IO		0x04
#define CCDB_LABEL	0x08
#define CCDB_VNODE	0x10
int ccddebug = 0x00;
#endif
138 1.1 hpeyerl
139 1.6 cgd #define ccdunit(x) DISKUNIT(x)
140 1.6 cgd
141 1.6 cgd struct ccdbuf {
142 1.6 cgd struct buf cb_buf; /* new I/O buf */
143 1.6 cgd struct buf *cb_obp; /* ptr. to original I/O buf */
144 1.59 thorpej struct ccd_softc *cb_sc; /* pointer to ccd softc */
145 1.6 cgd int cb_comp; /* target component */
146 1.56 thorpej SIMPLEQ_ENTRY(ccdbuf) cb_q; /* fifo of component buffers */
147 1.38 thorpej };
148 1.24 thorpej
149 1.63 thorpej /* component buffer pool */
150 1.133 ad static pool_cache_t ccd_cache;
151 1.63 thorpej
152 1.133 ad #define CCD_GETBUF() pool_cache_get(ccd_cache, PR_WAITOK)
153 1.133 ad #define CCD_PUTBUF(cbp) pool_cache_put(ccd_cache, cbp)
154 1.1 hpeyerl
155 1.11 thorpej #define CCDLABELDEV(dev) \
156 1.11 thorpej (MAKEDISKDEV(major((dev)), ccdunit((dev)), RAW_PART))
157 1.1 hpeyerl
158 1.11 thorpej /* called by main() at boot time */
159 1.97 thorpej void ccdattach(int);
160 1.11 thorpej
161 1.11 thorpej /* called by biodone() at interrupt time */
162 1.97 thorpej static void ccdiodone(struct buf *);
163 1.11 thorpej
164 1.97 thorpej static void ccdinterleave(struct ccd_softc *);
165 1.97 thorpej static int ccdinit(struct ccd_softc *, char **, struct vnode **,
166 1.107 christos struct lwp *);
167 1.97 thorpej static struct ccdbuf *ccdbuffer(struct ccd_softc *, struct buf *,
168 1.118 christos daddr_t, void *, long);
169 1.97 thorpej static void ccdgetdefaultlabel(struct ccd_softc *, struct disklabel *);
170 1.97 thorpej static void ccdgetdisklabel(dev_t);
171 1.97 thorpej static void ccdmakedisklabel(struct ccd_softc *);
172 1.133 ad static void ccdstart(struct ccd_softc *);
173 1.133 ad static void ccdthread(void *);
174 1.97 thorpej
175 1.97 thorpej static dev_type_open(ccdopen);
176 1.97 thorpej static dev_type_close(ccdclose);
177 1.97 thorpej static dev_type_read(ccdread);
178 1.97 thorpej static dev_type_write(ccdwrite);
179 1.97 thorpej static dev_type_ioctl(ccdioctl);
180 1.97 thorpej static dev_type_strategy(ccdstrategy);
181 1.97 thorpej static dev_type_size(ccdsize);
182 1.78 gehenna
183 1.78 gehenna const struct bdevsw ccd_bdevsw = {
184 1.133 ad .d_open = ccdopen,
185 1.133 ad .d_close = ccdclose,
186 1.133 ad .d_strategy = ccdstrategy,
187 1.133 ad .d_ioctl = ccdioctl,
188 1.133 ad .d_dump = nodump,
189 1.133 ad .d_psize = ccdsize,
190 1.133 ad .d_flag = D_DISK | D_MPSAFE
191 1.78 gehenna };
192 1.78 gehenna
193 1.78 gehenna const struct cdevsw ccd_cdevsw = {
194 1.133 ad .d_open = ccdopen,
195 1.133 ad .d_close = ccdclose,
196 1.133 ad .d_read = ccdread,
197 1.133 ad .d_write = ccdwrite,
198 1.133 ad .d_ioctl = ccdioctl,
199 1.133 ad .d_stop = nostop,
200 1.133 ad .d_tty = notty,
201 1.133 ad .d_poll = nopoll,
202 1.133 ad .d_mmap = nommap,
203 1.133 ad .d_kqfilter = nokqfilter,
204 1.133 ad .d_flag = D_DISK | D_MPSAFE
205 1.78 gehenna };
206 1.3 hpeyerl
207 1.11 thorpej #ifdef DEBUG
208 1.97 thorpej static void printiinfo(struct ccdiinfo *);
209 1.11 thorpej #endif
210 1.11 thorpej
211 1.144 christos static LIST_HEAD(, ccd_softc) ccds = LIST_HEAD_INITIALIZER(ccds);
212 1.144 christos static kmutex_t ccd_lock;
213 1.144 christos
214 1.144 christos static struct ccd_softc *
215 1.144 christos ccdcreate(int unit) {
216 1.144 christos struct ccd_softc *sc = kmem_zalloc(sizeof(*sc), KM_SLEEP);
217 1.144 christos if (sc == NULL) {
218 1.144 christos #ifdef DIAGNOSTIC
219 1.144 christos printf("%s: out of memory\n", __func__);
220 1.144 christos #endif
221 1.144 christos return NULL;
222 1.144 christos }
223 1.144 christos /* Initialize per-softc structures. */
224 1.144 christos snprintf(sc->sc_xname, sizeof(sc->sc_xname), "ccd%d", unit);
225 1.144 christos mutex_init(&sc->sc_dvlock, MUTEX_DEFAULT, IPL_NONE);
226 1.144 christos sc->sc_iolock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NONE);
227 1.144 christos cv_init(&sc->sc_stop, "ccdstop");
228 1.144 christos cv_init(&sc->sc_push, "ccdthr");
229 1.144 christos disk_init(&sc->sc_dkdev, sc->sc_xname, NULL); /* XXX */
230 1.144 christos return sc;
231 1.144 christos }
232 1.144 christos
233 1.144 christos static void
234 1.144 christos ccddestroy(struct ccd_softc *sc) {
235 1.144 christos mutex_obj_free(sc->sc_iolock);
236 1.148 joerg mutex_exit(&sc->sc_dvlock);
237 1.144 christos mutex_destroy(&sc->sc_dvlock);
238 1.144 christos cv_destroy(&sc->sc_stop);
239 1.144 christos cv_destroy(&sc->sc_push);
240 1.144 christos disk_destroy(&sc->sc_dkdev);
241 1.144 christos kmem_free(sc, sizeof(*sc));
242 1.144 christos }
243 1.144 christos
244 1.144 christos static struct ccd_softc *
245 1.144 christos ccdget(int unit) {
246 1.144 christos struct ccd_softc *sc;
247 1.144 christos if (unit < 0) {
248 1.144 christos #ifdef DIAGNOSTIC
249 1.144 christos panic("%s: unit %d!", __func__, unit);
250 1.144 christos #endif
251 1.144 christos return NULL;
252 1.144 christos }
253 1.144 christos mutex_enter(&ccd_lock);
254 1.144 christos LIST_FOREACH(sc, &ccds, sc_link) {
255 1.144 christos if (sc->sc_unit == unit) {
256 1.144 christos mutex_exit(&ccd_lock);
257 1.144 christos return sc;
258 1.144 christos }
259 1.144 christos }
260 1.144 christos mutex_exit(&ccd_lock);
261 1.144 christos if ((sc = ccdcreate(unit)) == NULL)
262 1.144 christos return NULL;
263 1.144 christos mutex_enter(&ccd_lock);
264 1.144 christos LIST_INSERT_HEAD(&ccds, sc, sc_link);
265 1.144 christos mutex_exit(&ccd_lock);
266 1.144 christos return sc;
267 1.144 christos }
268 1.144 christos
269 1.144 christos static void
270 1.144 christos ccdput(struct ccd_softc *sc) {
271 1.144 christos mutex_enter(&ccd_lock);
272 1.144 christos LIST_REMOVE(sc, sc_link);
273 1.144 christos mutex_exit(&ccd_lock);
274 1.144 christos ccddestroy(sc);
275 1.144 christos }
276 1.1 hpeyerl
277 1.3 hpeyerl /*
278 1.11 thorpej * Called by main() during pseudo-device attachment. All we need
279 1.11 thorpej * to do is allocate enough space for devices to be configured later.
280 1.1 hpeyerl */
281 1.1 hpeyerl void
282 1.97 thorpej ccdattach(int num)
283 1.3 hpeyerl {
284 1.144 christos mutex_init(&ccd_lock, MUTEX_DEFAULT, IPL_NONE);
285 1.57 thorpej
286 1.63 thorpej /* Initialize the component buffer pool. */
287 1.133 ad ccd_cache = pool_cache_init(sizeof(struct ccdbuf), 0,
288 1.133 ad 0, 0, "ccdbuf", NULL, IPL_BIO, NULL, NULL, NULL);
289 1.1 hpeyerl }
290 1.1 hpeyerl
291 1.11 thorpej static int
292 1.97 thorpej ccdinit(struct ccd_softc *cs, char **cpaths, struct vnode **vpp,
293 1.107 christos struct lwp *l)
294 1.1 hpeyerl {
295 1.68 augustss struct ccdcinfo *ci = NULL;
296 1.68 augustss int ix;
297 1.11 thorpej struct ccdgeom *ccg = &cs->sc_geom;
298 1.111 christos char *tmppath;
299 1.67 enami int error, path_alloced;
300 1.143 christos uint64_t psize, minsize;
301 1.143 christos unsigned secsize, maxsecsize;
302 1.1 hpeyerl
303 1.1 hpeyerl #ifdef DEBUG
304 1.3 hpeyerl if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
305 1.59 thorpej printf("%s: ccdinit\n", cs->sc_xname);
306 1.1 hpeyerl #endif
307 1.11 thorpej
308 1.11 thorpej /* Allocate space for the component info. */
309 1.133 ad cs->sc_cinfo = kmem_alloc(cs->sc_nccdisks * sizeof(*cs->sc_cinfo),
310 1.133 ad KM_SLEEP);
311 1.133 ad tmppath = kmem_alloc(MAXPATHLEN, KM_SLEEP);
312 1.111 christos
313 1.57 thorpej cs->sc_size = 0;
314 1.57 thorpej
315 1.1 hpeyerl /*
316 1.1 hpeyerl * Verify that each component piece exists and record
317 1.1 hpeyerl * relevant information about it.
318 1.1 hpeyerl */
319 1.11 thorpej maxsecsize = 0;
320 1.1 hpeyerl minsize = 0;
321 1.67 enami for (ix = 0, path_alloced = 0; ix < cs->sc_nccdisks; ix++) {
322 1.1 hpeyerl ci = &cs->sc_cinfo[ix];
323 1.57 thorpej ci->ci_vp = vpp[ix];
324 1.11 thorpej
325 1.11 thorpej /*
326 1.11 thorpej * Copy in the pathname of the component.
327 1.11 thorpej */
328 1.141 joerg memset(tmppath, 0, MAXPATHLEN); /* sanity */
329 1.29 christos error = copyinstr(cpaths[ix], tmppath,
330 1.29 christos MAXPATHLEN, &ci->ci_pathlen);
331 1.133 ad if (ci->ci_pathlen == 0)
332 1.133 ad error = EINVAL;
333 1.29 christos if (error) {
334 1.11 thorpej #ifdef DEBUG
335 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
336 1.35 christos printf("%s: can't copy path, error = %d\n",
337 1.23 thorpej cs->sc_xname, error);
338 1.11 thorpej #endif
339 1.67 enami goto out;
340 1.11 thorpej }
341 1.133 ad ci->ci_path = kmem_alloc(ci->ci_pathlen, KM_SLEEP);
342 1.72 thorpej memcpy(ci->ci_path, tmppath, ci->ci_pathlen);
343 1.67 enami path_alloced++;
344 1.11 thorpej
345 1.11 thorpej /*
346 1.11 thorpej * XXX: Cache the component's dev_t.
347 1.11 thorpej */
348 1.149 hannken ci->ci_dev = vpp[ix]->v_rdev;
349 1.11 thorpej
350 1.3 hpeyerl /*
351 1.11 thorpej * Get partition information for the component.
352 1.3 hpeyerl */
353 1.143 christos error = getdisksize(vpp[ix], &psize, &secsize);
354 1.29 christos if (error) {
355 1.11 thorpej #ifdef DEBUG
356 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
357 1.143 christos printf("%s: %s: disksize failed, error = %d\n",
358 1.23 thorpej cs->sc_xname, ci->ci_path, error);
359 1.11 thorpej #endif
360 1.67 enami goto out;
361 1.11 thorpej }
362 1.69 enami
363 1.11 thorpej /*
364 1.11 thorpej * Calculate the size, truncating to an interleave
365 1.11 thorpej * boundary if necessary.
366 1.11 thorpej */
367 1.143 christos maxsecsize = secsize > maxsecsize ? secsize : maxsecsize;
368 1.1 hpeyerl if (cs->sc_ileave > 1)
369 1.143 christos psize -= psize % cs->sc_ileave;
370 1.11 thorpej
371 1.143 christos if (psize == 0) {
372 1.11 thorpej #ifdef DEBUG
373 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
374 1.35 christos printf("%s: %s: size == 0\n",
375 1.23 thorpej cs->sc_xname, ci->ci_path);
376 1.11 thorpej #endif
377 1.67 enami error = ENODEV;
378 1.67 enami goto out;
379 1.3 hpeyerl }
380 1.11 thorpej
381 1.143 christos if (minsize == 0 || psize < minsize)
382 1.143 christos minsize = psize;
383 1.143 christos ci->ci_size = psize;
384 1.143 christos cs->sc_size += psize;
385 1.1 hpeyerl }
386 1.11 thorpej
387 1.11 thorpej /*
388 1.11 thorpej * Don't allow the interleave to be smaller than
389 1.11 thorpej * the biggest component sector.
390 1.11 thorpej */
391 1.11 thorpej if ((cs->sc_ileave > 0) &&
392 1.11 thorpej (cs->sc_ileave < (maxsecsize / DEV_BSIZE))) {
393 1.11 thorpej #ifdef DEBUG
394 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
395 1.35 christos printf("%s: interleave must be at least %d\n",
396 1.23 thorpej cs->sc_xname, (maxsecsize / DEV_BSIZE));
397 1.11 thorpej #endif
398 1.67 enami error = EINVAL;
399 1.67 enami goto out;
400 1.11 thorpej }
401 1.11 thorpej
402 1.1 hpeyerl /*
403 1.1 hpeyerl * If uniform interleave is desired set all sizes to that of
404 1.1 hpeyerl * the smallest component.
405 1.1 hpeyerl */
406 1.57 thorpej if (cs->sc_flags & CCDF_UNIFORM) {
407 1.1 hpeyerl for (ci = cs->sc_cinfo;
408 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
409 1.1 hpeyerl ci->ci_size = minsize;
410 1.24 thorpej
411 1.53 thorpej cs->sc_size = cs->sc_nccdisks * minsize;
412 1.1 hpeyerl }
413 1.11 thorpej
414 1.11 thorpej /*
415 1.11 thorpej * Construct the interleave table.
416 1.11 thorpej */
417 1.57 thorpej ccdinterleave(cs);
418 1.11 thorpej
419 1.1 hpeyerl /*
420 1.11 thorpej * Create pseudo-geometry based on 1MB cylinders. It's
421 1.11 thorpej * pretty close.
422 1.1 hpeyerl */
423 1.11 thorpej ccg->ccg_secsize = DEV_BSIZE;
424 1.19 thorpej ccg->ccg_ntracks = 1;
425 1.11 thorpej ccg->ccg_nsectors = 1024 * (1024 / ccg->ccg_secsize);
426 1.11 thorpej ccg->ccg_ncylinders = cs->sc_size / ccg->ccg_nsectors;
427 1.11 thorpej
428 1.133 ad /*
429 1.133 ad * Create thread to handle deferred I/O.
430 1.133 ad */
431 1.133 ad cs->sc_zap = false;
432 1.133 ad error = kthread_create(PRI_BIO, KTHREAD_MPSAFE, NULL, ccdthread,
433 1.133 ad cs, &cs->sc_thread, "%s", cs->sc_xname);
434 1.133 ad if (error) {
435 1.133 ad printf("ccdinit: can't create thread: %d\n", error);
436 1.133 ad goto out;
437 1.133 ad }
438 1.133 ad
439 1.133 ad /*
440 1.133 ad * Only now that everything is set up can we enable the device.
441 1.133 ad */
442 1.133 ad mutex_enter(cs->sc_iolock);
443 1.11 thorpej cs->sc_flags |= CCDF_INITED;
444 1.133 ad mutex_exit(cs->sc_iolock);
445 1.133 ad kmem_free(tmppath, MAXPATHLEN);
446 1.11 thorpej return (0);
447 1.67 enami
448 1.67 enami out:
449 1.133 ad for (ix = 0; ix < path_alloced; ix++) {
450 1.133 ad kmem_free(cs->sc_cinfo[ix].ci_path,
451 1.133 ad cs->sc_cinfo[ix].ci_pathlen);
452 1.133 ad }
453 1.133 ad kmem_free(cs->sc_cinfo, cs->sc_nccdisks * sizeof(struct ccdcinfo));
454 1.133 ad kmem_free(tmppath, MAXPATHLEN);
455 1.67 enami return (error);
456 1.1 hpeyerl }
457 1.1 hpeyerl
458 1.11 thorpej static void
459 1.97 thorpej ccdinterleave(struct ccd_softc *cs)
460 1.1 hpeyerl {
461 1.68 augustss struct ccdcinfo *ci, *smallci;
462 1.68 augustss struct ccdiinfo *ii;
463 1.68 augustss daddr_t bn, lbn;
464 1.68 augustss int ix;
465 1.1 hpeyerl u_long size;
466 1.1 hpeyerl
467 1.1 hpeyerl #ifdef DEBUG
468 1.3 hpeyerl if (ccddebug & CCDB_INIT)
469 1.35 christos printf("ccdinterleave(%p): ileave %d\n", cs, cs->sc_ileave);
470 1.1 hpeyerl #endif
471 1.1 hpeyerl /*
472 1.1 hpeyerl * Allocate an interleave table.
473 1.1 hpeyerl * Chances are this is too big, but we don't care.
474 1.1 hpeyerl */
475 1.1 hpeyerl size = (cs->sc_nccdisks + 1) * sizeof(struct ccdiinfo);
476 1.133 ad cs->sc_itable = kmem_zalloc(size, KM_SLEEP);
477 1.11 thorpej
478 1.1 hpeyerl /*
479 1.1 hpeyerl * Trivial case: no interleave (actually interleave of disk size).
480 1.11 thorpej * Each table entry represents a single component in its entirety.
481 1.1 hpeyerl */
482 1.1 hpeyerl if (cs->sc_ileave == 0) {
483 1.1 hpeyerl bn = 0;
484 1.1 hpeyerl ii = cs->sc_itable;
485 1.11 thorpej
486 1.1 hpeyerl for (ix = 0; ix < cs->sc_nccdisks; ix++) {
487 1.19 thorpej /* Allocate space for ii_index. */
488 1.133 ad ii->ii_indexsz = sizeof(int);
489 1.133 ad ii->ii_index = kmem_alloc(ii->ii_indexsz, KM_SLEEP);
490 1.1 hpeyerl ii->ii_ndisk = 1;
491 1.1 hpeyerl ii->ii_startblk = bn;
492 1.1 hpeyerl ii->ii_startoff = 0;
493 1.1 hpeyerl ii->ii_index[0] = ix;
494 1.1 hpeyerl bn += cs->sc_cinfo[ix].ci_size;
495 1.1 hpeyerl ii++;
496 1.1 hpeyerl }
497 1.1 hpeyerl ii->ii_ndisk = 0;
498 1.1 hpeyerl #ifdef DEBUG
499 1.3 hpeyerl if (ccddebug & CCDB_INIT)
500 1.1 hpeyerl printiinfo(cs->sc_itable);
501 1.1 hpeyerl #endif
502 1.11 thorpej return;
503 1.1 hpeyerl }
504 1.11 thorpej
505 1.1 hpeyerl /*
506 1.1 hpeyerl * The following isn't fast or pretty; it doesn't have to be.
507 1.1 hpeyerl */
508 1.1 hpeyerl size = 0;
509 1.1 hpeyerl bn = lbn = 0;
510 1.1 hpeyerl for (ii = cs->sc_itable; ; ii++) {
511 1.11 thorpej /* Allocate space for ii_index. */
512 1.133 ad ii->ii_indexsz = sizeof(int) * cs->sc_nccdisks;
513 1.133 ad ii->ii_index = kmem_alloc(ii->ii_indexsz, KM_SLEEP);
514 1.11 thorpej
515 1.1 hpeyerl /*
516 1.1 hpeyerl * Locate the smallest of the remaining components
517 1.1 hpeyerl */
518 1.1 hpeyerl smallci = NULL;
519 1.1 hpeyerl for (ci = cs->sc_cinfo;
520 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
521 1.1 hpeyerl if (ci->ci_size > size &&
522 1.1 hpeyerl (smallci == NULL ||
523 1.1 hpeyerl ci->ci_size < smallci->ci_size))
524 1.1 hpeyerl smallci = ci;
525 1.11 thorpej
526 1.1 hpeyerl /*
527 1.1 hpeyerl * Nobody left, all done
528 1.1 hpeyerl */
529 1.1 hpeyerl if (smallci == NULL) {
530 1.1 hpeyerl ii->ii_ndisk = 0;
531 1.1 hpeyerl break;
532 1.1 hpeyerl }
533 1.11 thorpej
534 1.1 hpeyerl /*
535 1.1 hpeyerl * Record starting logical block and component offset
536 1.1 hpeyerl */
537 1.1 hpeyerl ii->ii_startblk = bn / cs->sc_ileave;
538 1.1 hpeyerl ii->ii_startoff = lbn;
539 1.11 thorpej
540 1.1 hpeyerl /*
541 1.1 hpeyerl * Determine how many disks take part in this interleave
542 1.1 hpeyerl * and record their indices.
543 1.1 hpeyerl */
544 1.1 hpeyerl ix = 0;
545 1.1 hpeyerl for (ci = cs->sc_cinfo;
546 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
547 1.1 hpeyerl if (ci->ci_size >= smallci->ci_size)
548 1.1 hpeyerl ii->ii_index[ix++] = ci - cs->sc_cinfo;
549 1.1 hpeyerl ii->ii_ndisk = ix;
550 1.1 hpeyerl bn += ix * (smallci->ci_size - size);
551 1.1 hpeyerl lbn = smallci->ci_size / cs->sc_ileave;
552 1.1 hpeyerl size = smallci->ci_size;
553 1.1 hpeyerl }
554 1.1 hpeyerl #ifdef DEBUG
555 1.3 hpeyerl if (ccddebug & CCDB_INIT)
556 1.1 hpeyerl printiinfo(cs->sc_itable);
557 1.1 hpeyerl #endif
558 1.1 hpeyerl }
559 1.1 hpeyerl
560 1.11 thorpej /* ARGSUSED */
561 1.97 thorpej static int
562 1.116 christos ccdopen(dev_t dev, int flags, int fmt, struct lwp *l)
563 1.1 hpeyerl {
564 1.1 hpeyerl int unit = ccdunit(dev);
565 1.11 thorpej struct ccd_softc *cs;
566 1.11 thorpej struct disklabel *lp;
567 1.15 thorpej int error = 0, part, pmask;
568 1.1 hpeyerl
569 1.1 hpeyerl #ifdef DEBUG
570 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
571 1.131 cegger printf("ccdopen(0x%"PRIx64", 0x%x)\n", dev, flags);
572 1.1 hpeyerl #endif
573 1.144 christos if ((cs = ccdget(unit)) == NULL)
574 1.144 christos return ENXIO;
575 1.15 thorpej
576 1.133 ad mutex_enter(&cs->sc_dvlock);
577 1.15 thorpej
578 1.23 thorpej lp = cs->sc_dkdev.dk_label;
579 1.11 thorpej
580 1.11 thorpej part = DISKPART(dev);
581 1.11 thorpej pmask = (1 << part);
582 1.11 thorpej
583 1.15 thorpej /*
584 1.15 thorpej * If we're initialized, check to see if there are any other
585 1.15 thorpej * open partitions. If not, then it's safe to update
586 1.87 thorpej * the in-core disklabel. Only read the disklabel if it is
587 1.87 thorpej * not already valid.
588 1.15 thorpej */
589 1.87 thorpej if ((cs->sc_flags & (CCDF_INITED|CCDF_VLABEL)) == CCDF_INITED &&
590 1.87 thorpej cs->sc_dkdev.dk_openmask == 0)
591 1.15 thorpej ccdgetdisklabel(dev);
592 1.15 thorpej
593 1.11 thorpej /* Check that the partition exists. */
594 1.27 thorpej if (part != RAW_PART) {
595 1.27 thorpej if (((cs->sc_flags & CCDF_INITED) == 0) ||
596 1.37 thorpej ((part >= lp->d_npartitions) ||
597 1.27 thorpej (lp->d_partitions[part].p_fstype == FS_UNUSED))) {
598 1.27 thorpej error = ENXIO;
599 1.27 thorpej goto done;
600 1.27 thorpej }
601 1.15 thorpej }
602 1.11 thorpej
603 1.11 thorpej /* Prevent our unit from being unconfigured while open. */
604 1.11 thorpej switch (fmt) {
605 1.11 thorpej case S_IFCHR:
606 1.11 thorpej cs->sc_dkdev.dk_copenmask |= pmask;
607 1.11 thorpej break;
608 1.11 thorpej
609 1.11 thorpej case S_IFBLK:
610 1.11 thorpej cs->sc_dkdev.dk_bopenmask |= pmask;
611 1.11 thorpej break;
612 1.11 thorpej }
613 1.11 thorpej cs->sc_dkdev.dk_openmask =
614 1.11 thorpej cs->sc_dkdev.dk_copenmask | cs->sc_dkdev.dk_bopenmask;
615 1.11 thorpej
616 1.15 thorpej done:
617 1.133 ad mutex_exit(&cs->sc_dvlock);
618 1.33 thorpej return (error);
619 1.7 cgd }
620 1.7 cgd
621 1.11 thorpej /* ARGSUSED */
622 1.97 thorpej static int
623 1.116 christos ccdclose(dev_t dev, int flags, int fmt, struct lwp *l)
624 1.7 cgd {
625 1.11 thorpej int unit = ccdunit(dev);
626 1.11 thorpej struct ccd_softc *cs;
627 1.117 ad int part;
628 1.11 thorpej
629 1.7 cgd #ifdef DEBUG
630 1.7 cgd if (ccddebug & CCDB_FOLLOW)
631 1.131 cegger printf("ccdclose(0x%"PRIx64", 0x%x)\n", dev, flags);
632 1.7 cgd #endif
633 1.11 thorpej
634 1.144 christos if ((cs = ccdget(unit)) == NULL)
635 1.144 christos return ENXIO;
636 1.15 thorpej
637 1.133 ad mutex_enter(&cs->sc_dvlock);
638 1.15 thorpej
639 1.11 thorpej part = DISKPART(dev);
640 1.11 thorpej
641 1.11 thorpej /* ...that much closer to allowing unconfiguration... */
642 1.11 thorpej switch (fmt) {
643 1.11 thorpej case S_IFCHR:
644 1.11 thorpej cs->sc_dkdev.dk_copenmask &= ~(1 << part);
645 1.11 thorpej break;
646 1.11 thorpej
647 1.11 thorpej case S_IFBLK:
648 1.11 thorpej cs->sc_dkdev.dk_bopenmask &= ~(1 << part);
649 1.11 thorpej break;
650 1.11 thorpej }
651 1.11 thorpej cs->sc_dkdev.dk_openmask =
652 1.11 thorpej cs->sc_dkdev.dk_copenmask | cs->sc_dkdev.dk_bopenmask;
653 1.11 thorpej
654 1.87 thorpej if (cs->sc_dkdev.dk_openmask == 0) {
655 1.87 thorpej if ((cs->sc_flags & CCDF_KLABEL) == 0)
656 1.87 thorpej cs->sc_flags &= ~CCDF_VLABEL;
657 1.87 thorpej }
658 1.87 thorpej
659 1.133 ad mutex_exit(&cs->sc_dvlock);
660 1.7 cgd return (0);
661 1.1 hpeyerl }
662 1.1 hpeyerl
663 1.133 ad static bool
664 1.133 ad ccdbackoff(struct ccd_softc *cs)
665 1.133 ad {
666 1.133 ad
667 1.133 ad /* XXX Arbitrary, should be a uvm call. */
668 1.133 ad return uvmexp.free < (uvmexp.freemin >> 1) &&
669 1.133 ad disk_isbusy(&cs->sc_dkdev);
670 1.133 ad }
671 1.133 ad
672 1.133 ad static void
673 1.133 ad ccdthread(void *cookie)
674 1.133 ad {
675 1.133 ad struct ccd_softc *cs;
676 1.133 ad
677 1.133 ad cs = cookie;
678 1.133 ad
679 1.133 ad #ifdef DEBUG
680 1.133 ad if (ccddebug & CCDB_FOLLOW)
681 1.133 ad printf("ccdthread: hello\n");
682 1.133 ad #endif
683 1.133 ad
684 1.133 ad mutex_enter(cs->sc_iolock);
685 1.133 ad while (__predict_true(!cs->sc_zap)) {
686 1.133 ad if (bufq_peek(cs->sc_bufq) == NULL) {
687 1.133 ad /* Nothing to do. */
688 1.133 ad cv_wait(&cs->sc_push, cs->sc_iolock);
689 1.133 ad continue;
690 1.133 ad }
691 1.133 ad if (ccdbackoff(cs)) {
692 1.133 ad /* Wait for memory to become available. */
693 1.133 ad (void)cv_timedwait(&cs->sc_push, cs->sc_iolock, 1);
694 1.133 ad continue;
695 1.133 ad }
696 1.133 ad #ifdef DEBUG
697 1.133 ad if (ccddebug & CCDB_FOLLOW)
698 1.133 ad printf("ccdthread: dispatching I/O\n");
699 1.133 ad #endif
700 1.133 ad ccdstart(cs);
701 1.133 ad mutex_enter(cs->sc_iolock);
702 1.133 ad }
703 1.133 ad cs->sc_thread = NULL;
704 1.133 ad mutex_exit(cs->sc_iolock);
705 1.133 ad #ifdef DEBUG
706 1.133 ad if (ccddebug & CCDB_FOLLOW)
707 1.133 ad printf("ccdthread: goodbye\n");
708 1.133 ad #endif
709 1.133 ad kthread_exit(0);
710 1.133 ad }
711 1.133 ad
712 1.97 thorpej static void
713 1.97 thorpej ccdstrategy(struct buf *bp)
714 1.1 hpeyerl {
715 1.68 augustss int unit = ccdunit(bp->b_dev);
716 1.144 christos struct ccd_softc *cs;
717 1.144 christos if ((cs = ccdget(unit)) == NULL)
718 1.144 christos return;
719 1.133 ad
720 1.133 ad /* Must be open or reading label. */
721 1.133 ad KASSERT(cs->sc_dkdev.dk_openmask != 0 ||
722 1.133 ad (cs->sc_flags & CCDF_RLABEL) != 0);
723 1.133 ad
724 1.133 ad mutex_enter(cs->sc_iolock);
725 1.133 ad /* Synchronize with device init/uninit. */
726 1.133 ad if (__predict_false((cs->sc_flags & CCDF_INITED) == 0)) {
727 1.133 ad mutex_exit(cs->sc_iolock);
728 1.133 ad #ifdef DEBUG
729 1.133 ad if (ccddebug & CCDB_FOLLOW)
730 1.133 ad printf("ccdstrategy: unit %d: not inited\n", unit);
731 1.133 ad #endif
732 1.133 ad bp->b_error = ENXIO;
733 1.133 ad bp->b_resid = bp->b_bcount;
734 1.133 ad biodone(bp);
735 1.133 ad return;
736 1.133 ad }
737 1.133 ad
738 1.133 ad /* Defer to thread if system is low on memory. */
739 1.133 ad bufq_put(cs->sc_bufq, bp);
740 1.133 ad if (__predict_false(ccdbackoff(cs))) {
741 1.133 ad mutex_exit(cs->sc_iolock);
742 1.133 ad #ifdef DEBUG
743 1.133 ad if (ccddebug & CCDB_FOLLOW)
744 1.133 ad printf("ccdstrategy: holding off on I/O\n");
745 1.133 ad #endif
746 1.133 ad return;
747 1.133 ad }
748 1.133 ad ccdstart(cs);
749 1.133 ad }
750 1.133 ad
751 1.133 ad static void
752 1.133 ad ccdstart(struct ccd_softc *cs)
753 1.133 ad {
754 1.88 thorpej daddr_t blkno;
755 1.11 thorpej int wlabel;
756 1.15 thorpej struct disklabel *lp;
757 1.133 ad long bcount, rcount;
758 1.133 ad struct ccdbuf *cbp;
759 1.133 ad char *addr;
760 1.133 ad daddr_t bn;
761 1.133 ad vnode_t *vp;
762 1.133 ad buf_t *bp;
763 1.133 ad
764 1.133 ad KASSERT(mutex_owned(cs->sc_iolock));
765 1.133 ad
766 1.133 ad disk_busy(&cs->sc_dkdev);
767 1.133 ad bp = bufq_get(cs->sc_bufq);
768 1.133 ad KASSERT(bp != NULL);
769 1.1 hpeyerl
770 1.1 hpeyerl #ifdef DEBUG
771 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
772 1.133 ad printf("ccdstart(%s, %p)\n", cs->sc_xname, bp);
773 1.59 thorpej #endif
774 1.11 thorpej
775 1.11 thorpej /* If it's a nil transfer, wake up the top half now. */
776 1.11 thorpej if (bp->b_bcount == 0)
777 1.11 thorpej goto done;
778 1.11 thorpej
779 1.23 thorpej lp = cs->sc_dkdev.dk_label;
780 1.15 thorpej
781 1.11 thorpej /*
782 1.17 thorpej * Do bounds checking and adjust transfer. If there's an
783 1.88 thorpej * error, the bounds check will flag that for us. Convert
784 1.88 thorpej * the partition relative block number to an absolute.
785 1.11 thorpej */
786 1.88 thorpej blkno = bp->b_blkno;
787 1.11 thorpej wlabel = cs->sc_flags & (CCDF_WLABEL|CCDF_LABELLING);
788 1.88 thorpej if (DISKPART(bp->b_dev) != RAW_PART) {
789 1.86 thorpej if (bounds_check_with_label(&cs->sc_dkdev, bp, wlabel) <= 0)
790 1.1 hpeyerl goto done;
791 1.88 thorpej blkno += lp->d_partitions[DISKPART(bp->b_dev)].p_offset;
792 1.88 thorpej }
793 1.133 ad mutex_exit(cs->sc_iolock);
794 1.88 thorpej bp->b_rawblkno = blkno;
795 1.11 thorpej
796 1.133 ad /* Allocate the component buffers and start I/O! */
797 1.133 ad bp->b_resid = bp->b_bcount;
798 1.133 ad bn = bp->b_rawblkno;
799 1.133 ad addr = bp->b_data;
800 1.133 ad for (bcount = bp->b_bcount; bcount > 0; bcount -= rcount) {
801 1.133 ad cbp = ccdbuffer(cs, bp, bn, addr, bcount);
802 1.133 ad rcount = cbp->cb_buf.b_bcount;
803 1.133 ad bn += btodb(rcount);
804 1.133 ad addr += rcount;
805 1.133 ad vp = cbp->cb_buf.b_vp;
806 1.133 ad if ((cbp->cb_buf.b_flags & B_READ) == 0) {
807 1.139 rmind mutex_enter(vp->v_interlock);
808 1.133 ad vp->v_numoutput++;
809 1.139 rmind mutex_exit(vp->v_interlock);
810 1.133 ad }
811 1.133 ad (void)VOP_STRATEGY(vp, &cbp->cb_buf);
812 1.133 ad }
813 1.1 hpeyerl return;
814 1.88 thorpej
815 1.88 thorpej done:
816 1.133 ad disk_unbusy(&cs->sc_dkdev, 0, 0);
817 1.133 ad cv_broadcast(&cs->sc_stop);
818 1.133 ad cv_broadcast(&cs->sc_push);
819 1.133 ad mutex_exit(cs->sc_iolock);
820 1.88 thorpej bp->b_resid = bp->b_bcount;
821 1.1 hpeyerl biodone(bp);
822 1.1 hpeyerl }
823 1.1 hpeyerl
824 1.1 hpeyerl /*
825 1.1 hpeyerl * Build a component buffer header.
826 1.1 hpeyerl */
827 1.55 thorpej static struct ccdbuf *
828 1.118 christos ccdbuffer(struct ccd_softc *cs, struct buf *bp, daddr_t bn, void *addr,
829 1.97 thorpej long bcount)
830 1.1 hpeyerl {
831 1.68 augustss struct ccdcinfo *ci;
832 1.68 augustss struct ccdbuf *cbp;
833 1.68 augustss daddr_t cbn, cboff;
834 1.68 augustss u_int64_t cbc;
835 1.36 thorpej int ccdisk;
836 1.1 hpeyerl
837 1.1 hpeyerl #ifdef DEBUG
838 1.3 hpeyerl if (ccddebug & CCDB_IO)
839 1.81 kleink printf("ccdbuffer(%p, %p, %" PRId64 ", %p, %ld)\n",
840 1.1 hpeyerl cs, bp, bn, addr, bcount);
841 1.1 hpeyerl #endif
842 1.1 hpeyerl /*
843 1.1 hpeyerl * Determine which component bn falls in.
844 1.1 hpeyerl */
845 1.1 hpeyerl cbn = bn;
846 1.1 hpeyerl cboff = 0;
847 1.11 thorpej
848 1.1 hpeyerl /*
849 1.1 hpeyerl * Serially concatenated
850 1.1 hpeyerl */
851 1.1 hpeyerl if (cs->sc_ileave == 0) {
852 1.68 augustss daddr_t sblk;
853 1.1 hpeyerl
854 1.1 hpeyerl sblk = 0;
855 1.36 thorpej for (ccdisk = 0, ci = &cs->sc_cinfo[ccdisk];
856 1.36 thorpej cbn >= sblk + ci->ci_size;
857 1.36 thorpej ccdisk++, ci = &cs->sc_cinfo[ccdisk])
858 1.1 hpeyerl sblk += ci->ci_size;
859 1.1 hpeyerl cbn -= sblk;
860 1.1 hpeyerl }
861 1.1 hpeyerl /*
862 1.1 hpeyerl * Interleaved
863 1.1 hpeyerl */
864 1.1 hpeyerl else {
865 1.68 augustss struct ccdiinfo *ii;
866 1.36 thorpej int off;
867 1.1 hpeyerl
868 1.1 hpeyerl cboff = cbn % cs->sc_ileave;
869 1.1 hpeyerl cbn /= cs->sc_ileave;
870 1.1 hpeyerl for (ii = cs->sc_itable; ii->ii_ndisk; ii++)
871 1.1 hpeyerl if (ii->ii_startblk > cbn)
872 1.1 hpeyerl break;
873 1.1 hpeyerl ii--;
874 1.1 hpeyerl off = cbn - ii->ii_startblk;
875 1.1 hpeyerl if (ii->ii_ndisk == 1) {
876 1.1 hpeyerl ccdisk = ii->ii_index[0];
877 1.1 hpeyerl cbn = ii->ii_startoff + off;
878 1.1 hpeyerl } else {
879 1.53 thorpej ccdisk = ii->ii_index[off % ii->ii_ndisk];
880 1.53 thorpej cbn = ii->ii_startoff + off / ii->ii_ndisk;
881 1.1 hpeyerl }
882 1.1 hpeyerl cbn *= cs->sc_ileave;
883 1.1 hpeyerl ci = &cs->sc_cinfo[ccdisk];
884 1.1 hpeyerl }
885 1.11 thorpej
886 1.1 hpeyerl /*
887 1.1 hpeyerl * Fill in the component buf structure.
888 1.1 hpeyerl */
889 1.63 thorpej cbp = CCD_GETBUF();
890 1.133 ad KASSERT(cbp != NULL);
891 1.126 ad buf_init(&cbp->cb_buf);
892 1.126 ad cbp->cb_buf.b_flags = bp->b_flags;
893 1.126 ad cbp->cb_buf.b_oflags = bp->b_oflags;
894 1.126 ad cbp->cb_buf.b_cflags = bp->b_cflags;
895 1.29 christos cbp->cb_buf.b_iodone = ccdiodone;
896 1.6 cgd cbp->cb_buf.b_proc = bp->b_proc;
897 1.95 hannken cbp->cb_buf.b_dev = ci->ci_dev;
898 1.6 cgd cbp->cb_buf.b_blkno = cbn + cboff;
899 1.6 cgd cbp->cb_buf.b_data = addr;
900 1.11 thorpej cbp->cb_buf.b_vp = ci->ci_vp;
901 1.139 rmind cbp->cb_buf.b_objlock = ci->ci_vp->v_interlock;
902 1.1 hpeyerl if (cs->sc_ileave == 0)
903 1.50 thorpej cbc = dbtob((u_int64_t)(ci->ci_size - cbn));
904 1.1 hpeyerl else
905 1.50 thorpej cbc = dbtob((u_int64_t)(cs->sc_ileave - cboff));
906 1.50 thorpej cbp->cb_buf.b_bcount = cbc < bcount ? cbc : bcount;
907 1.6 cgd
908 1.1 hpeyerl /*
909 1.6 cgd * context for ccdiodone
910 1.1 hpeyerl */
911 1.6 cgd cbp->cb_obp = bp;
912 1.59 thorpej cbp->cb_sc = cs;
913 1.36 thorpej cbp->cb_comp = ccdisk;
914 1.6 cgd
915 1.94 yamt BIO_COPYPRIO(&cbp->cb_buf, bp);
916 1.94 yamt
917 1.1 hpeyerl #ifdef DEBUG
918 1.3 hpeyerl if (ccddebug & CCDB_IO)
919 1.131 cegger printf(" dev 0x%"PRIx64"(u%lu): cbp %p bn %" PRId64 " addr %p"
920 1.99 yamt " bcnt %d\n",
921 1.62 mjacob ci->ci_dev, (unsigned long) (ci-cs->sc_cinfo), cbp,
922 1.62 mjacob cbp->cb_buf.b_blkno, cbp->cb_buf.b_data,
923 1.62 mjacob cbp->cb_buf.b_bcount);
924 1.1 hpeyerl #endif
925 1.55 thorpej
926 1.55 thorpej return (cbp);
927 1.1 hpeyerl }
928 1.1 hpeyerl
929 1.1 hpeyerl /*
930 1.11 thorpej * Called at interrupt time.
931 1.1 hpeyerl * Mark the component as done and if all components are done,
932 1.1 hpeyerl * take a ccd interrupt.
933 1.1 hpeyerl */
934 1.97 thorpej static void
935 1.97 thorpej ccdiodone(struct buf *vbp)
936 1.1 hpeyerl {
937 1.29 christos struct ccdbuf *cbp = (struct ccdbuf *) vbp;
938 1.59 thorpej struct buf *bp = cbp->cb_obp;
939 1.59 thorpej struct ccd_softc *cs = cbp->cb_sc;
940 1.133 ad int count;
941 1.1 hpeyerl
942 1.1 hpeyerl #ifdef DEBUG
943 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
944 1.35 christos printf("ccdiodone(%p)\n", cbp);
945 1.3 hpeyerl if (ccddebug & CCDB_IO) {
946 1.99 yamt printf("ccdiodone: bp %p bcount %d resid %d\n",
947 1.53 thorpej bp, bp->b_bcount, bp->b_resid);
948 1.131 cegger printf(" dev 0x%"PRIx64"(u%d), cbp %p bn %" PRId64 " addr %p"
949 1.99 yamt " bcnt %d\n",
950 1.6 cgd cbp->cb_buf.b_dev, cbp->cb_comp, cbp,
951 1.6 cgd cbp->cb_buf.b_blkno, cbp->cb_buf.b_data,
952 1.6 cgd cbp->cb_buf.b_bcount);
953 1.1 hpeyerl }
954 1.1 hpeyerl #endif
955 1.1 hpeyerl
956 1.122 ad if (cbp->cb_buf.b_error != 0) {
957 1.122 ad bp->b_error = cbp->cb_buf.b_error;
958 1.53 thorpej printf("%s: error %d on component %d\n",
959 1.53 thorpej cs->sc_xname, bp->b_error, cbp->cb_comp);
960 1.1 hpeyerl }
961 1.6 cgd count = cbp->cb_buf.b_bcount;
962 1.126 ad buf_destroy(&cbp->cb_buf);
963 1.63 thorpej CCD_PUTBUF(cbp);
964 1.1 hpeyerl
965 1.1 hpeyerl /*
966 1.1 hpeyerl * If all done, "interrupt".
967 1.53 thorpej */
968 1.133 ad mutex_enter(cs->sc_iolock);
969 1.53 thorpej bp->b_resid -= count;
970 1.53 thorpej if (bp->b_resid < 0)
971 1.53 thorpej panic("ccdiodone: count");
972 1.133 ad if (bp->b_resid == 0) {
973 1.133 ad /*
974 1.133 ad * Request is done for better or worse, wakeup the top half.
975 1.133 ad */
976 1.133 ad if (bp->b_error != 0)
977 1.133 ad bp->b_resid = bp->b_bcount;
978 1.133 ad disk_unbusy(&cs->sc_dkdev, (bp->b_bcount - bp->b_resid),
979 1.133 ad (bp->b_flags & B_READ));
980 1.133 ad if (!disk_isbusy(&cs->sc_dkdev)) {
981 1.133 ad if (bufq_peek(cs->sc_bufq) != NULL) {
982 1.133 ad cv_broadcast(&cs->sc_push);
983 1.133 ad }
984 1.133 ad cv_broadcast(&cs->sc_stop);
985 1.133 ad }
986 1.133 ad mutex_exit(cs->sc_iolock);
987 1.133 ad biodone(bp);
988 1.133 ad } else
989 1.133 ad mutex_exit(cs->sc_iolock);
990 1.1 hpeyerl }
991 1.1 hpeyerl
992 1.11 thorpej /* ARGSUSED */
993 1.97 thorpej static int
994 1.116 christos ccdread(dev_t dev, struct uio *uio, int flags)
995 1.3 hpeyerl {
996 1.11 thorpej int unit = ccdunit(dev);
997 1.11 thorpej struct ccd_softc *cs;
998 1.3 hpeyerl
999 1.3 hpeyerl #ifdef DEBUG
1000 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
1001 1.131 cegger printf("ccdread(0x%"PRIx64", %p)\n", dev, uio);
1002 1.3 hpeyerl #endif
1003 1.144 christos if ((cs = ccdget(unit)) == NULL)
1004 1.144 christos return 0;
1005 1.11 thorpej
1006 1.133 ad /* Unlocked advisory check, ccdstrategy check is synchronous. */
1007 1.11 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1008 1.11 thorpej return (ENXIO);
1009 1.11 thorpej
1010 1.10 mycroft return (physio(ccdstrategy, NULL, dev, B_READ, minphys, uio));
1011 1.3 hpeyerl }
1012 1.3 hpeyerl
1013 1.11 thorpej /* ARGSUSED */
1014 1.97 thorpej static int
1015 1.116 christos ccdwrite(dev_t dev, struct uio *uio, int flags)
1016 1.3 hpeyerl {
1017 1.11 thorpej int unit = ccdunit(dev);
1018 1.11 thorpej struct ccd_softc *cs;
1019 1.3 hpeyerl
1020 1.3 hpeyerl #ifdef DEBUG
1021 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
1022 1.131 cegger printf("ccdwrite(0x%"PRIx64", %p)\n", dev, uio);
1023 1.3 hpeyerl #endif
1024 1.144 christos if ((cs = ccdget(unit)) == NULL)
1025 1.144 christos return ENOENT;
1026 1.11 thorpej
1027 1.133 ad /* Unlocked advisory check, ccdstrategy check is synchronous. */
1028 1.11 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1029 1.11 thorpej return (ENXIO);
1030 1.11 thorpej
1031 1.10 mycroft return (physio(ccdstrategy, NULL, dev, B_WRITE, minphys, uio));
1032 1.3 hpeyerl }
1033 1.3 hpeyerl
1034 1.97 thorpej static int
1035 1.118 christos ccdioctl(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
1036 1.1 hpeyerl {
1037 1.11 thorpej int unit = ccdunit(dev);
1038 1.133 ad int i, j, lookedup = 0, error = 0;
1039 1.39 mycroft int part, pmask;
1040 1.11 thorpej struct ccd_softc *cs;
1041 1.11 thorpej struct ccd_ioctl *ccio = (struct ccd_ioctl *)data;
1042 1.110 elad kauth_cred_t uc;
1043 1.11 thorpej char **cpp;
1044 1.136 dholland struct pathbuf *pb;
1045 1.11 thorpej struct vnode **vpp;
1046 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1047 1.70 fvdl struct disklabel newlabel;
1048 1.70 fvdl #endif
1049 1.11 thorpej
1050 1.144 christos if ((cs = ccdget(unit)) == NULL)
1051 1.144 christos return ENOENT;
1052 1.133 ad uc = kauth_cred_get();
1053 1.109 jld
1054 1.41 thorpej /* Must be open for writes for these commands... */
1055 1.41 thorpej switch (cmd) {
1056 1.41 thorpej case CCDIOCSET:
1057 1.41 thorpej case CCDIOCCLR:
1058 1.41 thorpej case DIOCSDINFO:
1059 1.41 thorpej case DIOCWDINFO:
1060 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1061 1.70 fvdl case ODIOCSDINFO:
1062 1.70 fvdl case ODIOCWDINFO:
1063 1.70 fvdl #endif
1064 1.87 thorpej case DIOCKLABEL:
1065 1.41 thorpej case DIOCWLABEL:
1066 1.41 thorpej if ((flag & FWRITE) == 0)
1067 1.41 thorpej return (EBADF);
1068 1.41 thorpej }
1069 1.41 thorpej
1070 1.133 ad mutex_enter(&cs->sc_dvlock);
1071 1.57 thorpej
1072 1.41 thorpej /* Must be initialized for these... */
1073 1.41 thorpej switch (cmd) {
1074 1.41 thorpej case CCDIOCCLR:
1075 1.42 kleink case DIOCGDINFO:
1076 1.100 thorpej case DIOCCACHESYNC:
1077 1.42 kleink case DIOCSDINFO:
1078 1.42 kleink case DIOCWDINFO:
1079 1.42 kleink case DIOCGPART:
1080 1.41 thorpej case DIOCWLABEL:
1081 1.87 thorpej case DIOCKLABEL:
1082 1.44 thorpej case DIOCGDEFLABEL:
1083 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1084 1.70 fvdl case ODIOCGDINFO:
1085 1.70 fvdl case ODIOCSDINFO:
1086 1.70 fvdl case ODIOCWDINFO:
1087 1.70 fvdl case ODIOCGDEFLABEL:
1088 1.70 fvdl #endif
1089 1.57 thorpej if ((cs->sc_flags & CCDF_INITED) == 0) {
1090 1.57 thorpej error = ENXIO;
1091 1.57 thorpej goto out;
1092 1.57 thorpej }
1093 1.41 thorpej }
1094 1.41 thorpej
1095 1.11 thorpej switch (cmd) {
1096 1.11 thorpej case CCDIOCSET:
1097 1.57 thorpej if (cs->sc_flags & CCDF_INITED) {
1098 1.57 thorpej error = EBUSY;
1099 1.57 thorpej goto out;
1100 1.57 thorpej }
1101 1.54 thorpej
1102 1.54 thorpej /* Validate the flags. */
1103 1.57 thorpej if ((ccio->ccio_flags & CCDF_USERMASK) != ccio->ccio_flags) {
1104 1.57 thorpej error = EINVAL;
1105 1.57 thorpej goto out;
1106 1.57 thorpej }
1107 1.15 thorpej
1108 1.133 ad if (ccio->ccio_ndisks > CCD_MAXNDISKS ||
1109 1.133 ad ccio->ccio_ndisks == 0) {
1110 1.73 jdolecek error = EINVAL;
1111 1.73 jdolecek goto out;
1112 1.73 jdolecek }
1113 1.102 perry
1114 1.11 thorpej /* Fill in some important bits. */
1115 1.57 thorpej cs->sc_ileave = ccio->ccio_ileave;
1116 1.57 thorpej cs->sc_nccdisks = ccio->ccio_ndisks;
1117 1.57 thorpej cs->sc_flags = ccio->ccio_flags & CCDF_USERMASK;
1118 1.11 thorpej
1119 1.11 thorpej /*
1120 1.11 thorpej * Allocate space for and copy in the array of
1121 1.11 thorpej * componet pathnames and device numbers.
1122 1.11 thorpej */
1123 1.133 ad cpp = kmem_alloc(ccio->ccio_ndisks * sizeof(*cpp), KM_SLEEP);
1124 1.133 ad vpp = kmem_alloc(ccio->ccio_ndisks * sizeof(*vpp), KM_SLEEP);
1125 1.84 dsl error = copyin(ccio->ccio_disks, cpp,
1126 1.133 ad ccio->ccio_ndisks * sizeof(*cpp));
1127 1.11 thorpej if (error) {
1128 1.133 ad kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1129 1.133 ad kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1130 1.57 thorpej goto out;
1131 1.11 thorpej }
1132 1.11 thorpej
1133 1.11 thorpej #ifdef DEBUG
1134 1.11 thorpej if (ccddebug & CCDB_INIT)
1135 1.11 thorpej for (i = 0; i < ccio->ccio_ndisks; ++i)
1136 1.104 christos printf("ccdioctl: component %d: %p\n",
1137 1.11 thorpej i, cpp[i]);
1138 1.11 thorpej #endif
1139 1.11 thorpej
1140 1.11 thorpej for (i = 0; i < ccio->ccio_ndisks; ++i) {
1141 1.11 thorpej #ifdef DEBUG
1142 1.11 thorpej if (ccddebug & CCDB_INIT)
1143 1.35 christos printf("ccdioctl: lookedup = %d\n", lookedup);
1144 1.11 thorpej #endif
1145 1.136 dholland error = pathbuf_copyin(cpp[i], &pb);
1146 1.137 dholland if (error == 0) {
1147 1.137 dholland error = dk_lookup(pb, l, &vpp[i]);
1148 1.136 dholland }
1149 1.136 dholland pathbuf_destroy(pb);
1150 1.136 dholland if (error != 0) {
1151 1.11 thorpej for (j = 0; j < lookedup; ++j)
1152 1.12 thorpej (void)vn_close(vpp[j], FREAD|FWRITE,
1153 1.128 ad uc);
1154 1.133 ad kmem_free(vpp, ccio->ccio_ndisks *
1155 1.133 ad sizeof(*vpp));
1156 1.133 ad kmem_free(cpp, ccio->ccio_ndisks *
1157 1.133 ad sizeof(*cpp));
1158 1.57 thorpej goto out;
1159 1.11 thorpej }
1160 1.11 thorpej ++lookedup;
1161 1.11 thorpej }
1162 1.11 thorpej
1163 1.133 ad /* Attach the disk. */
1164 1.133 ad disk_attach(&cs->sc_dkdev);
1165 1.133 ad bufq_alloc(&cs->sc_bufq, "fcfs", 0);
1166 1.133 ad
1167 1.11 thorpej /*
1168 1.11 thorpej * Initialize the ccd. Fills in the softc for us.
1169 1.11 thorpej */
1170 1.107 christos if ((error = ccdinit(cs, cpp, vpp, l)) != 0) {
1171 1.11 thorpej for (j = 0; j < lookedup; ++j)
1172 1.18 thorpej (void)vn_close(vpp[j], FREAD|FWRITE,
1173 1.128 ad uc);
1174 1.133 ad kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1175 1.133 ad kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1176 1.133 ad disk_detach(&cs->sc_dkdev);
1177 1.133 ad bufq_free(cs->sc_bufq);
1178 1.57 thorpej goto out;
1179 1.11 thorpej }
1180 1.11 thorpej
1181 1.57 thorpej /* We can free the temporary variables now. */
1182 1.133 ad kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1183 1.133 ad kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1184 1.57 thorpej
1185 1.11 thorpej /*
1186 1.11 thorpej * The ccd has been successfully initialized, so
1187 1.23 thorpej * we can place it into the array. Don't try to
1188 1.23 thorpej * read the disklabel until the disk has been attached,
1189 1.23 thorpej * because space for the disklabel is allocated
1190 1.23 thorpej * in disk_attach();
1191 1.11 thorpej */
1192 1.11 thorpej ccio->ccio_unit = unit;
1193 1.11 thorpej ccio->ccio_size = cs->sc_size;
1194 1.23 thorpej
1195 1.23 thorpej /* Try and read the disklabel. */
1196 1.11 thorpej ccdgetdisklabel(dev);
1197 1.11 thorpej break;
1198 1.11 thorpej
1199 1.11 thorpej case CCDIOCCLR:
1200 1.11 thorpej /*
1201 1.11 thorpej * Don't unconfigure if any other partitions are open
1202 1.11 thorpej * or if both the character and block flavors of this
1203 1.11 thorpej * partition are open.
1204 1.11 thorpej */
1205 1.11 thorpej part = DISKPART(dev);
1206 1.11 thorpej pmask = (1 << part);
1207 1.11 thorpej if ((cs->sc_dkdev.dk_openmask & ~pmask) ||
1208 1.11 thorpej ((cs->sc_dkdev.dk_bopenmask & pmask) &&
1209 1.15 thorpej (cs->sc_dkdev.dk_copenmask & pmask))) {
1210 1.57 thorpej error = EBUSY;
1211 1.57 thorpej goto out;
1212 1.15 thorpej }
1213 1.88 thorpej
1214 1.133 ad /* Stop new I/O, wait for in-flight I/O to complete. */
1215 1.133 ad mutex_enter(cs->sc_iolock);
1216 1.133 ad cs->sc_flags &= ~(CCDF_INITED|CCDF_VLABEL);
1217 1.133 ad cs->sc_zap = true;
1218 1.133 ad while (disk_isbusy(&cs->sc_dkdev) ||
1219 1.133 ad bufq_peek(cs->sc_bufq) != NULL ||
1220 1.133 ad cs->sc_thread != NULL) {
1221 1.133 ad cv_broadcast(&cs->sc_push);
1222 1.133 ad (void)cv_timedwait(&cs->sc_stop, cs->sc_iolock, hz);
1223 1.133 ad }
1224 1.133 ad mutex_exit(cs->sc_iolock);
1225 1.11 thorpej
1226 1.11 thorpej /*
1227 1.11 thorpej * Free ccd_softc information and clear entry.
1228 1.11 thorpej */
1229 1.22 thorpej
1230 1.22 thorpej /* Close the components and free their pathnames. */
1231 1.11 thorpej for (i = 0; i < cs->sc_nccdisks; ++i) {
1232 1.11 thorpej /*
1233 1.11 thorpej * XXX: this close could potentially fail and
1234 1.11 thorpej * cause Bad Things. Maybe we need to force
1235 1.11 thorpej * the close to happen?
1236 1.11 thorpej */
1237 1.11 thorpej #ifdef DEBUG
1238 1.11 thorpej if (ccddebug & CCDB_VNODE)
1239 1.11 thorpej vprint("CCDIOCCLR: vnode info",
1240 1.11 thorpej cs->sc_cinfo[i].ci_vp);
1241 1.11 thorpej #endif
1242 1.11 thorpej (void)vn_close(cs->sc_cinfo[i].ci_vp, FREAD|FWRITE,
1243 1.128 ad uc);
1244 1.133 ad kmem_free(cs->sc_cinfo[i].ci_path,
1245 1.133 ad cs->sc_cinfo[i].ci_pathlen);
1246 1.38 thorpej }
1247 1.38 thorpej
1248 1.22 thorpej /* Free interleave index. */
1249 1.133 ad for (i = 0; cs->sc_itable[i].ii_ndisk; ++i) {
1250 1.133 ad kmem_free(cs->sc_itable[i].ii_index,
1251 1.133 ad cs->sc_itable[i].ii_indexsz);
1252 1.133 ad }
1253 1.22 thorpej
1254 1.22 thorpej /* Free component info and interleave table. */
1255 1.133 ad kmem_free(cs->sc_cinfo, cs->sc_nccdisks *
1256 1.133 ad sizeof(struct ccdcinfo));
1257 1.133 ad kmem_free(cs->sc_itable, (cs->sc_nccdisks + 1) *
1258 1.133 ad sizeof(struct ccdiinfo));
1259 1.15 thorpej
1260 1.23 thorpej /* Detatch the disk. */
1261 1.123 ad disk_detach(&cs->sc_dkdev);
1262 1.133 ad bufq_free(cs->sc_bufq);
1263 1.144 christos ccdput(cs);
1264 1.148 joerg /* Don't break, otherwise cs is read again. */
1265 1.148 joerg return 0;
1266 1.11 thorpej
1267 1.11 thorpej case DIOCGDINFO:
1268 1.23 thorpej *(struct disklabel *)data = *(cs->sc_dkdev.dk_label);
1269 1.11 thorpej break;
1270 1.133 ad
1271 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1272 1.70 fvdl case ODIOCGDINFO:
1273 1.70 fvdl newlabel = *(cs->sc_dkdev.dk_label);
1274 1.70 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
1275 1.71 fvdl return ENOTTY;
1276 1.70 fvdl memcpy(data, &newlabel, sizeof (struct olddisklabel));
1277 1.70 fvdl break;
1278 1.70 fvdl #endif
1279 1.11 thorpej
1280 1.11 thorpej case DIOCGPART:
1281 1.23 thorpej ((struct partinfo *)data)->disklab = cs->sc_dkdev.dk_label;
1282 1.11 thorpej ((struct partinfo *)data)->part =
1283 1.23 thorpej &cs->sc_dkdev.dk_label->d_partitions[DISKPART(dev)];
1284 1.11 thorpej break;
1285 1.11 thorpej
1286 1.100 thorpej case DIOCCACHESYNC:
1287 1.100 thorpej /*
1288 1.100 thorpej * XXX Do we really need to care about having a writable
1289 1.100 thorpej * file descriptor here?
1290 1.100 thorpej */
1291 1.100 thorpej if ((flag & FWRITE) == 0)
1292 1.100 thorpej return (EBADF);
1293 1.100 thorpej
1294 1.100 thorpej /*
1295 1.100 thorpej * We pass this call down to all components and report
1296 1.100 thorpej * the first error we encounter.
1297 1.100 thorpej */
1298 1.100 thorpej for (error = 0, i = 0; i < cs->sc_nccdisks; i++) {
1299 1.100 thorpej j = VOP_IOCTL(cs->sc_cinfo[i].ci_vp, cmd, data,
1300 1.124 pooka flag, uc);
1301 1.100 thorpej if (j != 0 && error == 0)
1302 1.100 thorpej error = j;
1303 1.100 thorpej }
1304 1.100 thorpej break;
1305 1.100 thorpej
1306 1.11 thorpej case DIOCWDINFO:
1307 1.11 thorpej case DIOCSDINFO:
1308 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1309 1.70 fvdl case ODIOCWDINFO:
1310 1.70 fvdl case ODIOCSDINFO:
1311 1.70 fvdl #endif
1312 1.70 fvdl {
1313 1.70 fvdl struct disklabel *lp;
1314 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1315 1.70 fvdl if (cmd == ODIOCSDINFO || cmd == ODIOCWDINFO) {
1316 1.70 fvdl memset(&newlabel, 0, sizeof newlabel);
1317 1.70 fvdl memcpy(&newlabel, data, sizeof (struct olddisklabel));
1318 1.70 fvdl lp = &newlabel;
1319 1.70 fvdl } else
1320 1.70 fvdl #endif
1321 1.70 fvdl lp = (struct disklabel *)data;
1322 1.70 fvdl
1323 1.11 thorpej cs->sc_flags |= CCDF_LABELLING;
1324 1.11 thorpej
1325 1.23 thorpej error = setdisklabel(cs->sc_dkdev.dk_label,
1326 1.70 fvdl lp, 0, cs->sc_dkdev.dk_cpulabel);
1327 1.11 thorpej if (error == 0) {
1328 1.70 fvdl if (cmd == DIOCWDINFO
1329 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1330 1.70 fvdl || cmd == ODIOCWDINFO
1331 1.70 fvdl #endif
1332 1.70 fvdl )
1333 1.11 thorpej error = writedisklabel(CCDLABELDEV(dev),
1334 1.23 thorpej ccdstrategy, cs->sc_dkdev.dk_label,
1335 1.23 thorpej cs->sc_dkdev.dk_cpulabel);
1336 1.11 thorpej }
1337 1.11 thorpej
1338 1.11 thorpej cs->sc_flags &= ~CCDF_LABELLING;
1339 1.11 thorpej break;
1340 1.70 fvdl }
1341 1.11 thorpej
1342 1.87 thorpej case DIOCKLABEL:
1343 1.87 thorpej if (*(int *)data != 0)
1344 1.87 thorpej cs->sc_flags |= CCDF_KLABEL;
1345 1.87 thorpej else
1346 1.87 thorpej cs->sc_flags &= ~CCDF_KLABEL;
1347 1.87 thorpej break;
1348 1.87 thorpej
1349 1.11 thorpej case DIOCWLABEL:
1350 1.11 thorpej if (*(int *)data != 0)
1351 1.11 thorpej cs->sc_flags |= CCDF_WLABEL;
1352 1.11 thorpej else
1353 1.11 thorpej cs->sc_flags &= ~CCDF_WLABEL;
1354 1.11 thorpej break;
1355 1.11 thorpej
1356 1.44 thorpej case DIOCGDEFLABEL:
1357 1.44 thorpej ccdgetdefaultlabel(cs, (struct disklabel *)data);
1358 1.44 thorpej break;
1359 1.70 fvdl
1360 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1361 1.70 fvdl case ODIOCGDEFLABEL:
1362 1.70 fvdl ccdgetdefaultlabel(cs, &newlabel);
1363 1.70 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
1364 1.71 fvdl return ENOTTY;
1365 1.70 fvdl memcpy(data, &newlabel, sizeof (struct olddisklabel));
1366 1.70 fvdl break;
1367 1.70 fvdl #endif
1368 1.44 thorpej
1369 1.11 thorpej default:
1370 1.57 thorpej error = ENOTTY;
1371 1.11 thorpej }
1372 1.11 thorpej
1373 1.57 thorpej out:
1374 1.133 ad mutex_exit(&cs->sc_dvlock);
1375 1.57 thorpej return (error);
1376 1.1 hpeyerl }
1377 1.1 hpeyerl
1378 1.97 thorpej static int
1379 1.97 thorpej ccdsize(dev_t dev)
1380 1.1 hpeyerl {
1381 1.11 thorpej struct ccd_softc *cs;
1382 1.40 thorpej struct disklabel *lp;
1383 1.40 thorpej int part, unit, omask, size;
1384 1.40 thorpej
1385 1.40 thorpej unit = ccdunit(dev);
1386 1.144 christos if ((cs = ccdget(unit)) == NULL)
1387 1.144 christos return -1;
1388 1.11 thorpej
1389 1.40 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1390 1.11 thorpej return (-1);
1391 1.11 thorpej
1392 1.11 thorpej part = DISKPART(dev);
1393 1.40 thorpej omask = cs->sc_dkdev.dk_openmask & (1 << part);
1394 1.40 thorpej lp = cs->sc_dkdev.dk_label;
1395 1.11 thorpej
1396 1.107 christos if (omask == 0 && ccdopen(dev, 0, S_IFBLK, curlwp))
1397 1.11 thorpej return (-1);
1398 1.11 thorpej
1399 1.40 thorpej if (lp->d_partitions[part].p_fstype != FS_SWAP)
1400 1.11 thorpej size = -1;
1401 1.11 thorpej else
1402 1.40 thorpej size = lp->d_partitions[part].p_size *
1403 1.40 thorpej (lp->d_secsize / DEV_BSIZE);
1404 1.11 thorpej
1405 1.107 christos if (omask == 0 && ccdclose(dev, 0, S_IFBLK, curlwp))
1406 1.11 thorpej return (-1);
1407 1.1 hpeyerl
1408 1.11 thorpej return (size);
1409 1.1 hpeyerl }
1410 1.1 hpeyerl
1411 1.11 thorpej static void
1412 1.97 thorpej ccdgetdefaultlabel(struct ccd_softc *cs, struct disklabel *lp)
1413 1.11 thorpej {
1414 1.11 thorpej struct ccdgeom *ccg = &cs->sc_geom;
1415 1.11 thorpej
1416 1.72 thorpej memset(lp, 0, sizeof(*lp));
1417 1.11 thorpej
1418 1.11 thorpej lp->d_secperunit = cs->sc_size;
1419 1.11 thorpej lp->d_secsize = ccg->ccg_secsize;
1420 1.11 thorpej lp->d_nsectors = ccg->ccg_nsectors;
1421 1.11 thorpej lp->d_ntracks = ccg->ccg_ntracks;
1422 1.11 thorpej lp->d_ncylinders = ccg->ccg_ncylinders;
1423 1.19 thorpej lp->d_secpercyl = lp->d_ntracks * lp->d_nsectors;
1424 1.11 thorpej
1425 1.11 thorpej strncpy(lp->d_typename, "ccd", sizeof(lp->d_typename));
1426 1.11 thorpej lp->d_type = DTYPE_CCD;
1427 1.11 thorpej strncpy(lp->d_packname, "fictitious", sizeof(lp->d_packname));
1428 1.11 thorpej lp->d_rpm = 3600;
1429 1.11 thorpej lp->d_interleave = 1;
1430 1.11 thorpej lp->d_flags = 0;
1431 1.11 thorpej
1432 1.11 thorpej lp->d_partitions[RAW_PART].p_offset = 0;
1433 1.11 thorpej lp->d_partitions[RAW_PART].p_size = cs->sc_size;
1434 1.11 thorpej lp->d_partitions[RAW_PART].p_fstype = FS_UNUSED;
1435 1.11 thorpej lp->d_npartitions = RAW_PART + 1;
1436 1.11 thorpej
1437 1.11 thorpej lp->d_magic = DISKMAGIC;
1438 1.11 thorpej lp->d_magic2 = DISKMAGIC;
1439 1.23 thorpej lp->d_checksum = dkcksum(cs->sc_dkdev.dk_label);
1440 1.44 thorpej }
1441 1.44 thorpej
1442 1.44 thorpej /*
1443 1.44 thorpej * Read the disklabel from the ccd. If one is not present, fake one
1444 1.44 thorpej * up.
1445 1.44 thorpej */
1446 1.44 thorpej static void
1447 1.97 thorpej ccdgetdisklabel(dev_t dev)
1448 1.44 thorpej {
1449 1.44 thorpej int unit = ccdunit(dev);
1450 1.144 christos struct ccd_softc *cs;
1451 1.85 dsl const char *errstring;
1452 1.144 christos struct disklabel *lp;
1453 1.144 christos struct cpu_disklabel *clp;
1454 1.44 thorpej
1455 1.144 christos if ((cs = ccdget(unit)) == NULL)
1456 1.144 christos return;
1457 1.144 christos lp = cs->sc_dkdev.dk_label;
1458 1.144 christos clp = cs->sc_dkdev.dk_cpulabel;
1459 1.133 ad KASSERT(mutex_owned(&cs->sc_dvlock));
1460 1.133 ad
1461 1.72 thorpej memset(clp, 0, sizeof(*clp));
1462 1.44 thorpej
1463 1.44 thorpej ccdgetdefaultlabel(cs, lp);
1464 1.11 thorpej
1465 1.11 thorpej /*
1466 1.11 thorpej * Call the generic disklabel extraction routine.
1467 1.11 thorpej */
1468 1.133 ad cs->sc_flags |= CCDF_RLABEL;
1469 1.92 lukem if ((cs->sc_flags & CCDF_NOLABEL) != 0)
1470 1.92 lukem errstring = "CCDF_NOLABEL set; ignoring on-disk label";
1471 1.92 lukem else
1472 1.92 lukem errstring = readdisklabel(CCDLABELDEV(dev), ccdstrategy,
1473 1.92 lukem cs->sc_dkdev.dk_label, cs->sc_dkdev.dk_cpulabel);
1474 1.29 christos if (errstring)
1475 1.11 thorpej ccdmakedisklabel(cs);
1476 1.47 enami else {
1477 1.47 enami int i;
1478 1.47 enami struct partition *pp;
1479 1.47 enami
1480 1.47 enami /*
1481 1.47 enami * Sanity check whether the found disklabel is valid.
1482 1.47 enami *
1483 1.47 enami * This is necessary since total size of ccd may vary
1484 1.47 enami * when an interleave is changed even though exactly
1485 1.47 enami * same componets are used, and old disklabel may used
1486 1.47 enami * if that is found.
1487 1.47 enami */
1488 1.47 enami if (lp->d_secperunit != cs->sc_size)
1489 1.47 enami printf("WARNING: %s: "
1490 1.47 enami "total sector size in disklabel (%d) != "
1491 1.60 thorpej "the size of ccd (%lu)\n", cs->sc_xname,
1492 1.60 thorpej lp->d_secperunit, (u_long)cs->sc_size);
1493 1.47 enami for (i = 0; i < lp->d_npartitions; i++) {
1494 1.47 enami pp = &lp->d_partitions[i];
1495 1.47 enami if (pp->p_offset + pp->p_size > cs->sc_size)
1496 1.48 enami printf("WARNING: %s: end of partition `%c' "
1497 1.60 thorpej "exceeds the size of ccd (%lu)\n",
1498 1.60 thorpej cs->sc_xname, 'a' + i, (u_long)cs->sc_size);
1499 1.47 enami }
1500 1.47 enami }
1501 1.11 thorpej
1502 1.11 thorpej #ifdef DEBUG
1503 1.11 thorpej /* It's actually extremely common to have unlabeled ccds. */
1504 1.11 thorpej if (ccddebug & CCDB_LABEL)
1505 1.11 thorpej if (errstring != NULL)
1506 1.35 christos printf("%s: %s\n", cs->sc_xname, errstring);
1507 1.11 thorpej #endif
1508 1.87 thorpej
1509 1.87 thorpej /* In-core label now valid. */
1510 1.133 ad cs->sc_flags = (cs->sc_flags | CCDF_VLABEL) & ~CCDF_RLABEL;
1511 1.11 thorpej }
1512 1.11 thorpej
1513 1.11 thorpej /*
1514 1.11 thorpej * Take care of things one might want to take care of in the event
1515 1.11 thorpej * that a disklabel isn't present.
1516 1.11 thorpej */
1517 1.11 thorpej static void
1518 1.97 thorpej ccdmakedisklabel(struct ccd_softc *cs)
1519 1.11 thorpej {
1520 1.23 thorpej struct disklabel *lp = cs->sc_dkdev.dk_label;
1521 1.11 thorpej
1522 1.11 thorpej /*
1523 1.11 thorpej * For historical reasons, if there's no disklabel present
1524 1.11 thorpej * the raw partition must be marked FS_BSDFFS.
1525 1.11 thorpej */
1526 1.11 thorpej lp->d_partitions[RAW_PART].p_fstype = FS_BSDFFS;
1527 1.11 thorpej
1528 1.11 thorpej strncpy(lp->d_packname, "default label", sizeof(lp->d_packname));
1529 1.44 thorpej
1530 1.44 thorpej lp->d_checksum = dkcksum(lp);
1531 1.11 thorpej }
1532 1.11 thorpej
#ifdef DEBUG
/*
 * Debug helper: print every entry of an interleave table, one line per
 * entry, stopping at the terminating entry whose ii_ndisk is zero.
 */
static void
printiinfo(struct ccdiinfo *ii)
{
	int row = 0;
	int col;

	while (ii->ii_ndisk) {
		printf(" itab[%d]: #dk %d sblk %" PRId64 " soff %" PRId64,
		    row, ii->ii_ndisk, ii->ii_startblk, ii->ii_startoff);
		for (col = 0; col < ii->ii_ndisk; col++)
			printf(" %d", ii->ii_index[col]);
		printf("\n");
		row++;
		ii++;
	}
}
#endif
1548 1.134 haad
1549 1.146 pgoyette MODULE(MODULE_CLASS_DRIVER, ccd, "dk_subr");
1550 1.134 haad
1551 1.134 haad static int
1552 1.134 haad ccd_modcmd(modcmd_t cmd, void *arg)
1553 1.134 haad {
1554 1.145 martin int error = 0;
1555 1.145 martin #ifdef _MODULE
1556 1.145 martin int bmajor = -1, cmajor = -1;
1557 1.145 martin #endif
1558 1.140 jruoho
1559 1.140 jruoho
1560 1.134 haad switch (cmd) {
1561 1.134 haad case MODULE_CMD_INIT:
1562 1.140 jruoho #ifdef _MODULE
1563 1.134 haad ccdattach(4);
1564 1.140 jruoho
1565 1.134 haad return devsw_attach("ccd", &ccd_bdevsw, &bmajor,
1566 1.134 haad &ccd_cdevsw, &cmajor);
1567 1.140 jruoho #endif
1568 1.134 haad break;
1569 1.134 haad
1570 1.134 haad case MODULE_CMD_FINI:
1571 1.140 jruoho #ifdef _MODULE
1572 1.134 haad return devsw_detach(&ccd_bdevsw, &ccd_cdevsw);
1573 1.140 jruoho #endif
1574 1.134 haad break;
1575 1.134 haad
1576 1.134 haad case MODULE_CMD_STAT:
1577 1.134 haad return ENOTTY;
1578 1.134 haad
1579 1.134 haad default:
1580 1.134 haad return ENOTTY;
1581 1.134 haad }
1582 1.134 haad
1583 1.134 haad return error;
1584 1.134 haad }
1585 1.144 christos
1586 1.144 christos static int
1587 1.144 christos ccd_units_sysctl(SYSCTLFN_ARGS)
1588 1.144 christos {
1589 1.144 christos struct sysctlnode node;
1590 1.144 christos struct ccd_softc *sc;
1591 1.144 christos int error, i, nccd, *units;
1592 1.144 christos size_t size;
1593 1.144 christos
1594 1.144 christos nccd = 0;
1595 1.144 christos mutex_enter(&ccd_lock);
1596 1.144 christos LIST_FOREACH(sc, &ccds, sc_link)
1597 1.144 christos nccd++;
1598 1.144 christos mutex_exit(&ccd_lock);
1599 1.144 christos
1600 1.144 christos if (nccd != 0) {
1601 1.144 christos size = nccd * sizeof(*units);
1602 1.144 christos units = kmem_zalloc(size, KM_SLEEP);
1603 1.144 christos if (units == NULL)
1604 1.144 christos return ENOMEM;
1605 1.144 christos
1606 1.144 christos i = 0;
1607 1.144 christos mutex_enter(&ccd_lock);
1608 1.144 christos LIST_FOREACH(sc, &ccds, sc_link) {
1609 1.144 christos if (i >= nccd)
1610 1.144 christos break;
1611 1.144 christos units[i] = sc->sc_unit;
1612 1.144 christos }
1613 1.144 christos mutex_exit(&ccd_lock);
1614 1.144 christos } else {
1615 1.144 christos units = NULL;
1616 1.144 christos size = 0;
1617 1.144 christos }
1618 1.144 christos
1619 1.144 christos node = *rnode;
1620 1.144 christos node.sysctl_data = units;
1621 1.144 christos node.sysctl_size = size;
1622 1.144 christos
1623 1.144 christos error = sysctl_lookup(SYSCTLFN_CALL(&node));
1624 1.144 christos if (units)
1625 1.144 christos kmem_free(units, size);
1626 1.144 christos return error;
1627 1.144 christos }
1628 1.144 christos
1629 1.144 christos static int
1630 1.144 christos ccd_info_sysctl(SYSCTLFN_ARGS)
1631 1.144 christos {
1632 1.144 christos struct sysctlnode node;
1633 1.144 christos struct ccddiskinfo ccd;
1634 1.144 christos struct ccd_softc *sc;
1635 1.144 christos int unit;
1636 1.144 christos
1637 1.144 christos if (newp == NULL || newlen != sizeof(int))
1638 1.144 christos return EINVAL;
1639 1.144 christos
1640 1.144 christos unit = *(const int *)newp;
1641 1.144 christos newp = NULL;
1642 1.144 christos newlen = 0;
1643 1.144 christos ccd.ccd_ndisks = ~0;
1644 1.144 christos mutex_enter(&ccd_lock);
1645 1.144 christos LIST_FOREACH(sc, &ccds, sc_link) {
1646 1.144 christos if (sc->sc_unit == unit) {
1647 1.144 christos ccd.ccd_ileave = sc->sc_ileave;
1648 1.144 christos ccd.ccd_size = sc->sc_size;
1649 1.144 christos ccd.ccd_ndisks = sc->sc_nccdisks;
1650 1.144 christos ccd.ccd_flags = sc->sc_flags;
1651 1.144 christos break;
1652 1.144 christos }
1653 1.144 christos }
1654 1.144 christos mutex_exit(&ccd_lock);
1655 1.144 christos
1656 1.144 christos if (ccd.ccd_ndisks == ~0)
1657 1.144 christos return ENOENT;
1658 1.144 christos
1659 1.144 christos node = *rnode;
1660 1.144 christos node.sysctl_data = &ccd;
1661 1.144 christos node.sysctl_size = sizeof(ccd);
1662 1.144 christos
1663 1.144 christos return sysctl_lookup(SYSCTLFN_CALL(&node));
1664 1.144 christos }
1665 1.144 christos
1666 1.144 christos static int
1667 1.144 christos ccd_components_sysctl(SYSCTLFN_ARGS)
1668 1.144 christos {
1669 1.144 christos struct sysctlnode node;
1670 1.144 christos int error, unit;
1671 1.144 christos size_t size;
1672 1.144 christos char *names, *p, *ep;
1673 1.144 christos struct ccd_softc *sc;
1674 1.144 christos
1675 1.144 christos if (newp == NULL || newlen != sizeof(int))
1676 1.144 christos return EINVAL;
1677 1.144 christos
1678 1.144 christos size = 0;
1679 1.144 christos unit = *(const int *)newp;
1680 1.144 christos newp = NULL;
1681 1.144 christos newlen = 0;
1682 1.144 christos mutex_enter(&ccd_lock);
1683 1.144 christos LIST_FOREACH(sc, &ccds, sc_link)
1684 1.144 christos if (sc->sc_unit == unit) {
1685 1.144 christos for (size_t i = 0; i < sc->sc_nccdisks; i++)
1686 1.144 christos size += strlen(sc->sc_cinfo[i].ci_path) + 1;
1687 1.144 christos break;
1688 1.144 christos }
1689 1.144 christos mutex_exit(&ccd_lock);
1690 1.144 christos
1691 1.144 christos if (size == 0)
1692 1.144 christos return ENOENT;
1693 1.144 christos names = kmem_zalloc(size, KM_SLEEP);
1694 1.144 christos if (names == NULL)
1695 1.144 christos return ENOMEM;
1696 1.144 christos
1697 1.144 christos p = names;
1698 1.144 christos ep = names + size;
1699 1.144 christos mutex_enter(&ccd_lock);
1700 1.144 christos LIST_FOREACH(sc, &ccds, sc_link)
1701 1.144 christos if (sc->sc_unit == unit) {
1702 1.144 christos for (size_t i = 0; i < sc->sc_nccdisks; i++) {
1703 1.144 christos char *d = sc->sc_cinfo[i].ci_path;
1704 1.144 christos while (p < ep && (*p++ = *d++) != '\0')
1705 1.144 christos continue;
1706 1.144 christos }
1707 1.144 christos break;
1708 1.144 christos }
1709 1.144 christos mutex_exit(&ccd_lock);
1710 1.144 christos
1711 1.144 christos node = *rnode;
1712 1.144 christos node.sysctl_data = names;
1713 1.144 christos node.sysctl_size = ep - names;
1714 1.144 christos
1715 1.144 christos error = sysctl_lookup(SYSCTLFN_CALL(&node));
1716 1.144 christos kmem_free(names, size);
1717 1.144 christos return error;
1718 1.144 christos }
1719 1.144 christos
1720 1.144 christos SYSCTL_SETUP(sysctl_kern_ccd_setup, "sysctl kern.ccd subtree setup")
1721 1.144 christos {
1722 1.144 christos const struct sysctlnode *node = NULL;
1723 1.144 christos
1724 1.144 christos sysctl_createv(clog, 0, NULL, &node,
1725 1.144 christos CTLFLAG_PERMANENT,
1726 1.144 christos CTLTYPE_NODE, "ccd",
1727 1.144 christos SYSCTL_DESCR("ConCatenated Disk state"),
1728 1.144 christos NULL, 0, NULL, 0,
1729 1.144 christos CTL_KERN, CTL_CREATE, CTL_EOL);
1730 1.144 christos
1731 1.144 christos if (node == NULL)
1732 1.144 christos return;
1733 1.144 christos
1734 1.144 christos sysctl_createv(clog, 0, &node, NULL,
1735 1.144 christos CTLFLAG_PERMANENT | CTLFLAG_READONLY,
1736 1.144 christos CTLTYPE_STRUCT, "units",
1737 1.144 christos SYSCTL_DESCR("List of ccd unit numbers"),
1738 1.144 christos ccd_units_sysctl, 0, NULL, 0,
1739 1.144 christos CTL_CREATE, CTL_EOL);
1740 1.144 christos sysctl_createv(clog, 0, &node, NULL,
1741 1.144 christos CTLFLAG_PERMANENT | CTLFLAG_READWRITE,
1742 1.144 christos CTLTYPE_STRUCT, "info",
1743 1.144 christos SYSCTL_DESCR("Information about a CCD unit"),
1744 1.144 christos ccd_info_sysctl, 0, NULL, 0,
1745 1.144 christos CTL_CREATE, CTL_EOL);
1746 1.144 christos sysctl_createv(clog, 0, &node, NULL,
1747 1.144 christos CTLFLAG_PERMANENT | CTLFLAG_READWRITE,
1748 1.144 christos CTLTYPE_STRUCT, "components",
1749 1.144 christos SYSCTL_DESCR("Information about CCD components"),
1750 1.144 christos ccd_components_sysctl, 0, NULL, 0,
1751 1.144 christos CTL_CREATE, CTL_EOL);
1752 1.144 christos }
1753