ccd.c revision 1.135 1 1.135 uebayasi /* $NetBSD: ccd.c,v 1.135 2010/11/14 03:49:52 uebayasi Exp $ */
2 1.11 thorpej
3 1.28 thorpej /*-
4 1.133 ad * Copyright (c) 1996, 1997, 1998, 1999, 2007, 2009 The NetBSD Foundation, Inc.
5 1.11 thorpej * All rights reserved.
6 1.11 thorpej *
7 1.28 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.133 ad * by Jason R. Thorpe, and by Andrew Doran.
9 1.28 thorpej *
10 1.11 thorpej * Redistribution and use in source and binary forms, with or without
11 1.11 thorpej * modification, are permitted provided that the following conditions
12 1.11 thorpej * are met:
13 1.11 thorpej * 1. Redistributions of source code must retain the above copyright
14 1.11 thorpej * notice, this list of conditions and the following disclaimer.
15 1.11 thorpej * 2. Redistributions in binary form must reproduce the above copyright
16 1.11 thorpej * notice, this list of conditions and the following disclaimer in the
17 1.11 thorpej * documentation and/or other materials provided with the distribution.
18 1.11 thorpej *
19 1.28 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.28 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.28 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.45 jtc * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.45 jtc * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.28 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.28 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.28 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.28 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.28 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.28 thorpej * POSSIBILITY OF SUCH DAMAGE.
30 1.11 thorpej */
31 1.2 cgd
32 1.1 hpeyerl /*
33 1.3 hpeyerl * Copyright (c) 1990, 1993
34 1.3 hpeyerl * The Regents of the University of California. All rights reserved.
35 1.1 hpeyerl *
36 1.1 hpeyerl * This code is derived from software contributed to Berkeley by
37 1.1 hpeyerl * the Systems Programming Group of the University of Utah Computer
38 1.1 hpeyerl * Science Department.
39 1.1 hpeyerl *
40 1.1 hpeyerl * Redistribution and use in source and binary forms, with or without
41 1.1 hpeyerl * modification, are permitted provided that the following conditions
42 1.1 hpeyerl * are met:
43 1.1 hpeyerl * 1. Redistributions of source code must retain the above copyright
44 1.1 hpeyerl * notice, this list of conditions and the following disclaimer.
45 1.1 hpeyerl * 2. Redistributions in binary form must reproduce the above copyright
46 1.1 hpeyerl * notice, this list of conditions and the following disclaimer in the
47 1.1 hpeyerl * documentation and/or other materials provided with the distribution.
48 1.91 agc * 3. Neither the name of the University nor the names of its contributors
49 1.91 agc * may be used to endorse or promote products derived from this software
50 1.91 agc * without specific prior written permission.
51 1.91 agc *
52 1.91 agc * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 1.91 agc * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 1.91 agc * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 1.91 agc * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 1.91 agc * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 1.91 agc * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 1.91 agc * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 1.91 agc * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 1.91 agc * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 1.91 agc * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 1.91 agc * SUCH DAMAGE.
63 1.91 agc *
64 1.91 agc * from: Utah $Hdr: cd.c 1.6 90/11/28$
65 1.91 agc *
66 1.91 agc * @(#)cd.c 8.2 (Berkeley) 11/16/93
67 1.91 agc */
68 1.91 agc
69 1.91 agc /*
70 1.91 agc * Copyright (c) 1988 University of Utah.
71 1.91 agc *
72 1.91 agc * This code is derived from software contributed to Berkeley by
73 1.91 agc * the Systems Programming Group of the University of Utah Computer
74 1.91 agc * Science Department.
75 1.91 agc *
76 1.91 agc * Redistribution and use in source and binary forms, with or without
77 1.91 agc * modification, are permitted provided that the following conditions
78 1.91 agc * are met:
79 1.91 agc * 1. Redistributions of source code must retain the above copyright
80 1.91 agc * notice, this list of conditions and the following disclaimer.
81 1.91 agc * 2. Redistributions in binary form must reproduce the above copyright
82 1.91 agc * notice, this list of conditions and the following disclaimer in the
83 1.91 agc * documentation and/or other materials provided with the distribution.
84 1.1 hpeyerl * 3. All advertising materials mentioning features or use of this software
85 1.1 hpeyerl * must display the following acknowledgement:
86 1.1 hpeyerl * This product includes software developed by the University of
87 1.1 hpeyerl * California, Berkeley and its contributors.
88 1.1 hpeyerl * 4. Neither the name of the University nor the names of its contributors
89 1.1 hpeyerl * may be used to endorse or promote products derived from this software
90 1.1 hpeyerl * without specific prior written permission.
91 1.1 hpeyerl *
92 1.1 hpeyerl * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
93 1.1 hpeyerl * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
94 1.1 hpeyerl * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
95 1.1 hpeyerl * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
96 1.1 hpeyerl * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
97 1.1 hpeyerl * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
98 1.1 hpeyerl * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
99 1.1 hpeyerl * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
100 1.1 hpeyerl * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
101 1.1 hpeyerl * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
102 1.1 hpeyerl * SUCH DAMAGE.
103 1.1 hpeyerl *
104 1.2 cgd * from: Utah $Hdr: cd.c 1.6 90/11/28$
105 1.2 cgd *
106 1.3 hpeyerl * @(#)cd.c 8.2 (Berkeley) 11/16/93
107 1.1 hpeyerl */
108 1.1 hpeyerl
109 1.1 hpeyerl /*
110 1.1 hpeyerl * "Concatenated" disk driver.
111 1.11 thorpej *
112 1.133 ad * Notes on concurrency:
113 1.133 ad *
114 1.133 ad * => sc_dvlock serializes access to the device nodes, excluding block I/O.
115 1.133 ad *
116 1.133 ad * => sc_iolock serializes access to (sc_flags & CCDF_INITED), disk stats,
117 1.133 ad * sc_stop, sc_bufq and b_resid from master buffers.
118 1.133 ad *
119 1.133 ad * => a combination of CCDF_INITED, sc_inflight, and sc_iolock is used to
120 1.133 ad * serialize I/O and configuration changes.
121 1.133 ad *
122 1.133 ad * => the in-core disk label does not change while the device is open.
123 1.133 ad *
124 1.133 ad * On memory consumption: ccd fans out I/O requests and so needs to
125 1.133 ad * allocate memory. If the system is desperately low on memory, we
126 1.133 ad * single thread I/O.
127 1.1 hpeyerl */
128 1.74 lukem
129 1.74 lukem #include <sys/cdefs.h>
130 1.135 uebayasi __KERNEL_RCSID(0, "$NetBSD: ccd.c,v 1.135 2010/11/14 03:49:52 uebayasi Exp $");
131 1.1 hpeyerl
132 1.1 hpeyerl #include <sys/param.h>
133 1.1 hpeyerl #include <sys/systm.h>
134 1.133 ad #include <sys/kernel.h>
135 1.3 hpeyerl #include <sys/proc.h>
136 1.1 hpeyerl #include <sys/errno.h>
137 1.1 hpeyerl #include <sys/buf.h>
138 1.133 ad #include <sys/kmem.h>
139 1.63 thorpej #include <sys/pool.h>
140 1.11 thorpej #include <sys/namei.h>
141 1.3 hpeyerl #include <sys/stat.h>
142 1.3 hpeyerl #include <sys/ioctl.h>
143 1.3 hpeyerl #include <sys/disklabel.h>
144 1.11 thorpej #include <sys/device.h>
145 1.11 thorpej #include <sys/disk.h>
146 1.11 thorpej #include <sys/syslog.h>
147 1.3 hpeyerl #include <sys/fcntl.h>
148 1.11 thorpej #include <sys/vnode.h>
149 1.31 christos #include <sys/conf.h>
150 1.117 ad #include <sys/mutex.h>
151 1.56 thorpej #include <sys/queue.h>
152 1.110 elad #include <sys/kauth.h>
153 1.133 ad #include <sys/kthread.h>
154 1.133 ad #include <sys/bufq.h>
155 1.1 hpeyerl
156 1.135 uebayasi #include <uvm/uvm_extern.h>
157 1.135 uebayasi
158 1.1 hpeyerl #include <dev/ccdvar.h>
159 1.113 christos #include <dev/dkvar.h>
160 1.1 hpeyerl
/* Building with CCDDEBUG implies the generic DEBUG code paths as well. */
#if defined(CCDDEBUG) && !defined(DEBUG)
#define	DEBUG
#endif

#ifdef DEBUG
/* Bit flags tested against ccddebug to enable diagnostic output. */
#define	CCDB_FOLLOW	0x01
#define	CCDB_INIT	0x02
#define	CCDB_IO		0x04
#define	CCDB_LABEL	0x08
#define	CCDB_VNODE	0x10
int	ccddebug = 0x00;	/* all diagnostics off by default */
#endif
173 1.1 hpeyerl
/* Unit number of a ccd dev_t; a thin alias for DISKUNIT(). */
#define	ccdunit(dev)	DISKUNIT(dev)
175 1.6 cgd
176 1.6 cgd struct ccdbuf {
177 1.6 cgd struct buf cb_buf; /* new I/O buf */
178 1.6 cgd struct buf *cb_obp; /* ptr. to original I/O buf */
179 1.59 thorpej struct ccd_softc *cb_sc; /* pointer to ccd softc */
180 1.6 cgd int cb_comp; /* target component */
181 1.56 thorpej SIMPLEQ_ENTRY(ccdbuf) cb_q; /* fifo of component buffers */
182 1.38 thorpej };
183 1.24 thorpej
184 1.63 thorpej /* component buffer pool */
185 1.133 ad static pool_cache_t ccd_cache;
186 1.63 thorpej
187 1.133 ad #define CCD_GETBUF() pool_cache_get(ccd_cache, PR_WAITOK)
188 1.133 ad #define CCD_PUTBUF(cbp) pool_cache_put(ccd_cache, cbp)
189 1.1 hpeyerl
190 1.11 thorpej #define CCDLABELDEV(dev) \
191 1.11 thorpej (MAKEDISKDEV(major((dev)), ccdunit((dev)), RAW_PART))
192 1.1 hpeyerl
193 1.11 thorpej /* called by main() at boot time */
194 1.97 thorpej void ccdattach(int);
195 1.11 thorpej
196 1.11 thorpej /* called by biodone() at interrupt time */
197 1.97 thorpej static void ccdiodone(struct buf *);
198 1.11 thorpej
199 1.97 thorpej static void ccdinterleave(struct ccd_softc *);
200 1.97 thorpej static int ccdinit(struct ccd_softc *, char **, struct vnode **,
201 1.107 christos struct lwp *);
202 1.97 thorpej static struct ccdbuf *ccdbuffer(struct ccd_softc *, struct buf *,
203 1.118 christos daddr_t, void *, long);
204 1.97 thorpej static void ccdgetdefaultlabel(struct ccd_softc *, struct disklabel *);
205 1.97 thorpej static void ccdgetdisklabel(dev_t);
206 1.97 thorpej static void ccdmakedisklabel(struct ccd_softc *);
207 1.133 ad static void ccdstart(struct ccd_softc *);
208 1.133 ad static void ccdthread(void *);
209 1.97 thorpej
210 1.97 thorpej static dev_type_open(ccdopen);
211 1.97 thorpej static dev_type_close(ccdclose);
212 1.97 thorpej static dev_type_read(ccdread);
213 1.97 thorpej static dev_type_write(ccdwrite);
214 1.97 thorpej static dev_type_ioctl(ccdioctl);
215 1.97 thorpej static dev_type_strategy(ccdstrategy);
216 1.97 thorpej static dev_type_size(ccdsize);
217 1.78 gehenna
218 1.78 gehenna const struct bdevsw ccd_bdevsw = {
219 1.133 ad .d_open = ccdopen,
220 1.133 ad .d_close = ccdclose,
221 1.133 ad .d_strategy = ccdstrategy,
222 1.133 ad .d_ioctl = ccdioctl,
223 1.133 ad .d_dump = nodump,
224 1.133 ad .d_psize = ccdsize,
225 1.133 ad .d_flag = D_DISK | D_MPSAFE
226 1.78 gehenna };
227 1.78 gehenna
228 1.78 gehenna const struct cdevsw ccd_cdevsw = {
229 1.133 ad .d_open = ccdopen,
230 1.133 ad .d_close = ccdclose,
231 1.133 ad .d_read = ccdread,
232 1.133 ad .d_write = ccdwrite,
233 1.133 ad .d_ioctl = ccdioctl,
234 1.133 ad .d_stop = nostop,
235 1.133 ad .d_tty = notty,
236 1.133 ad .d_poll = nopoll,
237 1.133 ad .d_mmap = nommap,
238 1.133 ad .d_kqfilter = nokqfilter,
239 1.133 ad .d_flag = D_DISK | D_MPSAFE
240 1.78 gehenna };
241 1.3 hpeyerl
242 1.11 thorpej #ifdef DEBUG
243 1.97 thorpej static void printiinfo(struct ccdiinfo *);
244 1.11 thorpej #endif
245 1.11 thorpej
246 1.108 lukem /* Publically visible for the benefit of libkvm and ccdconfig(8). */
247 1.108 lukem struct ccd_softc *ccd_softc;
248 1.108 lukem const int ccd_softc_elemsize = sizeof(struct ccd_softc);
249 1.108 lukem int numccd = 0;
250 1.1 hpeyerl
251 1.3 hpeyerl /*
252 1.11 thorpej * Called by main() during pseudo-device attachment. All we need
253 1.11 thorpej * to do is allocate enough space for devices to be configured later.
254 1.1 hpeyerl */
255 1.1 hpeyerl void
256 1.97 thorpej ccdattach(int num)
257 1.3 hpeyerl {
258 1.57 thorpej struct ccd_softc *cs;
259 1.57 thorpej int i;
260 1.57 thorpej
261 1.11 thorpej if (num <= 0) {
262 1.11 thorpej #ifdef DIAGNOSTIC
263 1.11 thorpej panic("ccdattach: count <= 0");
264 1.11 thorpej #endif
265 1.3 hpeyerl return;
266 1.11 thorpej }
267 1.11 thorpej
268 1.133 ad ccd_softc = kmem_zalloc(num * ccd_softc_elemsize, KM_SLEEP);
269 1.57 thorpej if (ccd_softc == NULL) {
270 1.35 christos printf("WARNING: no memory for concatenated disks\n");
271 1.3 hpeyerl return;
272 1.3 hpeyerl }
273 1.3 hpeyerl numccd = num;
274 1.57 thorpej
275 1.63 thorpej /* Initialize the component buffer pool. */
276 1.133 ad ccd_cache = pool_cache_init(sizeof(struct ccdbuf), 0,
277 1.133 ad 0, 0, "ccdbuf", NULL, IPL_BIO, NULL, NULL, NULL);
278 1.63 thorpej
279 1.57 thorpej /* Initialize per-softc structures. */
280 1.57 thorpej for (i = 0; i < num; i++) {
281 1.57 thorpej cs = &ccd_softc[i];
282 1.96 itojun snprintf(cs->sc_xname, sizeof(cs->sc_xname), "ccd%d", i);
283 1.133 ad mutex_init(&cs->sc_dvlock, MUTEX_DEFAULT, IPL_NONE);
284 1.133 ad cs->sc_iolock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NONE);
285 1.133 ad cv_init(&cs->sc_stop, "ccdstop");
286 1.133 ad cv_init(&cs->sc_push, "ccdthr");
287 1.123 ad disk_init(&cs->sc_dkdev, cs->sc_xname, NULL); /* XXX */
288 1.57 thorpej }
289 1.1 hpeyerl }
290 1.1 hpeyerl
291 1.11 thorpej static int
292 1.97 thorpej ccdinit(struct ccd_softc *cs, char **cpaths, struct vnode **vpp,
293 1.107 christos struct lwp *l)
294 1.1 hpeyerl {
295 1.68 augustss struct ccdcinfo *ci = NULL;
296 1.68 augustss size_t size;
297 1.68 augustss int ix;
298 1.11 thorpej struct vattr va;
299 1.1 hpeyerl size_t minsize;
300 1.11 thorpej int maxsecsize;
301 1.7 cgd struct partinfo dpart;
302 1.11 thorpej struct ccdgeom *ccg = &cs->sc_geom;
303 1.111 christos char *tmppath;
304 1.67 enami int error, path_alloced;
305 1.1 hpeyerl
306 1.1 hpeyerl #ifdef DEBUG
307 1.3 hpeyerl if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
308 1.59 thorpej printf("%s: ccdinit\n", cs->sc_xname);
309 1.1 hpeyerl #endif
310 1.11 thorpej
311 1.11 thorpej /* Allocate space for the component info. */
312 1.133 ad cs->sc_cinfo = kmem_alloc(cs->sc_nccdisks * sizeof(*cs->sc_cinfo),
313 1.133 ad KM_SLEEP);
314 1.133 ad tmppath = kmem_alloc(MAXPATHLEN, KM_SLEEP);
315 1.111 christos
316 1.57 thorpej cs->sc_size = 0;
317 1.57 thorpej
318 1.1 hpeyerl /*
319 1.1 hpeyerl * Verify that each component piece exists and record
320 1.1 hpeyerl * relevant information about it.
321 1.1 hpeyerl */
322 1.11 thorpej maxsecsize = 0;
323 1.1 hpeyerl minsize = 0;
324 1.67 enami for (ix = 0, path_alloced = 0; ix < cs->sc_nccdisks; ix++) {
325 1.1 hpeyerl ci = &cs->sc_cinfo[ix];
326 1.57 thorpej ci->ci_vp = vpp[ix];
327 1.11 thorpej
328 1.11 thorpej /*
329 1.11 thorpej * Copy in the pathname of the component.
330 1.11 thorpej */
331 1.72 thorpej memset(tmppath, 0, sizeof(tmppath)); /* sanity */
332 1.29 christos error = copyinstr(cpaths[ix], tmppath,
333 1.29 christos MAXPATHLEN, &ci->ci_pathlen);
334 1.133 ad if (ci->ci_pathlen == 0)
335 1.133 ad error = EINVAL;
336 1.29 christos if (error) {
337 1.11 thorpej #ifdef DEBUG
338 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
339 1.35 christos printf("%s: can't copy path, error = %d\n",
340 1.23 thorpej cs->sc_xname, error);
341 1.11 thorpej #endif
342 1.67 enami goto out;
343 1.11 thorpej }
344 1.133 ad ci->ci_path = kmem_alloc(ci->ci_pathlen, KM_SLEEP);
345 1.72 thorpej memcpy(ci->ci_path, tmppath, ci->ci_pathlen);
346 1.67 enami path_alloced++;
347 1.11 thorpej
348 1.11 thorpej /*
349 1.11 thorpej * XXX: Cache the component's dev_t.
350 1.11 thorpej */
351 1.124 pooka if ((error = VOP_GETATTR(vpp[ix], &va, l->l_cred)) != 0) {
352 1.11 thorpej #ifdef DEBUG
353 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
354 1.35 christos printf("%s: %s: getattr failed %s = %d\n",
355 1.23 thorpej cs->sc_xname, ci->ci_path,
356 1.11 thorpej "error", error);
357 1.11 thorpej #endif
358 1.67 enami goto out;
359 1.11 thorpej }
360 1.11 thorpej ci->ci_dev = va.va_rdev;
361 1.11 thorpej
362 1.3 hpeyerl /*
363 1.11 thorpej * Get partition information for the component.
364 1.3 hpeyerl */
365 1.84 dsl error = VOP_IOCTL(vpp[ix], DIOCGPART, &dpart,
366 1.124 pooka FREAD, l->l_cred);
367 1.29 christos if (error) {
368 1.11 thorpej #ifdef DEBUG
369 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
370 1.35 christos printf("%s: %s: ioctl failed, error = %d\n",
371 1.23 thorpej cs->sc_xname, ci->ci_path, error);
372 1.11 thorpej #endif
373 1.67 enami goto out;
374 1.11 thorpej }
375 1.69 enami
376 1.69 enami /*
377 1.69 enami * This diagnostic test is disabled (for now?) since not all port supports
378 1.69 enami * on-disk BSD disklabel.
379 1.69 enami */
380 1.69 enami #if 0 /* def DIAGNOSTIC */
381 1.69 enami /* Check fstype field of component. */
382 1.69 enami if (dpart.part->p_fstype != FS_CCD)
383 1.69 enami printf("%s: WARNING: %s: fstype %d != FS_CCD\n",
384 1.69 enami cs->sc_xname, ci->ci_path, dpart.part->p_fstype);
385 1.69 enami #endif
386 1.7 cgd
387 1.11 thorpej /*
388 1.11 thorpej * Calculate the size, truncating to an interleave
389 1.11 thorpej * boundary if necessary.
390 1.11 thorpej */
391 1.46 thorpej maxsecsize =
392 1.46 thorpej ((dpart.disklab->d_secsize > maxsecsize) ?
393 1.46 thorpej dpart.disklab->d_secsize : maxsecsize);
394 1.46 thorpej size = dpart.part->p_size;
395 1.1 hpeyerl if (cs->sc_ileave > 1)
396 1.1 hpeyerl size -= size % cs->sc_ileave;
397 1.11 thorpej
398 1.1 hpeyerl if (size == 0) {
399 1.11 thorpej #ifdef DEBUG
400 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
401 1.35 christos printf("%s: %s: size == 0\n",
402 1.23 thorpej cs->sc_xname, ci->ci_path);
403 1.11 thorpej #endif
404 1.67 enami error = ENODEV;
405 1.67 enami goto out;
406 1.3 hpeyerl }
407 1.11 thorpej
408 1.1 hpeyerl if (minsize == 0 || size < minsize)
409 1.1 hpeyerl minsize = size;
410 1.1 hpeyerl ci->ci_size = size;
411 1.1 hpeyerl cs->sc_size += size;
412 1.1 hpeyerl }
413 1.11 thorpej
414 1.11 thorpej /*
415 1.11 thorpej * Don't allow the interleave to be smaller than
416 1.11 thorpej * the biggest component sector.
417 1.11 thorpej */
418 1.11 thorpej if ((cs->sc_ileave > 0) &&
419 1.11 thorpej (cs->sc_ileave < (maxsecsize / DEV_BSIZE))) {
420 1.11 thorpej #ifdef DEBUG
421 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
422 1.35 christos printf("%s: interleave must be at least %d\n",
423 1.23 thorpej cs->sc_xname, (maxsecsize / DEV_BSIZE));
424 1.11 thorpej #endif
425 1.67 enami error = EINVAL;
426 1.67 enami goto out;
427 1.11 thorpej }
428 1.11 thorpej
429 1.1 hpeyerl /*
430 1.1 hpeyerl * If uniform interleave is desired set all sizes to that of
431 1.1 hpeyerl * the smallest component.
432 1.1 hpeyerl */
433 1.57 thorpej if (cs->sc_flags & CCDF_UNIFORM) {
434 1.1 hpeyerl for (ci = cs->sc_cinfo;
435 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
436 1.1 hpeyerl ci->ci_size = minsize;
437 1.24 thorpej
438 1.53 thorpej cs->sc_size = cs->sc_nccdisks * minsize;
439 1.1 hpeyerl }
440 1.11 thorpej
441 1.11 thorpej /*
442 1.11 thorpej * Construct the interleave table.
443 1.11 thorpej */
444 1.57 thorpej ccdinterleave(cs);
445 1.11 thorpej
446 1.1 hpeyerl /*
447 1.11 thorpej * Create pseudo-geometry based on 1MB cylinders. It's
448 1.11 thorpej * pretty close.
449 1.1 hpeyerl */
450 1.11 thorpej ccg->ccg_secsize = DEV_BSIZE;
451 1.19 thorpej ccg->ccg_ntracks = 1;
452 1.11 thorpej ccg->ccg_nsectors = 1024 * (1024 / ccg->ccg_secsize);
453 1.11 thorpej ccg->ccg_ncylinders = cs->sc_size / ccg->ccg_nsectors;
454 1.11 thorpej
455 1.133 ad /*
456 1.133 ad * Create thread to handle deferred I/O.
457 1.133 ad */
458 1.133 ad cs->sc_zap = false;
459 1.133 ad error = kthread_create(PRI_BIO, KTHREAD_MPSAFE, NULL, ccdthread,
460 1.133 ad cs, &cs->sc_thread, "%s", cs->sc_xname);
461 1.133 ad if (error) {
462 1.133 ad printf("ccdinit: can't create thread: %d\n", error);
463 1.133 ad goto out;
464 1.133 ad }
465 1.133 ad
466 1.133 ad /*
467 1.133 ad * Only now that everything is set up can we enable the device.
468 1.133 ad */
469 1.133 ad mutex_enter(cs->sc_iolock);
470 1.11 thorpej cs->sc_flags |= CCDF_INITED;
471 1.133 ad mutex_exit(cs->sc_iolock);
472 1.133 ad kmem_free(tmppath, MAXPATHLEN);
473 1.11 thorpej return (0);
474 1.67 enami
475 1.67 enami out:
476 1.133 ad for (ix = 0; ix < path_alloced; ix++) {
477 1.133 ad kmem_free(cs->sc_cinfo[ix].ci_path,
478 1.133 ad cs->sc_cinfo[ix].ci_pathlen);
479 1.133 ad }
480 1.133 ad kmem_free(cs->sc_cinfo, cs->sc_nccdisks * sizeof(struct ccdcinfo));
481 1.133 ad kmem_free(tmppath, MAXPATHLEN);
482 1.67 enami return (error);
483 1.1 hpeyerl }
484 1.1 hpeyerl
485 1.11 thorpej static void
486 1.97 thorpej ccdinterleave(struct ccd_softc *cs)
487 1.1 hpeyerl {
488 1.68 augustss struct ccdcinfo *ci, *smallci;
489 1.68 augustss struct ccdiinfo *ii;
490 1.68 augustss daddr_t bn, lbn;
491 1.68 augustss int ix;
492 1.1 hpeyerl u_long size;
493 1.1 hpeyerl
494 1.1 hpeyerl #ifdef DEBUG
495 1.3 hpeyerl if (ccddebug & CCDB_INIT)
496 1.35 christos printf("ccdinterleave(%p): ileave %d\n", cs, cs->sc_ileave);
497 1.1 hpeyerl #endif
498 1.1 hpeyerl /*
499 1.1 hpeyerl * Allocate an interleave table.
500 1.1 hpeyerl * Chances are this is too big, but we don't care.
501 1.1 hpeyerl */
502 1.1 hpeyerl size = (cs->sc_nccdisks + 1) * sizeof(struct ccdiinfo);
503 1.133 ad cs->sc_itable = kmem_zalloc(size, KM_SLEEP);
504 1.11 thorpej
505 1.1 hpeyerl /*
506 1.1 hpeyerl * Trivial case: no interleave (actually interleave of disk size).
507 1.11 thorpej * Each table entry represents a single component in its entirety.
508 1.1 hpeyerl */
509 1.1 hpeyerl if (cs->sc_ileave == 0) {
510 1.1 hpeyerl bn = 0;
511 1.1 hpeyerl ii = cs->sc_itable;
512 1.11 thorpej
513 1.1 hpeyerl for (ix = 0; ix < cs->sc_nccdisks; ix++) {
514 1.19 thorpej /* Allocate space for ii_index. */
515 1.133 ad ii->ii_indexsz = sizeof(int);
516 1.133 ad ii->ii_index = kmem_alloc(ii->ii_indexsz, KM_SLEEP);
517 1.1 hpeyerl ii->ii_ndisk = 1;
518 1.1 hpeyerl ii->ii_startblk = bn;
519 1.1 hpeyerl ii->ii_startoff = 0;
520 1.1 hpeyerl ii->ii_index[0] = ix;
521 1.1 hpeyerl bn += cs->sc_cinfo[ix].ci_size;
522 1.1 hpeyerl ii++;
523 1.1 hpeyerl }
524 1.1 hpeyerl ii->ii_ndisk = 0;
525 1.1 hpeyerl #ifdef DEBUG
526 1.3 hpeyerl if (ccddebug & CCDB_INIT)
527 1.1 hpeyerl printiinfo(cs->sc_itable);
528 1.1 hpeyerl #endif
529 1.11 thorpej return;
530 1.1 hpeyerl }
531 1.11 thorpej
532 1.1 hpeyerl /*
533 1.1 hpeyerl * The following isn't fast or pretty; it doesn't have to be.
534 1.1 hpeyerl */
535 1.1 hpeyerl size = 0;
536 1.1 hpeyerl bn = lbn = 0;
537 1.1 hpeyerl for (ii = cs->sc_itable; ; ii++) {
538 1.11 thorpej /* Allocate space for ii_index. */
539 1.133 ad ii->ii_indexsz = sizeof(int) * cs->sc_nccdisks;
540 1.133 ad ii->ii_index = kmem_alloc(ii->ii_indexsz, KM_SLEEP);
541 1.11 thorpej
542 1.1 hpeyerl /*
543 1.1 hpeyerl * Locate the smallest of the remaining components
544 1.1 hpeyerl */
545 1.1 hpeyerl smallci = NULL;
546 1.1 hpeyerl for (ci = cs->sc_cinfo;
547 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
548 1.1 hpeyerl if (ci->ci_size > size &&
549 1.1 hpeyerl (smallci == NULL ||
550 1.1 hpeyerl ci->ci_size < smallci->ci_size))
551 1.1 hpeyerl smallci = ci;
552 1.11 thorpej
553 1.1 hpeyerl /*
554 1.1 hpeyerl * Nobody left, all done
555 1.1 hpeyerl */
556 1.1 hpeyerl if (smallci == NULL) {
557 1.1 hpeyerl ii->ii_ndisk = 0;
558 1.1 hpeyerl break;
559 1.1 hpeyerl }
560 1.11 thorpej
561 1.1 hpeyerl /*
562 1.1 hpeyerl * Record starting logical block and component offset
563 1.1 hpeyerl */
564 1.1 hpeyerl ii->ii_startblk = bn / cs->sc_ileave;
565 1.1 hpeyerl ii->ii_startoff = lbn;
566 1.11 thorpej
567 1.1 hpeyerl /*
568 1.1 hpeyerl * Determine how many disks take part in this interleave
569 1.1 hpeyerl * and record their indices.
570 1.1 hpeyerl */
571 1.1 hpeyerl ix = 0;
572 1.1 hpeyerl for (ci = cs->sc_cinfo;
573 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
574 1.1 hpeyerl if (ci->ci_size >= smallci->ci_size)
575 1.1 hpeyerl ii->ii_index[ix++] = ci - cs->sc_cinfo;
576 1.1 hpeyerl ii->ii_ndisk = ix;
577 1.1 hpeyerl bn += ix * (smallci->ci_size - size);
578 1.1 hpeyerl lbn = smallci->ci_size / cs->sc_ileave;
579 1.1 hpeyerl size = smallci->ci_size;
580 1.1 hpeyerl }
581 1.1 hpeyerl #ifdef DEBUG
582 1.3 hpeyerl if (ccddebug & CCDB_INIT)
583 1.1 hpeyerl printiinfo(cs->sc_itable);
584 1.1 hpeyerl #endif
585 1.1 hpeyerl }
586 1.1 hpeyerl
587 1.11 thorpej /* ARGSUSED */
588 1.97 thorpej static int
589 1.116 christos ccdopen(dev_t dev, int flags, int fmt, struct lwp *l)
590 1.1 hpeyerl {
591 1.1 hpeyerl int unit = ccdunit(dev);
592 1.11 thorpej struct ccd_softc *cs;
593 1.11 thorpej struct disklabel *lp;
594 1.15 thorpej int error = 0, part, pmask;
595 1.1 hpeyerl
596 1.1 hpeyerl #ifdef DEBUG
597 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
598 1.131 cegger printf("ccdopen(0x%"PRIx64", 0x%x)\n", dev, flags);
599 1.1 hpeyerl #endif
600 1.11 thorpej if (unit >= numccd)
601 1.11 thorpej return (ENXIO);
602 1.11 thorpej cs = &ccd_softc[unit];
603 1.15 thorpej
604 1.133 ad mutex_enter(&cs->sc_dvlock);
605 1.15 thorpej
606 1.23 thorpej lp = cs->sc_dkdev.dk_label;
607 1.11 thorpej
608 1.11 thorpej part = DISKPART(dev);
609 1.11 thorpej pmask = (1 << part);
610 1.11 thorpej
611 1.15 thorpej /*
612 1.15 thorpej * If we're initialized, check to see if there are any other
613 1.15 thorpej * open partitions. If not, then it's safe to update
614 1.87 thorpej * the in-core disklabel. Only read the disklabel if it is
615 1.87 thorpej * not already valid.
616 1.15 thorpej */
617 1.87 thorpej if ((cs->sc_flags & (CCDF_INITED|CCDF_VLABEL)) == CCDF_INITED &&
618 1.87 thorpej cs->sc_dkdev.dk_openmask == 0)
619 1.15 thorpej ccdgetdisklabel(dev);
620 1.15 thorpej
621 1.11 thorpej /* Check that the partition exists. */
622 1.27 thorpej if (part != RAW_PART) {
623 1.27 thorpej if (((cs->sc_flags & CCDF_INITED) == 0) ||
624 1.37 thorpej ((part >= lp->d_npartitions) ||
625 1.27 thorpej (lp->d_partitions[part].p_fstype == FS_UNUSED))) {
626 1.27 thorpej error = ENXIO;
627 1.27 thorpej goto done;
628 1.27 thorpej }
629 1.15 thorpej }
630 1.11 thorpej
631 1.11 thorpej /* Prevent our unit from being unconfigured while open. */
632 1.11 thorpej switch (fmt) {
633 1.11 thorpej case S_IFCHR:
634 1.11 thorpej cs->sc_dkdev.dk_copenmask |= pmask;
635 1.11 thorpej break;
636 1.11 thorpej
637 1.11 thorpej case S_IFBLK:
638 1.11 thorpej cs->sc_dkdev.dk_bopenmask |= pmask;
639 1.11 thorpej break;
640 1.11 thorpej }
641 1.11 thorpej cs->sc_dkdev.dk_openmask =
642 1.11 thorpej cs->sc_dkdev.dk_copenmask | cs->sc_dkdev.dk_bopenmask;
643 1.11 thorpej
644 1.15 thorpej done:
645 1.133 ad mutex_exit(&cs->sc_dvlock);
646 1.33 thorpej return (error);
647 1.7 cgd }
648 1.7 cgd
649 1.11 thorpej /* ARGSUSED */
650 1.97 thorpej static int
651 1.116 christos ccdclose(dev_t dev, int flags, int fmt, struct lwp *l)
652 1.7 cgd {
653 1.11 thorpej int unit = ccdunit(dev);
654 1.11 thorpej struct ccd_softc *cs;
655 1.117 ad int part;
656 1.11 thorpej
657 1.7 cgd #ifdef DEBUG
658 1.7 cgd if (ccddebug & CCDB_FOLLOW)
659 1.131 cegger printf("ccdclose(0x%"PRIx64", 0x%x)\n", dev, flags);
660 1.7 cgd #endif
661 1.11 thorpej
662 1.11 thorpej if (unit >= numccd)
663 1.11 thorpej return (ENXIO);
664 1.11 thorpej cs = &ccd_softc[unit];
665 1.15 thorpej
666 1.133 ad mutex_enter(&cs->sc_dvlock);
667 1.15 thorpej
668 1.11 thorpej part = DISKPART(dev);
669 1.11 thorpej
670 1.11 thorpej /* ...that much closer to allowing unconfiguration... */
671 1.11 thorpej switch (fmt) {
672 1.11 thorpej case S_IFCHR:
673 1.11 thorpej cs->sc_dkdev.dk_copenmask &= ~(1 << part);
674 1.11 thorpej break;
675 1.11 thorpej
676 1.11 thorpej case S_IFBLK:
677 1.11 thorpej cs->sc_dkdev.dk_bopenmask &= ~(1 << part);
678 1.11 thorpej break;
679 1.11 thorpej }
680 1.11 thorpej cs->sc_dkdev.dk_openmask =
681 1.11 thorpej cs->sc_dkdev.dk_copenmask | cs->sc_dkdev.dk_bopenmask;
682 1.11 thorpej
683 1.87 thorpej if (cs->sc_dkdev.dk_openmask == 0) {
684 1.87 thorpej if ((cs->sc_flags & CCDF_KLABEL) == 0)
685 1.87 thorpej cs->sc_flags &= ~CCDF_VLABEL;
686 1.87 thorpej }
687 1.87 thorpej
688 1.133 ad mutex_exit(&cs->sc_dvlock);
689 1.7 cgd return (0);
690 1.1 hpeyerl }
691 1.1 hpeyerl
692 1.133 ad static bool
693 1.133 ad ccdbackoff(struct ccd_softc *cs)
694 1.133 ad {
695 1.133 ad
696 1.133 ad /* XXX Arbitrary, should be a uvm call. */
697 1.133 ad return uvmexp.free < (uvmexp.freemin >> 1) &&
698 1.133 ad disk_isbusy(&cs->sc_dkdev);
699 1.133 ad }
700 1.133 ad
701 1.133 ad static void
702 1.133 ad ccdthread(void *cookie)
703 1.133 ad {
704 1.133 ad struct ccd_softc *cs;
705 1.133 ad
706 1.133 ad cs = cookie;
707 1.133 ad
708 1.133 ad #ifdef DEBUG
709 1.133 ad if (ccddebug & CCDB_FOLLOW)
710 1.133 ad printf("ccdthread: hello\n");
711 1.133 ad #endif
712 1.133 ad
713 1.133 ad mutex_enter(cs->sc_iolock);
714 1.133 ad while (__predict_true(!cs->sc_zap)) {
715 1.133 ad if (bufq_peek(cs->sc_bufq) == NULL) {
716 1.133 ad /* Nothing to do. */
717 1.133 ad cv_wait(&cs->sc_push, cs->sc_iolock);
718 1.133 ad continue;
719 1.133 ad }
720 1.133 ad if (ccdbackoff(cs)) {
721 1.133 ad /* Wait for memory to become available. */
722 1.133 ad (void)cv_timedwait(&cs->sc_push, cs->sc_iolock, 1);
723 1.133 ad continue;
724 1.133 ad }
725 1.133 ad #ifdef DEBUG
726 1.133 ad if (ccddebug & CCDB_FOLLOW)
727 1.133 ad printf("ccdthread: dispatching I/O\n");
728 1.133 ad #endif
729 1.133 ad ccdstart(cs);
730 1.133 ad mutex_enter(cs->sc_iolock);
731 1.133 ad }
732 1.133 ad cs->sc_thread = NULL;
733 1.133 ad mutex_exit(cs->sc_iolock);
734 1.133 ad #ifdef DEBUG
735 1.133 ad if (ccddebug & CCDB_FOLLOW)
736 1.133 ad printf("ccdthread: goodbye\n");
737 1.133 ad #endif
738 1.133 ad kthread_exit(0);
739 1.133 ad }
740 1.133 ad
741 1.97 thorpej static void
742 1.97 thorpej ccdstrategy(struct buf *bp)
743 1.1 hpeyerl {
744 1.68 augustss int unit = ccdunit(bp->b_dev);
745 1.68 augustss struct ccd_softc *cs = &ccd_softc[unit];
746 1.133 ad
747 1.133 ad /* Must be open or reading label. */
748 1.133 ad KASSERT(cs->sc_dkdev.dk_openmask != 0 ||
749 1.133 ad (cs->sc_flags & CCDF_RLABEL) != 0);
750 1.133 ad
751 1.133 ad mutex_enter(cs->sc_iolock);
752 1.133 ad /* Synchronize with device init/uninit. */
753 1.133 ad if (__predict_false((cs->sc_flags & CCDF_INITED) == 0)) {
754 1.133 ad mutex_exit(cs->sc_iolock);
755 1.133 ad #ifdef DEBUG
756 1.133 ad if (ccddebug & CCDB_FOLLOW)
757 1.133 ad printf("ccdstrategy: unit %d: not inited\n", unit);
758 1.133 ad #endif
759 1.133 ad bp->b_error = ENXIO;
760 1.133 ad bp->b_resid = bp->b_bcount;
761 1.133 ad biodone(bp);
762 1.133 ad return;
763 1.133 ad }
764 1.133 ad
765 1.133 ad /* Defer to thread if system is low on memory. */
766 1.133 ad bufq_put(cs->sc_bufq, bp);
767 1.133 ad if (__predict_false(ccdbackoff(cs))) {
768 1.133 ad mutex_exit(cs->sc_iolock);
769 1.133 ad #ifdef DEBUG
770 1.133 ad if (ccddebug & CCDB_FOLLOW)
771 1.133 ad printf("ccdstrategy: holding off on I/O\n");
772 1.133 ad #endif
773 1.133 ad return;
774 1.133 ad }
775 1.133 ad ccdstart(cs);
776 1.133 ad }
777 1.133 ad
778 1.133 ad static void
779 1.133 ad ccdstart(struct ccd_softc *cs)
780 1.133 ad {
781 1.88 thorpej daddr_t blkno;
782 1.11 thorpej int wlabel;
783 1.15 thorpej struct disklabel *lp;
784 1.133 ad long bcount, rcount;
785 1.133 ad struct ccdbuf *cbp;
786 1.133 ad char *addr;
787 1.133 ad daddr_t bn;
788 1.133 ad vnode_t *vp;
789 1.133 ad buf_t *bp;
790 1.133 ad
791 1.133 ad KASSERT(mutex_owned(cs->sc_iolock));
792 1.133 ad
793 1.133 ad disk_busy(&cs->sc_dkdev);
794 1.133 ad bp = bufq_get(cs->sc_bufq);
795 1.133 ad KASSERT(bp != NULL);
796 1.1 hpeyerl
797 1.1 hpeyerl #ifdef DEBUG
798 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
799 1.133 ad printf("ccdstart(%s, %p)\n", cs->sc_xname, bp);
800 1.59 thorpej #endif
801 1.11 thorpej
802 1.11 thorpej /* If it's a nil transfer, wake up the top half now. */
803 1.11 thorpej if (bp->b_bcount == 0)
804 1.11 thorpej goto done;
805 1.11 thorpej
806 1.23 thorpej lp = cs->sc_dkdev.dk_label;
807 1.15 thorpej
808 1.11 thorpej /*
809 1.17 thorpej * Do bounds checking and adjust transfer. If there's an
810 1.88 thorpej * error, the bounds check will flag that for us. Convert
811 1.88 thorpej * the partition relative block number to an absolute.
812 1.11 thorpej */
813 1.88 thorpej blkno = bp->b_blkno;
814 1.11 thorpej wlabel = cs->sc_flags & (CCDF_WLABEL|CCDF_LABELLING);
815 1.88 thorpej if (DISKPART(bp->b_dev) != RAW_PART) {
816 1.86 thorpej if (bounds_check_with_label(&cs->sc_dkdev, bp, wlabel) <= 0)
817 1.1 hpeyerl goto done;
818 1.88 thorpej blkno += lp->d_partitions[DISKPART(bp->b_dev)].p_offset;
819 1.88 thorpej }
820 1.133 ad mutex_exit(cs->sc_iolock);
821 1.88 thorpej bp->b_rawblkno = blkno;
822 1.11 thorpej
823 1.133 ad /* Allocate the component buffers and start I/O! */
824 1.133 ad bp->b_resid = bp->b_bcount;
825 1.133 ad bn = bp->b_rawblkno;
826 1.133 ad addr = bp->b_data;
827 1.133 ad for (bcount = bp->b_bcount; bcount > 0; bcount -= rcount) {
828 1.133 ad cbp = ccdbuffer(cs, bp, bn, addr, bcount);
829 1.133 ad rcount = cbp->cb_buf.b_bcount;
830 1.133 ad bn += btodb(rcount);
831 1.133 ad addr += rcount;
832 1.133 ad vp = cbp->cb_buf.b_vp;
833 1.133 ad if ((cbp->cb_buf.b_flags & B_READ) == 0) {
834 1.133 ad mutex_enter(&vp->v_interlock);
835 1.133 ad vp->v_numoutput++;
836 1.133 ad mutex_exit(&vp->v_interlock);
837 1.133 ad }
838 1.133 ad (void)VOP_STRATEGY(vp, &cbp->cb_buf);
839 1.133 ad }
840 1.1 hpeyerl return;
841 1.88 thorpej
842 1.88 thorpej done:
843 1.133 ad disk_unbusy(&cs->sc_dkdev, 0, 0);
844 1.133 ad cv_broadcast(&cs->sc_stop);
845 1.133 ad cv_broadcast(&cs->sc_push);
846 1.133 ad mutex_exit(cs->sc_iolock);
847 1.88 thorpej bp->b_resid = bp->b_bcount;
848 1.1 hpeyerl biodone(bp);
849 1.1 hpeyerl }
850 1.1 hpeyerl
851 1.1 hpeyerl /*
852 1.1 hpeyerl * Build a component buffer header.
853 1.1 hpeyerl */
854 1.55 thorpej static struct ccdbuf *
855 1.118 christos ccdbuffer(struct ccd_softc *cs, struct buf *bp, daddr_t bn, void *addr,
856 1.97 thorpej long bcount)
857 1.1 hpeyerl {
858 1.68 augustss struct ccdcinfo *ci;
859 1.68 augustss struct ccdbuf *cbp;
860 1.68 augustss daddr_t cbn, cboff;
861 1.68 augustss u_int64_t cbc;
862 1.36 thorpej int ccdisk;
863 1.1 hpeyerl
864 1.1 hpeyerl #ifdef DEBUG
865 1.3 hpeyerl if (ccddebug & CCDB_IO)
866 1.81 kleink printf("ccdbuffer(%p, %p, %" PRId64 ", %p, %ld)\n",
867 1.1 hpeyerl cs, bp, bn, addr, bcount);
868 1.1 hpeyerl #endif
869 1.1 hpeyerl /*
870 1.1 hpeyerl * Determine which component bn falls in.
871 1.1 hpeyerl */
872 1.1 hpeyerl cbn = bn;
873 1.1 hpeyerl cboff = 0;
874 1.11 thorpej
875 1.1 hpeyerl /*
876 1.1 hpeyerl * Serially concatenated
877 1.1 hpeyerl */
878 1.1 hpeyerl if (cs->sc_ileave == 0) {
879 1.68 augustss daddr_t sblk;
880 1.1 hpeyerl
881 1.1 hpeyerl sblk = 0;
882 1.36 thorpej for (ccdisk = 0, ci = &cs->sc_cinfo[ccdisk];
883 1.36 thorpej cbn >= sblk + ci->ci_size;
884 1.36 thorpej ccdisk++, ci = &cs->sc_cinfo[ccdisk])
885 1.1 hpeyerl sblk += ci->ci_size;
886 1.1 hpeyerl cbn -= sblk;
887 1.1 hpeyerl }
888 1.1 hpeyerl /*
889 1.1 hpeyerl * Interleaved
890 1.1 hpeyerl */
891 1.1 hpeyerl else {
892 1.68 augustss struct ccdiinfo *ii;
893 1.36 thorpej int off;
894 1.1 hpeyerl
895 1.1 hpeyerl cboff = cbn % cs->sc_ileave;
896 1.1 hpeyerl cbn /= cs->sc_ileave;
897 1.1 hpeyerl for (ii = cs->sc_itable; ii->ii_ndisk; ii++)
898 1.1 hpeyerl if (ii->ii_startblk > cbn)
899 1.1 hpeyerl break;
900 1.1 hpeyerl ii--;
901 1.1 hpeyerl off = cbn - ii->ii_startblk;
902 1.1 hpeyerl if (ii->ii_ndisk == 1) {
903 1.1 hpeyerl ccdisk = ii->ii_index[0];
904 1.1 hpeyerl cbn = ii->ii_startoff + off;
905 1.1 hpeyerl } else {
906 1.53 thorpej ccdisk = ii->ii_index[off % ii->ii_ndisk];
907 1.53 thorpej cbn = ii->ii_startoff + off / ii->ii_ndisk;
908 1.1 hpeyerl }
909 1.1 hpeyerl cbn *= cs->sc_ileave;
910 1.1 hpeyerl ci = &cs->sc_cinfo[ccdisk];
911 1.1 hpeyerl }
912 1.11 thorpej
913 1.1 hpeyerl /*
914 1.1 hpeyerl * Fill in the component buf structure.
915 1.1 hpeyerl */
916 1.63 thorpej cbp = CCD_GETBUF();
917 1.133 ad KASSERT(cbp != NULL);
918 1.126 ad buf_init(&cbp->cb_buf);
919 1.126 ad cbp->cb_buf.b_flags = bp->b_flags;
920 1.126 ad cbp->cb_buf.b_oflags = bp->b_oflags;
921 1.126 ad cbp->cb_buf.b_cflags = bp->b_cflags;
922 1.29 christos cbp->cb_buf.b_iodone = ccdiodone;
923 1.6 cgd cbp->cb_buf.b_proc = bp->b_proc;
924 1.95 hannken cbp->cb_buf.b_dev = ci->ci_dev;
925 1.6 cgd cbp->cb_buf.b_blkno = cbn + cboff;
926 1.6 cgd cbp->cb_buf.b_data = addr;
927 1.11 thorpej cbp->cb_buf.b_vp = ci->ci_vp;
928 1.127 hannken cbp->cb_buf.b_objlock = &ci->ci_vp->v_interlock;
929 1.1 hpeyerl if (cs->sc_ileave == 0)
930 1.50 thorpej cbc = dbtob((u_int64_t)(ci->ci_size - cbn));
931 1.1 hpeyerl else
932 1.50 thorpej cbc = dbtob((u_int64_t)(cs->sc_ileave - cboff));
933 1.50 thorpej cbp->cb_buf.b_bcount = cbc < bcount ? cbc : bcount;
934 1.6 cgd
935 1.1 hpeyerl /*
936 1.6 cgd * context for ccdiodone
937 1.1 hpeyerl */
938 1.6 cgd cbp->cb_obp = bp;
939 1.59 thorpej cbp->cb_sc = cs;
940 1.36 thorpej cbp->cb_comp = ccdisk;
941 1.6 cgd
942 1.94 yamt BIO_COPYPRIO(&cbp->cb_buf, bp);
943 1.94 yamt
944 1.1 hpeyerl #ifdef DEBUG
945 1.3 hpeyerl if (ccddebug & CCDB_IO)
946 1.131 cegger printf(" dev 0x%"PRIx64"(u%lu): cbp %p bn %" PRId64 " addr %p"
947 1.99 yamt " bcnt %d\n",
948 1.62 mjacob ci->ci_dev, (unsigned long) (ci-cs->sc_cinfo), cbp,
949 1.62 mjacob cbp->cb_buf.b_blkno, cbp->cb_buf.b_data,
950 1.62 mjacob cbp->cb_buf.b_bcount);
951 1.1 hpeyerl #endif
952 1.55 thorpej
953 1.55 thorpej return (cbp);
954 1.1 hpeyerl }
955 1.1 hpeyerl
956 1.1 hpeyerl /*
957 1.11 thorpej * Called at interrupt time.
958 1.1 hpeyerl * Mark the component as done and if all components are done,
959 1.1 hpeyerl * take a ccd interrupt.
960 1.1 hpeyerl */
961 1.97 thorpej static void
962 1.97 thorpej ccdiodone(struct buf *vbp)
963 1.1 hpeyerl {
964 1.29 christos struct ccdbuf *cbp = (struct ccdbuf *) vbp;
965 1.59 thorpej struct buf *bp = cbp->cb_obp;
966 1.59 thorpej struct ccd_softc *cs = cbp->cb_sc;
967 1.133 ad int count;
968 1.1 hpeyerl
969 1.1 hpeyerl #ifdef DEBUG
970 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
971 1.35 christos printf("ccdiodone(%p)\n", cbp);
972 1.3 hpeyerl if (ccddebug & CCDB_IO) {
973 1.99 yamt printf("ccdiodone: bp %p bcount %d resid %d\n",
974 1.53 thorpej bp, bp->b_bcount, bp->b_resid);
975 1.131 cegger printf(" dev 0x%"PRIx64"(u%d), cbp %p bn %" PRId64 " addr %p"
976 1.99 yamt " bcnt %d\n",
977 1.6 cgd cbp->cb_buf.b_dev, cbp->cb_comp, cbp,
978 1.6 cgd cbp->cb_buf.b_blkno, cbp->cb_buf.b_data,
979 1.6 cgd cbp->cb_buf.b_bcount);
980 1.1 hpeyerl }
981 1.1 hpeyerl #endif
982 1.1 hpeyerl
983 1.122 ad if (cbp->cb_buf.b_error != 0) {
984 1.122 ad bp->b_error = cbp->cb_buf.b_error;
985 1.53 thorpej printf("%s: error %d on component %d\n",
986 1.53 thorpej cs->sc_xname, bp->b_error, cbp->cb_comp);
987 1.1 hpeyerl }
988 1.6 cgd count = cbp->cb_buf.b_bcount;
989 1.126 ad buf_destroy(&cbp->cb_buf);
990 1.63 thorpej CCD_PUTBUF(cbp);
991 1.1 hpeyerl
992 1.1 hpeyerl /*
993 1.1 hpeyerl * If all done, "interrupt".
994 1.53 thorpej */
995 1.133 ad mutex_enter(cs->sc_iolock);
996 1.53 thorpej bp->b_resid -= count;
997 1.53 thorpej if (bp->b_resid < 0)
998 1.53 thorpej panic("ccdiodone: count");
999 1.133 ad if (bp->b_resid == 0) {
1000 1.133 ad /*
1001 1.133 ad * Request is done for better or worse, wakeup the top half.
1002 1.133 ad */
1003 1.133 ad if (bp->b_error != 0)
1004 1.133 ad bp->b_resid = bp->b_bcount;
1005 1.133 ad disk_unbusy(&cs->sc_dkdev, (bp->b_bcount - bp->b_resid),
1006 1.133 ad (bp->b_flags & B_READ));
1007 1.133 ad if (!disk_isbusy(&cs->sc_dkdev)) {
1008 1.133 ad if (bufq_peek(cs->sc_bufq) != NULL) {
1009 1.133 ad cv_broadcast(&cs->sc_push);
1010 1.133 ad }
1011 1.133 ad cv_broadcast(&cs->sc_stop);
1012 1.133 ad }
1013 1.133 ad mutex_exit(cs->sc_iolock);
1014 1.133 ad biodone(bp);
1015 1.133 ad } else
1016 1.133 ad mutex_exit(cs->sc_iolock);
1017 1.1 hpeyerl }
1018 1.1 hpeyerl
1019 1.11 thorpej /* ARGSUSED */
1020 1.97 thorpej static int
1021 1.116 christos ccdread(dev_t dev, struct uio *uio, int flags)
1022 1.3 hpeyerl {
1023 1.11 thorpej int unit = ccdunit(dev);
1024 1.11 thorpej struct ccd_softc *cs;
1025 1.3 hpeyerl
1026 1.3 hpeyerl #ifdef DEBUG
1027 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
1028 1.131 cegger printf("ccdread(0x%"PRIx64", %p)\n", dev, uio);
1029 1.3 hpeyerl #endif
1030 1.11 thorpej if (unit >= numccd)
1031 1.11 thorpej return (ENXIO);
1032 1.11 thorpej cs = &ccd_softc[unit];
1033 1.11 thorpej
1034 1.133 ad /* Unlocked advisory check, ccdstrategy check is synchronous. */
1035 1.11 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1036 1.11 thorpej return (ENXIO);
1037 1.11 thorpej
1038 1.10 mycroft return (physio(ccdstrategy, NULL, dev, B_READ, minphys, uio));
1039 1.3 hpeyerl }
1040 1.3 hpeyerl
1041 1.11 thorpej /* ARGSUSED */
1042 1.97 thorpej static int
1043 1.116 christos ccdwrite(dev_t dev, struct uio *uio, int flags)
1044 1.3 hpeyerl {
1045 1.11 thorpej int unit = ccdunit(dev);
1046 1.11 thorpej struct ccd_softc *cs;
1047 1.3 hpeyerl
1048 1.3 hpeyerl #ifdef DEBUG
1049 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
1050 1.131 cegger printf("ccdwrite(0x%"PRIx64", %p)\n", dev, uio);
1051 1.3 hpeyerl #endif
1052 1.11 thorpej if (unit >= numccd)
1053 1.11 thorpej return (ENXIO);
1054 1.11 thorpej cs = &ccd_softc[unit];
1055 1.11 thorpej
1056 1.133 ad /* Unlocked advisory check, ccdstrategy check is synchronous. */
1057 1.11 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1058 1.11 thorpej return (ENXIO);
1059 1.11 thorpej
1060 1.10 mycroft return (physio(ccdstrategy, NULL, dev, B_WRITE, minphys, uio));
1061 1.3 hpeyerl }
1062 1.3 hpeyerl
1063 1.97 thorpej static int
1064 1.118 christos ccdioctl(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
1065 1.1 hpeyerl {
1066 1.11 thorpej int unit = ccdunit(dev);
1067 1.133 ad int i, j, lookedup = 0, error = 0;
1068 1.39 mycroft int part, pmask;
1069 1.11 thorpej struct ccd_softc *cs;
1070 1.11 thorpej struct ccd_ioctl *ccio = (struct ccd_ioctl *)data;
1071 1.110 elad kauth_cred_t uc;
1072 1.11 thorpej char **cpp;
1073 1.11 thorpej struct vnode **vpp;
1074 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1075 1.70 fvdl struct disklabel newlabel;
1076 1.70 fvdl #endif
1077 1.11 thorpej
1078 1.11 thorpej if (unit >= numccd)
1079 1.11 thorpej return (ENXIO);
1080 1.11 thorpej cs = &ccd_softc[unit];
1081 1.133 ad uc = kauth_cred_get();
1082 1.109 jld
1083 1.41 thorpej /* Must be open for writes for these commands... */
1084 1.41 thorpej switch (cmd) {
1085 1.41 thorpej case CCDIOCSET:
1086 1.41 thorpej case CCDIOCCLR:
1087 1.41 thorpej case DIOCSDINFO:
1088 1.41 thorpej case DIOCWDINFO:
1089 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1090 1.70 fvdl case ODIOCSDINFO:
1091 1.70 fvdl case ODIOCWDINFO:
1092 1.70 fvdl #endif
1093 1.87 thorpej case DIOCKLABEL:
1094 1.41 thorpej case DIOCWLABEL:
1095 1.41 thorpej if ((flag & FWRITE) == 0)
1096 1.41 thorpej return (EBADF);
1097 1.41 thorpej }
1098 1.41 thorpej
1099 1.133 ad mutex_enter(&cs->sc_dvlock);
1100 1.57 thorpej
1101 1.41 thorpej /* Must be initialized for these... */
1102 1.41 thorpej switch (cmd) {
1103 1.41 thorpej case CCDIOCCLR:
1104 1.42 kleink case DIOCGDINFO:
1105 1.100 thorpej case DIOCCACHESYNC:
1106 1.42 kleink case DIOCSDINFO:
1107 1.42 kleink case DIOCWDINFO:
1108 1.42 kleink case DIOCGPART:
1109 1.41 thorpej case DIOCWLABEL:
1110 1.87 thorpej case DIOCKLABEL:
1111 1.44 thorpej case DIOCGDEFLABEL:
1112 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1113 1.70 fvdl case ODIOCGDINFO:
1114 1.70 fvdl case ODIOCSDINFO:
1115 1.70 fvdl case ODIOCWDINFO:
1116 1.70 fvdl case ODIOCGDEFLABEL:
1117 1.70 fvdl #endif
1118 1.57 thorpej if ((cs->sc_flags & CCDF_INITED) == 0) {
1119 1.57 thorpej error = ENXIO;
1120 1.57 thorpej goto out;
1121 1.57 thorpej }
1122 1.41 thorpej }
1123 1.41 thorpej
1124 1.11 thorpej switch (cmd) {
1125 1.11 thorpej case CCDIOCSET:
1126 1.57 thorpej if (cs->sc_flags & CCDF_INITED) {
1127 1.57 thorpej error = EBUSY;
1128 1.57 thorpej goto out;
1129 1.57 thorpej }
1130 1.54 thorpej
1131 1.54 thorpej /* Validate the flags. */
1132 1.57 thorpej if ((ccio->ccio_flags & CCDF_USERMASK) != ccio->ccio_flags) {
1133 1.57 thorpej error = EINVAL;
1134 1.57 thorpej goto out;
1135 1.57 thorpej }
1136 1.15 thorpej
1137 1.133 ad if (ccio->ccio_ndisks > CCD_MAXNDISKS ||
1138 1.133 ad ccio->ccio_ndisks == 0) {
1139 1.73 jdolecek error = EINVAL;
1140 1.73 jdolecek goto out;
1141 1.73 jdolecek }
1142 1.102 perry
1143 1.11 thorpej /* Fill in some important bits. */
1144 1.57 thorpej cs->sc_ileave = ccio->ccio_ileave;
1145 1.57 thorpej cs->sc_nccdisks = ccio->ccio_ndisks;
1146 1.57 thorpej cs->sc_flags = ccio->ccio_flags & CCDF_USERMASK;
1147 1.11 thorpej
1148 1.11 thorpej /*
1149 1.11 thorpej * Allocate space for and copy in the array of
1150 1.11 thorpej * componet pathnames and device numbers.
1151 1.11 thorpej */
1152 1.133 ad cpp = kmem_alloc(ccio->ccio_ndisks * sizeof(*cpp), KM_SLEEP);
1153 1.133 ad vpp = kmem_alloc(ccio->ccio_ndisks * sizeof(*vpp), KM_SLEEP);
1154 1.84 dsl error = copyin(ccio->ccio_disks, cpp,
1155 1.133 ad ccio->ccio_ndisks * sizeof(*cpp));
1156 1.11 thorpej if (error) {
1157 1.133 ad kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1158 1.133 ad kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1159 1.57 thorpej goto out;
1160 1.11 thorpej }
1161 1.11 thorpej
1162 1.11 thorpej #ifdef DEBUG
1163 1.11 thorpej if (ccddebug & CCDB_INIT)
1164 1.11 thorpej for (i = 0; i < ccio->ccio_ndisks; ++i)
1165 1.104 christos printf("ccdioctl: component %d: %p\n",
1166 1.11 thorpej i, cpp[i]);
1167 1.11 thorpej #endif
1168 1.11 thorpej
1169 1.11 thorpej for (i = 0; i < ccio->ccio_ndisks; ++i) {
1170 1.11 thorpej #ifdef DEBUG
1171 1.11 thorpej if (ccddebug & CCDB_INIT)
1172 1.35 christos printf("ccdioctl: lookedup = %d\n", lookedup);
1173 1.11 thorpej #endif
1174 1.120 cube if ((error = dk_lookup(cpp[i], l, &vpp[i],
1175 1.120 cube UIO_USERSPACE)) != 0) {
1176 1.11 thorpej for (j = 0; j < lookedup; ++j)
1177 1.12 thorpej (void)vn_close(vpp[j], FREAD|FWRITE,
1178 1.128 ad uc);
1179 1.133 ad kmem_free(vpp, ccio->ccio_ndisks *
1180 1.133 ad sizeof(*vpp));
1181 1.133 ad kmem_free(cpp, ccio->ccio_ndisks *
1182 1.133 ad sizeof(*cpp));
1183 1.57 thorpej goto out;
1184 1.11 thorpej }
1185 1.11 thorpej ++lookedup;
1186 1.11 thorpej }
1187 1.11 thorpej
1188 1.133 ad /* Attach the disk. */
1189 1.133 ad disk_attach(&cs->sc_dkdev);
1190 1.133 ad bufq_alloc(&cs->sc_bufq, "fcfs", 0);
1191 1.133 ad
1192 1.11 thorpej /*
1193 1.11 thorpej * Initialize the ccd. Fills in the softc for us.
1194 1.11 thorpej */
1195 1.107 christos if ((error = ccdinit(cs, cpp, vpp, l)) != 0) {
1196 1.11 thorpej for (j = 0; j < lookedup; ++j)
1197 1.18 thorpej (void)vn_close(vpp[j], FREAD|FWRITE,
1198 1.128 ad uc);
1199 1.133 ad kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1200 1.133 ad kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1201 1.133 ad disk_detach(&cs->sc_dkdev);
1202 1.133 ad bufq_free(cs->sc_bufq);
1203 1.57 thorpej goto out;
1204 1.11 thorpej }
1205 1.11 thorpej
1206 1.57 thorpej /* We can free the temporary variables now. */
1207 1.133 ad kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1208 1.133 ad kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1209 1.57 thorpej
1210 1.11 thorpej /*
1211 1.11 thorpej * The ccd has been successfully initialized, so
1212 1.23 thorpej * we can place it into the array. Don't try to
1213 1.23 thorpej * read the disklabel until the disk has been attached,
1214 1.23 thorpej * because space for the disklabel is allocated
1215 1.23 thorpej * in disk_attach();
1216 1.11 thorpej */
1217 1.11 thorpej ccio->ccio_unit = unit;
1218 1.11 thorpej ccio->ccio_size = cs->sc_size;
1219 1.23 thorpej
1220 1.23 thorpej /* Try and read the disklabel. */
1221 1.11 thorpej ccdgetdisklabel(dev);
1222 1.11 thorpej break;
1223 1.11 thorpej
1224 1.11 thorpej case CCDIOCCLR:
1225 1.11 thorpej /*
1226 1.11 thorpej * Don't unconfigure if any other partitions are open
1227 1.11 thorpej * or if both the character and block flavors of this
1228 1.11 thorpej * partition are open.
1229 1.11 thorpej */
1230 1.11 thorpej part = DISKPART(dev);
1231 1.11 thorpej pmask = (1 << part);
1232 1.11 thorpej if ((cs->sc_dkdev.dk_openmask & ~pmask) ||
1233 1.11 thorpej ((cs->sc_dkdev.dk_bopenmask & pmask) &&
1234 1.15 thorpej (cs->sc_dkdev.dk_copenmask & pmask))) {
1235 1.57 thorpej error = EBUSY;
1236 1.57 thorpej goto out;
1237 1.15 thorpej }
1238 1.88 thorpej
1239 1.133 ad /* Stop new I/O, wait for in-flight I/O to complete. */
1240 1.133 ad mutex_enter(cs->sc_iolock);
1241 1.133 ad cs->sc_flags &= ~(CCDF_INITED|CCDF_VLABEL);
1242 1.133 ad cs->sc_zap = true;
1243 1.133 ad while (disk_isbusy(&cs->sc_dkdev) ||
1244 1.133 ad bufq_peek(cs->sc_bufq) != NULL ||
1245 1.133 ad cs->sc_thread != NULL) {
1246 1.133 ad cv_broadcast(&cs->sc_push);
1247 1.133 ad (void)cv_timedwait(&cs->sc_stop, cs->sc_iolock, hz);
1248 1.133 ad }
1249 1.133 ad mutex_exit(cs->sc_iolock);
1250 1.11 thorpej
1251 1.11 thorpej /*
1252 1.11 thorpej * Free ccd_softc information and clear entry.
1253 1.11 thorpej */
1254 1.22 thorpej
1255 1.22 thorpej /* Close the components and free their pathnames. */
1256 1.11 thorpej for (i = 0; i < cs->sc_nccdisks; ++i) {
1257 1.11 thorpej /*
1258 1.11 thorpej * XXX: this close could potentially fail and
1259 1.11 thorpej * cause Bad Things. Maybe we need to force
1260 1.11 thorpej * the close to happen?
1261 1.11 thorpej */
1262 1.11 thorpej #ifdef DEBUG
1263 1.11 thorpej if (ccddebug & CCDB_VNODE)
1264 1.11 thorpej vprint("CCDIOCCLR: vnode info",
1265 1.11 thorpej cs->sc_cinfo[i].ci_vp);
1266 1.11 thorpej #endif
1267 1.11 thorpej (void)vn_close(cs->sc_cinfo[i].ci_vp, FREAD|FWRITE,
1268 1.128 ad uc);
1269 1.133 ad kmem_free(cs->sc_cinfo[i].ci_path,
1270 1.133 ad cs->sc_cinfo[i].ci_pathlen);
1271 1.38 thorpej }
1272 1.38 thorpej
1273 1.22 thorpej /* Free interleave index. */
1274 1.133 ad for (i = 0; cs->sc_itable[i].ii_ndisk; ++i) {
1275 1.133 ad kmem_free(cs->sc_itable[i].ii_index,
1276 1.133 ad cs->sc_itable[i].ii_indexsz);
1277 1.133 ad }
1278 1.22 thorpej
1279 1.22 thorpej /* Free component info and interleave table. */
1280 1.133 ad kmem_free(cs->sc_cinfo, cs->sc_nccdisks *
1281 1.133 ad sizeof(struct ccdcinfo));
1282 1.133 ad kmem_free(cs->sc_itable, (cs->sc_nccdisks + 1) *
1283 1.133 ad sizeof(struct ccdiinfo));
1284 1.15 thorpej
1285 1.23 thorpej /* Detatch the disk. */
1286 1.123 ad disk_detach(&cs->sc_dkdev);
1287 1.133 ad bufq_free(cs->sc_bufq);
1288 1.11 thorpej break;
1289 1.11 thorpej
1290 1.11 thorpej case DIOCGDINFO:
1291 1.23 thorpej *(struct disklabel *)data = *(cs->sc_dkdev.dk_label);
1292 1.11 thorpej break;
1293 1.133 ad
1294 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1295 1.70 fvdl case ODIOCGDINFO:
1296 1.70 fvdl newlabel = *(cs->sc_dkdev.dk_label);
1297 1.70 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
1298 1.71 fvdl return ENOTTY;
1299 1.70 fvdl memcpy(data, &newlabel, sizeof (struct olddisklabel));
1300 1.70 fvdl break;
1301 1.70 fvdl #endif
1302 1.11 thorpej
1303 1.11 thorpej case DIOCGPART:
1304 1.23 thorpej ((struct partinfo *)data)->disklab = cs->sc_dkdev.dk_label;
1305 1.11 thorpej ((struct partinfo *)data)->part =
1306 1.23 thorpej &cs->sc_dkdev.dk_label->d_partitions[DISKPART(dev)];
1307 1.11 thorpej break;
1308 1.11 thorpej
1309 1.100 thorpej case DIOCCACHESYNC:
1310 1.100 thorpej /*
1311 1.100 thorpej * XXX Do we really need to care about having a writable
1312 1.100 thorpej * file descriptor here?
1313 1.100 thorpej */
1314 1.100 thorpej if ((flag & FWRITE) == 0)
1315 1.100 thorpej return (EBADF);
1316 1.100 thorpej
1317 1.100 thorpej /*
1318 1.100 thorpej * We pass this call down to all components and report
1319 1.100 thorpej * the first error we encounter.
1320 1.100 thorpej */
1321 1.100 thorpej for (error = 0, i = 0; i < cs->sc_nccdisks; i++) {
1322 1.100 thorpej j = VOP_IOCTL(cs->sc_cinfo[i].ci_vp, cmd, data,
1323 1.124 pooka flag, uc);
1324 1.100 thorpej if (j != 0 && error == 0)
1325 1.100 thorpej error = j;
1326 1.100 thorpej }
1327 1.100 thorpej break;
1328 1.100 thorpej
1329 1.11 thorpej case DIOCWDINFO:
1330 1.11 thorpej case DIOCSDINFO:
1331 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1332 1.70 fvdl case ODIOCWDINFO:
1333 1.70 fvdl case ODIOCSDINFO:
1334 1.70 fvdl #endif
1335 1.70 fvdl {
1336 1.70 fvdl struct disklabel *lp;
1337 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1338 1.70 fvdl if (cmd == ODIOCSDINFO || cmd == ODIOCWDINFO) {
1339 1.70 fvdl memset(&newlabel, 0, sizeof newlabel);
1340 1.70 fvdl memcpy(&newlabel, data, sizeof (struct olddisklabel));
1341 1.70 fvdl lp = &newlabel;
1342 1.70 fvdl } else
1343 1.70 fvdl #endif
1344 1.70 fvdl lp = (struct disklabel *)data;
1345 1.70 fvdl
1346 1.11 thorpej cs->sc_flags |= CCDF_LABELLING;
1347 1.11 thorpej
1348 1.23 thorpej error = setdisklabel(cs->sc_dkdev.dk_label,
1349 1.70 fvdl lp, 0, cs->sc_dkdev.dk_cpulabel);
1350 1.11 thorpej if (error == 0) {
1351 1.70 fvdl if (cmd == DIOCWDINFO
1352 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1353 1.70 fvdl || cmd == ODIOCWDINFO
1354 1.70 fvdl #endif
1355 1.70 fvdl )
1356 1.11 thorpej error = writedisklabel(CCDLABELDEV(dev),
1357 1.23 thorpej ccdstrategy, cs->sc_dkdev.dk_label,
1358 1.23 thorpej cs->sc_dkdev.dk_cpulabel);
1359 1.11 thorpej }
1360 1.11 thorpej
1361 1.11 thorpej cs->sc_flags &= ~CCDF_LABELLING;
1362 1.11 thorpej break;
1363 1.70 fvdl }
1364 1.11 thorpej
1365 1.87 thorpej case DIOCKLABEL:
1366 1.87 thorpej if (*(int *)data != 0)
1367 1.87 thorpej cs->sc_flags |= CCDF_KLABEL;
1368 1.87 thorpej else
1369 1.87 thorpej cs->sc_flags &= ~CCDF_KLABEL;
1370 1.87 thorpej break;
1371 1.87 thorpej
1372 1.11 thorpej case DIOCWLABEL:
1373 1.11 thorpej if (*(int *)data != 0)
1374 1.11 thorpej cs->sc_flags |= CCDF_WLABEL;
1375 1.11 thorpej else
1376 1.11 thorpej cs->sc_flags &= ~CCDF_WLABEL;
1377 1.11 thorpej break;
1378 1.11 thorpej
1379 1.44 thorpej case DIOCGDEFLABEL:
1380 1.44 thorpej ccdgetdefaultlabel(cs, (struct disklabel *)data);
1381 1.44 thorpej break;
1382 1.70 fvdl
1383 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1384 1.70 fvdl case ODIOCGDEFLABEL:
1385 1.70 fvdl ccdgetdefaultlabel(cs, &newlabel);
1386 1.70 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
1387 1.71 fvdl return ENOTTY;
1388 1.70 fvdl memcpy(data, &newlabel, sizeof (struct olddisklabel));
1389 1.70 fvdl break;
1390 1.70 fvdl #endif
1391 1.44 thorpej
1392 1.11 thorpej default:
1393 1.57 thorpej error = ENOTTY;
1394 1.11 thorpej }
1395 1.11 thorpej
1396 1.57 thorpej out:
1397 1.133 ad mutex_exit(&cs->sc_dvlock);
1398 1.57 thorpej return (error);
1399 1.1 hpeyerl }
1400 1.1 hpeyerl
1401 1.97 thorpej static int
1402 1.97 thorpej ccdsize(dev_t dev)
1403 1.1 hpeyerl {
1404 1.11 thorpej struct ccd_softc *cs;
1405 1.40 thorpej struct disklabel *lp;
1406 1.40 thorpej int part, unit, omask, size;
1407 1.40 thorpej
1408 1.40 thorpej unit = ccdunit(dev);
1409 1.40 thorpej if (unit >= numccd)
1410 1.40 thorpej return (-1);
1411 1.40 thorpej cs = &ccd_softc[unit];
1412 1.11 thorpej
1413 1.40 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1414 1.11 thorpej return (-1);
1415 1.11 thorpej
1416 1.11 thorpej part = DISKPART(dev);
1417 1.40 thorpej omask = cs->sc_dkdev.dk_openmask & (1 << part);
1418 1.40 thorpej lp = cs->sc_dkdev.dk_label;
1419 1.11 thorpej
1420 1.107 christos if (omask == 0 && ccdopen(dev, 0, S_IFBLK, curlwp))
1421 1.11 thorpej return (-1);
1422 1.11 thorpej
1423 1.40 thorpej if (lp->d_partitions[part].p_fstype != FS_SWAP)
1424 1.11 thorpej size = -1;
1425 1.11 thorpej else
1426 1.40 thorpej size = lp->d_partitions[part].p_size *
1427 1.40 thorpej (lp->d_secsize / DEV_BSIZE);
1428 1.11 thorpej
1429 1.107 christos if (omask == 0 && ccdclose(dev, 0, S_IFBLK, curlwp))
1430 1.11 thorpej return (-1);
1431 1.1 hpeyerl
1432 1.11 thorpej return (size);
1433 1.1 hpeyerl }
1434 1.1 hpeyerl
1435 1.11 thorpej static void
1436 1.97 thorpej ccdgetdefaultlabel(struct ccd_softc *cs, struct disklabel *lp)
1437 1.11 thorpej {
1438 1.11 thorpej struct ccdgeom *ccg = &cs->sc_geom;
1439 1.11 thorpej
1440 1.72 thorpej memset(lp, 0, sizeof(*lp));
1441 1.11 thorpej
1442 1.11 thorpej lp->d_secperunit = cs->sc_size;
1443 1.11 thorpej lp->d_secsize = ccg->ccg_secsize;
1444 1.11 thorpej lp->d_nsectors = ccg->ccg_nsectors;
1445 1.11 thorpej lp->d_ntracks = ccg->ccg_ntracks;
1446 1.11 thorpej lp->d_ncylinders = ccg->ccg_ncylinders;
1447 1.19 thorpej lp->d_secpercyl = lp->d_ntracks * lp->d_nsectors;
1448 1.11 thorpej
1449 1.11 thorpej strncpy(lp->d_typename, "ccd", sizeof(lp->d_typename));
1450 1.11 thorpej lp->d_type = DTYPE_CCD;
1451 1.11 thorpej strncpy(lp->d_packname, "fictitious", sizeof(lp->d_packname));
1452 1.11 thorpej lp->d_rpm = 3600;
1453 1.11 thorpej lp->d_interleave = 1;
1454 1.11 thorpej lp->d_flags = 0;
1455 1.11 thorpej
1456 1.11 thorpej lp->d_partitions[RAW_PART].p_offset = 0;
1457 1.11 thorpej lp->d_partitions[RAW_PART].p_size = cs->sc_size;
1458 1.11 thorpej lp->d_partitions[RAW_PART].p_fstype = FS_UNUSED;
1459 1.11 thorpej lp->d_npartitions = RAW_PART + 1;
1460 1.11 thorpej
1461 1.11 thorpej lp->d_magic = DISKMAGIC;
1462 1.11 thorpej lp->d_magic2 = DISKMAGIC;
1463 1.23 thorpej lp->d_checksum = dkcksum(cs->sc_dkdev.dk_label);
1464 1.44 thorpej }
1465 1.44 thorpej
1466 1.44 thorpej /*
1467 1.44 thorpej * Read the disklabel from the ccd. If one is not present, fake one
1468 1.44 thorpej * up.
1469 1.44 thorpej */
1470 1.44 thorpej static void
1471 1.97 thorpej ccdgetdisklabel(dev_t dev)
1472 1.44 thorpej {
1473 1.44 thorpej int unit = ccdunit(dev);
1474 1.44 thorpej struct ccd_softc *cs = &ccd_softc[unit];
1475 1.85 dsl const char *errstring;
1476 1.44 thorpej struct disklabel *lp = cs->sc_dkdev.dk_label;
1477 1.44 thorpej struct cpu_disklabel *clp = cs->sc_dkdev.dk_cpulabel;
1478 1.44 thorpej
1479 1.133 ad KASSERT(mutex_owned(&cs->sc_dvlock));
1480 1.133 ad
1481 1.72 thorpej memset(clp, 0, sizeof(*clp));
1482 1.44 thorpej
1483 1.44 thorpej ccdgetdefaultlabel(cs, lp);
1484 1.11 thorpej
1485 1.11 thorpej /*
1486 1.11 thorpej * Call the generic disklabel extraction routine.
1487 1.11 thorpej */
1488 1.133 ad cs->sc_flags |= CCDF_RLABEL;
1489 1.92 lukem if ((cs->sc_flags & CCDF_NOLABEL) != 0)
1490 1.92 lukem errstring = "CCDF_NOLABEL set; ignoring on-disk label";
1491 1.92 lukem else
1492 1.92 lukem errstring = readdisklabel(CCDLABELDEV(dev), ccdstrategy,
1493 1.92 lukem cs->sc_dkdev.dk_label, cs->sc_dkdev.dk_cpulabel);
1494 1.29 christos if (errstring)
1495 1.11 thorpej ccdmakedisklabel(cs);
1496 1.47 enami else {
1497 1.47 enami int i;
1498 1.47 enami struct partition *pp;
1499 1.47 enami
1500 1.47 enami /*
1501 1.47 enami * Sanity check whether the found disklabel is valid.
1502 1.47 enami *
1503 1.47 enami * This is necessary since total size of ccd may vary
1504 1.47 enami * when an interleave is changed even though exactly
1505 1.47 enami * same componets are used, and old disklabel may used
1506 1.47 enami * if that is found.
1507 1.47 enami */
1508 1.47 enami if (lp->d_secperunit != cs->sc_size)
1509 1.47 enami printf("WARNING: %s: "
1510 1.47 enami "total sector size in disklabel (%d) != "
1511 1.60 thorpej "the size of ccd (%lu)\n", cs->sc_xname,
1512 1.60 thorpej lp->d_secperunit, (u_long)cs->sc_size);
1513 1.47 enami for (i = 0; i < lp->d_npartitions; i++) {
1514 1.47 enami pp = &lp->d_partitions[i];
1515 1.47 enami if (pp->p_offset + pp->p_size > cs->sc_size)
1516 1.48 enami printf("WARNING: %s: end of partition `%c' "
1517 1.60 thorpej "exceeds the size of ccd (%lu)\n",
1518 1.60 thorpej cs->sc_xname, 'a' + i, (u_long)cs->sc_size);
1519 1.47 enami }
1520 1.47 enami }
1521 1.11 thorpej
1522 1.11 thorpej #ifdef DEBUG
1523 1.11 thorpej /* It's actually extremely common to have unlabeled ccds. */
1524 1.11 thorpej if (ccddebug & CCDB_LABEL)
1525 1.11 thorpej if (errstring != NULL)
1526 1.35 christos printf("%s: %s\n", cs->sc_xname, errstring);
1527 1.11 thorpej #endif
1528 1.87 thorpej
1529 1.87 thorpej /* In-core label now valid. */
1530 1.133 ad cs->sc_flags = (cs->sc_flags | CCDF_VLABEL) & ~CCDF_RLABEL;
1531 1.11 thorpej }
1532 1.11 thorpej
1533 1.11 thorpej /*
1534 1.11 thorpej * Take care of things one might want to take care of in the event
1535 1.11 thorpej * that a disklabel isn't present.
1536 1.11 thorpej */
1537 1.11 thorpej static void
1538 1.97 thorpej ccdmakedisklabel(struct ccd_softc *cs)
1539 1.11 thorpej {
1540 1.23 thorpej struct disklabel *lp = cs->sc_dkdev.dk_label;
1541 1.11 thorpej
1542 1.11 thorpej /*
1543 1.11 thorpej * For historical reasons, if there's no disklabel present
1544 1.11 thorpej * the raw partition must be marked FS_BSDFFS.
1545 1.11 thorpej */
1546 1.11 thorpej lp->d_partitions[RAW_PART].p_fstype = FS_BSDFFS;
1547 1.11 thorpej
1548 1.11 thorpej strncpy(lp->d_packname, "default label", sizeof(lp->d_packname));
1549 1.44 thorpej
1550 1.44 thorpej lp->d_checksum = dkcksum(lp);
1551 1.11 thorpej }
1552 1.11 thorpej
#ifdef DEBUG
/*
 * Debug helper: print every entry of an interleave table, stopping at
 * the terminating entry whose ii_ndisk is zero.
 */
static void
printiinfo(struct ccdiinfo *ii)
{
	int entry, disk;

	entry = 0;
	while (ii->ii_ndisk) {
		printf(" itab[%d]: #dk %d sblk %" PRId64 " soff %" PRId64,
		    entry, ii->ii_ndisk, ii->ii_startblk, ii->ii_startoff);
		/* Component indices that make up this entry. */
		for (disk = 0; disk < ii->ii_ndisk; disk++)
			printf(" %d", ii->ii_index[disk]);
		printf("\n");

		entry++;
		ii++;
	}
}
#endif
1568 1.134 haad

#ifdef _MODULE

#include <sys/module.h>

MODULE(MODULE_CLASS_DRIVER, ccd, NULL);

/*
 * Module control entry point.
 *
 * INIT calls ccdattach(4) and registers the block/character device
 * switches; FINI unregisters them.  Every other command, including
 * STAT, yields ENOTTY.
 */
static int
ccd_modcmd(modcmd_t cmd, void *arg)
{
	int bmajor = -1, cmajor = -1;
	int error;

	switch (cmd) {
	case MODULE_CMD_INIT:
		ccdattach(4);
		error = devsw_attach("ccd", &ccd_bdevsw, &bmajor,
		    &ccd_cdevsw, &cmajor);
		break;

	case MODULE_CMD_FINI:
		error = devsw_detach(&ccd_bdevsw, &ccd_cdevsw);
		break;

	case MODULE_CMD_STAT:
	default:
		error = ENOTTY;
		break;
	}

	return error;
}

#endif
1603