ccd.c revision 1.129.10.2 1 1.129.10.2 msaitoh /* $NetBSD: ccd.c,v 1.129.10.2 2014/08/27 05:47:43 msaitoh Exp $ */
2 1.11 thorpej
3 1.28 thorpej /*-
4 1.129.10.1 snj * Copyright (c) 1996, 1997, 1998, 1999, 2007, 2009 The NetBSD Foundation, Inc.
5 1.11 thorpej * All rights reserved.
6 1.11 thorpej *
7 1.28 thorpej * This code is derived from software contributed to The NetBSD Foundation
8 1.129.10.1 snj * by Jason R. Thorpe, and by Andrew Doran.
9 1.28 thorpej *
10 1.11 thorpej * Redistribution and use in source and binary forms, with or without
11 1.11 thorpej * modification, are permitted provided that the following conditions
12 1.11 thorpej * are met:
13 1.11 thorpej * 1. Redistributions of source code must retain the above copyright
14 1.11 thorpej * notice, this list of conditions and the following disclaimer.
15 1.11 thorpej * 2. Redistributions in binary form must reproduce the above copyright
16 1.11 thorpej * notice, this list of conditions and the following disclaimer in the
17 1.11 thorpej * documentation and/or other materials provided with the distribution.
18 1.11 thorpej *
19 1.28 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.28 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.28 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.45 jtc * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.45 jtc * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.28 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.28 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.28 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.28 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.28 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.28 thorpej * POSSIBILITY OF SUCH DAMAGE.
30 1.11 thorpej */
31 1.2 cgd
32 1.1 hpeyerl /*
33 1.3 hpeyerl * Copyright (c) 1990, 1993
34 1.3 hpeyerl * The Regents of the University of California. All rights reserved.
35 1.1 hpeyerl *
36 1.1 hpeyerl * This code is derived from software contributed to Berkeley by
37 1.1 hpeyerl * the Systems Programming Group of the University of Utah Computer
38 1.1 hpeyerl * Science Department.
39 1.1 hpeyerl *
40 1.1 hpeyerl * Redistribution and use in source and binary forms, with or without
41 1.1 hpeyerl * modification, are permitted provided that the following conditions
42 1.1 hpeyerl * are met:
43 1.1 hpeyerl * 1. Redistributions of source code must retain the above copyright
44 1.1 hpeyerl * notice, this list of conditions and the following disclaimer.
45 1.1 hpeyerl * 2. Redistributions in binary form must reproduce the above copyright
46 1.1 hpeyerl * notice, this list of conditions and the following disclaimer in the
47 1.1 hpeyerl * documentation and/or other materials provided with the distribution.
48 1.91 agc * 3. Neither the name of the University nor the names of its contributors
49 1.91 agc * may be used to endorse or promote products derived from this software
50 1.91 agc * without specific prior written permission.
51 1.91 agc *
52 1.91 agc * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 1.91 agc * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 1.91 agc * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 1.91 agc * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 1.91 agc * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 1.91 agc * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 1.91 agc * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 1.91 agc * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 1.91 agc * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 1.91 agc * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 1.91 agc * SUCH DAMAGE.
63 1.91 agc *
64 1.91 agc * from: Utah $Hdr: cd.c 1.6 90/11/28$
65 1.91 agc *
66 1.91 agc * @(#)cd.c 8.2 (Berkeley) 11/16/93
67 1.91 agc */
68 1.91 agc
69 1.91 agc /*
70 1.91 agc * Copyright (c) 1988 University of Utah.
71 1.91 agc *
72 1.91 agc * This code is derived from software contributed to Berkeley by
73 1.91 agc * the Systems Programming Group of the University of Utah Computer
74 1.91 agc * Science Department.
75 1.91 agc *
76 1.91 agc * Redistribution and use in source and binary forms, with or without
77 1.91 agc * modification, are permitted provided that the following conditions
78 1.91 agc * are met:
79 1.91 agc * 1. Redistributions of source code must retain the above copyright
80 1.91 agc * notice, this list of conditions and the following disclaimer.
81 1.91 agc * 2. Redistributions in binary form must reproduce the above copyright
82 1.91 agc * notice, this list of conditions and the following disclaimer in the
83 1.91 agc * documentation and/or other materials provided with the distribution.
84 1.1 hpeyerl * 3. All advertising materials mentioning features or use of this software
85 1.1 hpeyerl * must display the following acknowledgement:
86 1.1 hpeyerl * This product includes software developed by the University of
87 1.1 hpeyerl * California, Berkeley and its contributors.
88 1.1 hpeyerl * 4. Neither the name of the University nor the names of its contributors
89 1.1 hpeyerl * may be used to endorse or promote products derived from this software
90 1.1 hpeyerl * without specific prior written permission.
91 1.1 hpeyerl *
92 1.1 hpeyerl * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
93 1.1 hpeyerl * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
94 1.1 hpeyerl * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
95 1.1 hpeyerl * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
96 1.1 hpeyerl * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
97 1.1 hpeyerl * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
98 1.1 hpeyerl * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
99 1.1 hpeyerl * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
100 1.1 hpeyerl * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
101 1.1 hpeyerl * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
102 1.1 hpeyerl * SUCH DAMAGE.
103 1.1 hpeyerl *
104 1.2 cgd * from: Utah $Hdr: cd.c 1.6 90/11/28$
105 1.2 cgd *
106 1.3 hpeyerl * @(#)cd.c 8.2 (Berkeley) 11/16/93
107 1.1 hpeyerl */
108 1.1 hpeyerl
109 1.1 hpeyerl /*
110 1.1 hpeyerl * "Concatenated" disk driver.
111 1.11 thorpej *
112 1.129.10.1 snj * Notes on concurrency:
113 1.129.10.1 snj *
114 1.129.10.1 snj * => sc_dvlock serializes access to the device nodes, excluding block I/O.
115 1.129.10.1 snj *
116 1.129.10.1 snj * => sc_iolock serializes access to (sc_flags & CCDF_INITED), disk stats,
117 1.129.10.1 snj * sc_stop, sc_bufq and b_resid from master buffers.
118 1.129.10.1 snj *
119 1.129.10.1 snj * => a combination of CCDF_INITED, sc_inflight, and sc_iolock is used to
120 1.129.10.1 snj * serialize I/O and configuration changes.
121 1.129.10.1 snj *
122 1.129.10.1 snj * => the in-core disk label does not change while the device is open.
123 1.129.10.1 snj *
124 1.129.10.1 snj * On memory consumption: ccd fans out I/O requests and so needs to
125 1.129.10.1 snj * allocate memory. If the system is desperately low on memory, we
126 1.129.10.1 snj * single thread I/O.
127 1.1 hpeyerl */
128 1.74 lukem
129 1.74 lukem #include <sys/cdefs.h>
130 1.129.10.2 msaitoh __KERNEL_RCSID(0, "$NetBSD: ccd.c,v 1.129.10.2 2014/08/27 05:47:43 msaitoh Exp $");
131 1.129.10.2 msaitoh
132 1.129.10.2 msaitoh #if defined(_KERNEL_OPT)
133 1.129.10.2 msaitoh #include "opt_compat_netbsd.h"
134 1.129.10.2 msaitoh #endif
135 1.1 hpeyerl
136 1.1 hpeyerl #include <sys/param.h>
137 1.1 hpeyerl #include <sys/systm.h>
138 1.129.10.1 snj #include <sys/kernel.h>
139 1.3 hpeyerl #include <sys/proc.h>
140 1.1 hpeyerl #include <sys/errno.h>
141 1.1 hpeyerl #include <sys/buf.h>
142 1.129.10.1 snj #include <sys/kmem.h>
143 1.63 thorpej #include <sys/pool.h>
144 1.11 thorpej #include <sys/namei.h>
145 1.3 hpeyerl #include <sys/stat.h>
146 1.3 hpeyerl #include <sys/ioctl.h>
147 1.3 hpeyerl #include <sys/disklabel.h>
148 1.11 thorpej #include <sys/device.h>
149 1.11 thorpej #include <sys/disk.h>
150 1.11 thorpej #include <sys/syslog.h>
151 1.3 hpeyerl #include <sys/fcntl.h>
152 1.11 thorpej #include <sys/vnode.h>
153 1.31 christos #include <sys/conf.h>
154 1.117 ad #include <sys/mutex.h>
155 1.56 thorpej #include <sys/queue.h>
156 1.110 elad #include <sys/kauth.h>
157 1.129.10.1 snj #include <sys/kthread.h>
158 1.129.10.1 snj #include <sys/bufq.h>
159 1.1 hpeyerl
160 1.1 hpeyerl #include <dev/ccdvar.h>
161 1.113 christos #include <dev/dkvar.h>
162 1.1 hpeyerl
/* Building with CCDDEBUG turns on the generic DEBUG code paths as well. */
#if defined(CCDDEBUG) && !defined(DEBUG)
#define DEBUG
#endif

#if defined(DEBUG)
/*
 * Bits tested against ccddebug to select which diagnostic messages
 * are printed.  All of them are off by default.
 */
#define CCDB_FOLLOW	0x01
#define CCDB_INIT	0x02
#define CCDB_IO		0x04
#define CCDB_LABEL	0x08
#define CCDB_VNODE	0x10
int ccddebug = 0x00;
#endif /* DEBUG */

/* Map a dev_t onto the ccd unit number it refers to. */
#define	ccdunit(x)	DISKUNIT(x)
177 1.6 cgd
178 1.6 cgd struct ccdbuf {
179 1.6 cgd struct buf cb_buf; /* new I/O buf */
180 1.6 cgd struct buf *cb_obp; /* ptr. to original I/O buf */
181 1.59 thorpej struct ccd_softc *cb_sc; /* pointer to ccd softc */
182 1.6 cgd int cb_comp; /* target component */
183 1.56 thorpej SIMPLEQ_ENTRY(ccdbuf) cb_q; /* fifo of component buffers */
184 1.38 thorpej };
185 1.24 thorpej
186 1.63 thorpej /* component buffer pool */
187 1.129.10.1 snj static pool_cache_t ccd_cache;
188 1.63 thorpej
189 1.129.10.1 snj #define CCD_GETBUF() pool_cache_get(ccd_cache, PR_WAITOK)
190 1.129.10.1 snj #define CCD_PUTBUF(cbp) pool_cache_put(ccd_cache, cbp)
191 1.1 hpeyerl
192 1.11 thorpej #define CCDLABELDEV(dev) \
193 1.11 thorpej (MAKEDISKDEV(major((dev)), ccdunit((dev)), RAW_PART))
194 1.1 hpeyerl
195 1.11 thorpej /* called by main() at boot time */
196 1.97 thorpej void ccdattach(int);
197 1.11 thorpej
198 1.11 thorpej /* called by biodone() at interrupt time */
199 1.97 thorpej static void ccdiodone(struct buf *);
200 1.11 thorpej
201 1.97 thorpej static void ccdinterleave(struct ccd_softc *);
202 1.97 thorpej static int ccdinit(struct ccd_softc *, char **, struct vnode **,
203 1.107 christos struct lwp *);
204 1.97 thorpej static struct ccdbuf *ccdbuffer(struct ccd_softc *, struct buf *,
205 1.118 christos daddr_t, void *, long);
206 1.97 thorpej static void ccdgetdefaultlabel(struct ccd_softc *, struct disklabel *);
207 1.97 thorpej static void ccdgetdisklabel(dev_t);
208 1.97 thorpej static void ccdmakedisklabel(struct ccd_softc *);
209 1.129.10.1 snj static void ccdstart(struct ccd_softc *);
210 1.129.10.1 snj static void ccdthread(void *);
211 1.97 thorpej
212 1.97 thorpej static dev_type_open(ccdopen);
213 1.97 thorpej static dev_type_close(ccdclose);
214 1.97 thorpej static dev_type_read(ccdread);
215 1.97 thorpej static dev_type_write(ccdwrite);
216 1.97 thorpej static dev_type_ioctl(ccdioctl);
217 1.97 thorpej static dev_type_strategy(ccdstrategy);
218 1.97 thorpej static dev_type_size(ccdsize);
219 1.78 gehenna
220 1.78 gehenna const struct bdevsw ccd_bdevsw = {
221 1.129.10.1 snj .d_open = ccdopen,
222 1.129.10.1 snj .d_close = ccdclose,
223 1.129.10.1 snj .d_strategy = ccdstrategy,
224 1.129.10.1 snj .d_ioctl = ccdioctl,
225 1.129.10.1 snj .d_dump = nodump,
226 1.129.10.1 snj .d_psize = ccdsize,
227 1.129.10.1 snj .d_flag = D_DISK | D_MPSAFE
228 1.78 gehenna };
229 1.78 gehenna
230 1.78 gehenna const struct cdevsw ccd_cdevsw = {
231 1.129.10.1 snj .d_open = ccdopen,
232 1.129.10.1 snj .d_close = ccdclose,
233 1.129.10.1 snj .d_read = ccdread,
234 1.129.10.1 snj .d_write = ccdwrite,
235 1.129.10.1 snj .d_ioctl = ccdioctl,
236 1.129.10.1 snj .d_stop = nostop,
237 1.129.10.1 snj .d_tty = notty,
238 1.129.10.1 snj .d_poll = nopoll,
239 1.129.10.1 snj .d_mmap = nommap,
240 1.129.10.1 snj .d_kqfilter = nokqfilter,
241 1.129.10.1 snj .d_flag = D_DISK | D_MPSAFE
242 1.78 gehenna };
243 1.3 hpeyerl
244 1.11 thorpej #ifdef DEBUG
245 1.97 thorpej static void printiinfo(struct ccdiinfo *);
246 1.11 thorpej #endif
247 1.11 thorpej
248 1.108 lukem /* Publically visible for the benefit of libkvm and ccdconfig(8). */
249 1.108 lukem struct ccd_softc *ccd_softc;
250 1.108 lukem const int ccd_softc_elemsize = sizeof(struct ccd_softc);
251 1.108 lukem int numccd = 0;
252 1.1 hpeyerl
253 1.3 hpeyerl /*
254 1.11 thorpej * Called by main() during pseudo-device attachment. All we need
255 1.11 thorpej * to do is allocate enough space for devices to be configured later.
256 1.1 hpeyerl */
257 1.1 hpeyerl void
258 1.97 thorpej ccdattach(int num)
259 1.3 hpeyerl {
260 1.57 thorpej struct ccd_softc *cs;
261 1.57 thorpej int i;
262 1.57 thorpej
263 1.11 thorpej if (num <= 0) {
264 1.11 thorpej #ifdef DIAGNOSTIC
265 1.11 thorpej panic("ccdattach: count <= 0");
266 1.11 thorpej #endif
267 1.3 hpeyerl return;
268 1.11 thorpej }
269 1.11 thorpej
270 1.129.10.1 snj ccd_softc = kmem_zalloc(num * ccd_softc_elemsize, KM_SLEEP);
271 1.57 thorpej if (ccd_softc == NULL) {
272 1.35 christos printf("WARNING: no memory for concatenated disks\n");
273 1.3 hpeyerl return;
274 1.3 hpeyerl }
275 1.3 hpeyerl numccd = num;
276 1.57 thorpej
277 1.63 thorpej /* Initialize the component buffer pool. */
278 1.129.10.1 snj ccd_cache = pool_cache_init(sizeof(struct ccdbuf), 0,
279 1.129.10.1 snj 0, 0, "ccdbuf", NULL, IPL_BIO, NULL, NULL, NULL);
280 1.63 thorpej
281 1.57 thorpej /* Initialize per-softc structures. */
282 1.57 thorpej for (i = 0; i < num; i++) {
283 1.57 thorpej cs = &ccd_softc[i];
284 1.96 itojun snprintf(cs->sc_xname, sizeof(cs->sc_xname), "ccd%d", i);
285 1.129.10.1 snj mutex_init(&cs->sc_dvlock, MUTEX_DEFAULT, IPL_NONE);
286 1.129.10.1 snj cs->sc_iolock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NONE);
287 1.129.10.1 snj cv_init(&cs->sc_stop, "ccdstop");
288 1.129.10.1 snj cv_init(&cs->sc_push, "ccdthr");
289 1.123 ad disk_init(&cs->sc_dkdev, cs->sc_xname, NULL); /* XXX */
290 1.57 thorpej }
291 1.1 hpeyerl }
292 1.1 hpeyerl
293 1.11 thorpej static int
294 1.97 thorpej ccdinit(struct ccd_softc *cs, char **cpaths, struct vnode **vpp,
295 1.107 christos struct lwp *l)
296 1.1 hpeyerl {
297 1.68 augustss struct ccdcinfo *ci = NULL;
298 1.68 augustss size_t size;
299 1.68 augustss int ix;
300 1.11 thorpej struct vattr va;
301 1.1 hpeyerl size_t minsize;
302 1.11 thorpej int maxsecsize;
303 1.7 cgd struct partinfo dpart;
304 1.11 thorpej struct ccdgeom *ccg = &cs->sc_geom;
305 1.111 christos char *tmppath;
306 1.67 enami int error, path_alloced;
307 1.1 hpeyerl
308 1.1 hpeyerl #ifdef DEBUG
309 1.3 hpeyerl if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
310 1.59 thorpej printf("%s: ccdinit\n", cs->sc_xname);
311 1.1 hpeyerl #endif
312 1.11 thorpej
313 1.11 thorpej /* Allocate space for the component info. */
314 1.129.10.1 snj cs->sc_cinfo = kmem_alloc(cs->sc_nccdisks * sizeof(*cs->sc_cinfo),
315 1.129.10.1 snj KM_SLEEP);
316 1.129.10.1 snj tmppath = kmem_alloc(MAXPATHLEN, KM_SLEEP);
317 1.111 christos
318 1.57 thorpej cs->sc_size = 0;
319 1.57 thorpej
320 1.1 hpeyerl /*
321 1.1 hpeyerl * Verify that each component piece exists and record
322 1.1 hpeyerl * relevant information about it.
323 1.1 hpeyerl */
324 1.11 thorpej maxsecsize = 0;
325 1.1 hpeyerl minsize = 0;
326 1.67 enami for (ix = 0, path_alloced = 0; ix < cs->sc_nccdisks; ix++) {
327 1.1 hpeyerl ci = &cs->sc_cinfo[ix];
328 1.57 thorpej ci->ci_vp = vpp[ix];
329 1.11 thorpej
330 1.11 thorpej /*
331 1.11 thorpej * Copy in the pathname of the component.
332 1.11 thorpej */
333 1.72 thorpej memset(tmppath, 0, sizeof(tmppath)); /* sanity */
334 1.29 christos error = copyinstr(cpaths[ix], tmppath,
335 1.29 christos MAXPATHLEN, &ci->ci_pathlen);
336 1.129.10.1 snj if (ci->ci_pathlen == 0)
337 1.129.10.1 snj error = EINVAL;
338 1.29 christos if (error) {
339 1.11 thorpej #ifdef DEBUG
340 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
341 1.35 christos printf("%s: can't copy path, error = %d\n",
342 1.23 thorpej cs->sc_xname, error);
343 1.11 thorpej #endif
344 1.67 enami goto out;
345 1.11 thorpej }
346 1.129.10.1 snj ci->ci_path = kmem_alloc(ci->ci_pathlen, KM_SLEEP);
347 1.72 thorpej memcpy(ci->ci_path, tmppath, ci->ci_pathlen);
348 1.67 enami path_alloced++;
349 1.11 thorpej
350 1.11 thorpej /*
351 1.11 thorpej * XXX: Cache the component's dev_t.
352 1.11 thorpej */
353 1.124 pooka if ((error = VOP_GETATTR(vpp[ix], &va, l->l_cred)) != 0) {
354 1.11 thorpej #ifdef DEBUG
355 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
356 1.35 christos printf("%s: %s: getattr failed %s = %d\n",
357 1.23 thorpej cs->sc_xname, ci->ci_path,
358 1.11 thorpej "error", error);
359 1.11 thorpej #endif
360 1.67 enami goto out;
361 1.11 thorpej }
362 1.11 thorpej ci->ci_dev = va.va_rdev;
363 1.11 thorpej
364 1.3 hpeyerl /*
365 1.11 thorpej * Get partition information for the component.
366 1.3 hpeyerl */
367 1.84 dsl error = VOP_IOCTL(vpp[ix], DIOCGPART, &dpart,
368 1.124 pooka FREAD, l->l_cred);
369 1.29 christos if (error) {
370 1.11 thorpej #ifdef DEBUG
371 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
372 1.35 christos printf("%s: %s: ioctl failed, error = %d\n",
373 1.23 thorpej cs->sc_xname, ci->ci_path, error);
374 1.11 thorpej #endif
375 1.67 enami goto out;
376 1.11 thorpej }
377 1.69 enami
378 1.69 enami /*
379 1.69 enami * This diagnostic test is disabled (for now?) since not all port supports
380 1.69 enami * on-disk BSD disklabel.
381 1.69 enami */
382 1.69 enami #if 0 /* def DIAGNOSTIC */
383 1.69 enami /* Check fstype field of component. */
384 1.69 enami if (dpart.part->p_fstype != FS_CCD)
385 1.69 enami printf("%s: WARNING: %s: fstype %d != FS_CCD\n",
386 1.69 enami cs->sc_xname, ci->ci_path, dpart.part->p_fstype);
387 1.69 enami #endif
388 1.7 cgd
389 1.11 thorpej /*
390 1.11 thorpej * Calculate the size, truncating to an interleave
391 1.11 thorpej * boundary if necessary.
392 1.11 thorpej */
393 1.46 thorpej maxsecsize =
394 1.46 thorpej ((dpart.disklab->d_secsize > maxsecsize) ?
395 1.46 thorpej dpart.disklab->d_secsize : maxsecsize);
396 1.46 thorpej size = dpart.part->p_size;
397 1.1 hpeyerl if (cs->sc_ileave > 1)
398 1.1 hpeyerl size -= size % cs->sc_ileave;
399 1.11 thorpej
400 1.1 hpeyerl if (size == 0) {
401 1.11 thorpej #ifdef DEBUG
402 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
403 1.35 christos printf("%s: %s: size == 0\n",
404 1.23 thorpej cs->sc_xname, ci->ci_path);
405 1.11 thorpej #endif
406 1.67 enami error = ENODEV;
407 1.67 enami goto out;
408 1.3 hpeyerl }
409 1.11 thorpej
410 1.1 hpeyerl if (minsize == 0 || size < minsize)
411 1.1 hpeyerl minsize = size;
412 1.1 hpeyerl ci->ci_size = size;
413 1.1 hpeyerl cs->sc_size += size;
414 1.1 hpeyerl }
415 1.11 thorpej
416 1.11 thorpej /*
417 1.11 thorpej * Don't allow the interleave to be smaller than
418 1.11 thorpej * the biggest component sector.
419 1.11 thorpej */
420 1.11 thorpej if ((cs->sc_ileave > 0) &&
421 1.11 thorpej (cs->sc_ileave < (maxsecsize / DEV_BSIZE))) {
422 1.11 thorpej #ifdef DEBUG
423 1.11 thorpej if (ccddebug & (CCDB_FOLLOW|CCDB_INIT))
424 1.35 christos printf("%s: interleave must be at least %d\n",
425 1.23 thorpej cs->sc_xname, (maxsecsize / DEV_BSIZE));
426 1.11 thorpej #endif
427 1.67 enami error = EINVAL;
428 1.67 enami goto out;
429 1.11 thorpej }
430 1.11 thorpej
431 1.1 hpeyerl /*
432 1.1 hpeyerl * If uniform interleave is desired set all sizes to that of
433 1.1 hpeyerl * the smallest component.
434 1.1 hpeyerl */
435 1.57 thorpej if (cs->sc_flags & CCDF_UNIFORM) {
436 1.1 hpeyerl for (ci = cs->sc_cinfo;
437 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
438 1.1 hpeyerl ci->ci_size = minsize;
439 1.24 thorpej
440 1.53 thorpej cs->sc_size = cs->sc_nccdisks * minsize;
441 1.1 hpeyerl }
442 1.11 thorpej
443 1.11 thorpej /*
444 1.11 thorpej * Construct the interleave table.
445 1.11 thorpej */
446 1.57 thorpej ccdinterleave(cs);
447 1.11 thorpej
448 1.1 hpeyerl /*
449 1.11 thorpej * Create pseudo-geometry based on 1MB cylinders. It's
450 1.11 thorpej * pretty close.
451 1.1 hpeyerl */
452 1.11 thorpej ccg->ccg_secsize = DEV_BSIZE;
453 1.19 thorpej ccg->ccg_ntracks = 1;
454 1.11 thorpej ccg->ccg_nsectors = 1024 * (1024 / ccg->ccg_secsize);
455 1.11 thorpej ccg->ccg_ncylinders = cs->sc_size / ccg->ccg_nsectors;
456 1.129.10.2 msaitoh
457 1.129.10.2 msaitoh if (cs->sc_ileave > 0)
458 1.129.10.2 msaitoh aprint_normal("%s: Interleaving %d component%s "
459 1.129.10.2 msaitoh "(%d block interleave)\n", cs->sc_xname,
460 1.129.10.2 msaitoh cs->sc_nccdisks, (cs->sc_nccdisks != 0 ? "s" : ""),
461 1.129.10.2 msaitoh cs->sc_ileave);
462 1.129.10.2 msaitoh else
463 1.129.10.2 msaitoh aprint_normal("%s: Concatenating %d component%s\n",
464 1.129.10.2 msaitoh cs->sc_xname,
465 1.129.10.2 msaitoh cs->sc_nccdisks, (cs->sc_nccdisks != 0 ? "s" : ""));
466 1.129.10.2 msaitoh for (ix = 0; ix < cs->sc_nccdisks; ix++) {
467 1.129.10.2 msaitoh ci = &cs->sc_cinfo[ix];
468 1.129.10.2 msaitoh aprint_normal("%s: %s (%ju blocks)\n", cs->sc_xname,
469 1.129.10.2 msaitoh ci->ci_path, (uintmax_t)ci->ci_size);
470 1.129.10.2 msaitoh }
471 1.129.10.2 msaitoh aprint_normal("%s: total %ju blocks\n", cs->sc_xname, cs->sc_size);
472 1.11 thorpej
473 1.129.10.1 snj /*
474 1.129.10.1 snj * Create thread to handle deferred I/O.
475 1.129.10.1 snj */
476 1.129.10.1 snj cs->sc_zap = false;
477 1.129.10.1 snj error = kthread_create(PRI_BIO, KTHREAD_MPSAFE, NULL, ccdthread,
478 1.129.10.1 snj cs, &cs->sc_thread, "%s", cs->sc_xname);
479 1.129.10.1 snj if (error) {
480 1.129.10.1 snj printf("ccdinit: can't create thread: %d\n", error);
481 1.129.10.1 snj goto out;
482 1.129.10.1 snj }
483 1.114 christos
484 1.129.10.1 snj /*
485 1.129.10.1 snj * Only now that everything is set up can we enable the device.
486 1.129.10.1 snj */
487 1.129.10.1 snj mutex_enter(cs->sc_iolock);
488 1.129.10.1 snj cs->sc_flags |= CCDF_INITED;
489 1.129.10.1 snj mutex_exit(cs->sc_iolock);
490 1.129.10.1 snj kmem_free(tmppath, MAXPATHLEN);
491 1.11 thorpej return (0);
492 1.67 enami
493 1.67 enami out:
494 1.129.10.1 snj for (ix = 0; ix < path_alloced; ix++) {
495 1.129.10.1 snj kmem_free(cs->sc_cinfo[ix].ci_path,
496 1.129.10.1 snj cs->sc_cinfo[ix].ci_pathlen);
497 1.129.10.1 snj }
498 1.129.10.1 snj kmem_free(cs->sc_cinfo, cs->sc_nccdisks * sizeof(struct ccdcinfo));
499 1.129.10.1 snj kmem_free(tmppath, MAXPATHLEN);
500 1.67 enami return (error);
501 1.1 hpeyerl }
502 1.1 hpeyerl
503 1.11 thorpej static void
504 1.97 thorpej ccdinterleave(struct ccd_softc *cs)
505 1.1 hpeyerl {
506 1.68 augustss struct ccdcinfo *ci, *smallci;
507 1.68 augustss struct ccdiinfo *ii;
508 1.68 augustss daddr_t bn, lbn;
509 1.68 augustss int ix;
510 1.1 hpeyerl u_long size;
511 1.1 hpeyerl
512 1.1 hpeyerl #ifdef DEBUG
513 1.3 hpeyerl if (ccddebug & CCDB_INIT)
514 1.35 christos printf("ccdinterleave(%p): ileave %d\n", cs, cs->sc_ileave);
515 1.1 hpeyerl #endif
516 1.1 hpeyerl /*
517 1.1 hpeyerl * Allocate an interleave table.
518 1.1 hpeyerl * Chances are this is too big, but we don't care.
519 1.1 hpeyerl */
520 1.1 hpeyerl size = (cs->sc_nccdisks + 1) * sizeof(struct ccdiinfo);
521 1.129.10.1 snj cs->sc_itable = kmem_zalloc(size, KM_SLEEP);
522 1.11 thorpej
523 1.1 hpeyerl /*
524 1.1 hpeyerl * Trivial case: no interleave (actually interleave of disk size).
525 1.11 thorpej * Each table entry represents a single component in its entirety.
526 1.1 hpeyerl */
527 1.1 hpeyerl if (cs->sc_ileave == 0) {
528 1.1 hpeyerl bn = 0;
529 1.1 hpeyerl ii = cs->sc_itable;
530 1.11 thorpej
531 1.1 hpeyerl for (ix = 0; ix < cs->sc_nccdisks; ix++) {
532 1.19 thorpej /* Allocate space for ii_index. */
533 1.129.10.1 snj ii->ii_indexsz = sizeof(int);
534 1.129.10.1 snj ii->ii_index = kmem_alloc(ii->ii_indexsz, KM_SLEEP);
535 1.1 hpeyerl ii->ii_ndisk = 1;
536 1.1 hpeyerl ii->ii_startblk = bn;
537 1.1 hpeyerl ii->ii_startoff = 0;
538 1.1 hpeyerl ii->ii_index[0] = ix;
539 1.1 hpeyerl bn += cs->sc_cinfo[ix].ci_size;
540 1.1 hpeyerl ii++;
541 1.1 hpeyerl }
542 1.1 hpeyerl ii->ii_ndisk = 0;
543 1.1 hpeyerl #ifdef DEBUG
544 1.3 hpeyerl if (ccddebug & CCDB_INIT)
545 1.1 hpeyerl printiinfo(cs->sc_itable);
546 1.1 hpeyerl #endif
547 1.11 thorpej return;
548 1.1 hpeyerl }
549 1.11 thorpej
550 1.1 hpeyerl /*
551 1.1 hpeyerl * The following isn't fast or pretty; it doesn't have to be.
552 1.1 hpeyerl */
553 1.1 hpeyerl size = 0;
554 1.1 hpeyerl bn = lbn = 0;
555 1.1 hpeyerl for (ii = cs->sc_itable; ; ii++) {
556 1.11 thorpej /* Allocate space for ii_index. */
557 1.129.10.1 snj ii->ii_indexsz = sizeof(int) * cs->sc_nccdisks;
558 1.129.10.1 snj ii->ii_index = kmem_alloc(ii->ii_indexsz, KM_SLEEP);
559 1.11 thorpej
560 1.1 hpeyerl /*
561 1.1 hpeyerl * Locate the smallest of the remaining components
562 1.1 hpeyerl */
563 1.1 hpeyerl smallci = NULL;
564 1.1 hpeyerl for (ci = cs->sc_cinfo;
565 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
566 1.1 hpeyerl if (ci->ci_size > size &&
567 1.1 hpeyerl (smallci == NULL ||
568 1.1 hpeyerl ci->ci_size < smallci->ci_size))
569 1.1 hpeyerl smallci = ci;
570 1.11 thorpej
571 1.1 hpeyerl /*
572 1.1 hpeyerl * Nobody left, all done
573 1.1 hpeyerl */
574 1.1 hpeyerl if (smallci == NULL) {
575 1.1 hpeyerl ii->ii_ndisk = 0;
576 1.1 hpeyerl break;
577 1.1 hpeyerl }
578 1.11 thorpej
579 1.1 hpeyerl /*
580 1.1 hpeyerl * Record starting logical block and component offset
581 1.1 hpeyerl */
582 1.1 hpeyerl ii->ii_startblk = bn / cs->sc_ileave;
583 1.1 hpeyerl ii->ii_startoff = lbn;
584 1.11 thorpej
585 1.1 hpeyerl /*
586 1.1 hpeyerl * Determine how many disks take part in this interleave
587 1.1 hpeyerl * and record their indices.
588 1.1 hpeyerl */
589 1.1 hpeyerl ix = 0;
590 1.1 hpeyerl for (ci = cs->sc_cinfo;
591 1.1 hpeyerl ci < &cs->sc_cinfo[cs->sc_nccdisks]; ci++)
592 1.1 hpeyerl if (ci->ci_size >= smallci->ci_size)
593 1.1 hpeyerl ii->ii_index[ix++] = ci - cs->sc_cinfo;
594 1.1 hpeyerl ii->ii_ndisk = ix;
595 1.1 hpeyerl bn += ix * (smallci->ci_size - size);
596 1.1 hpeyerl lbn = smallci->ci_size / cs->sc_ileave;
597 1.1 hpeyerl size = smallci->ci_size;
598 1.1 hpeyerl }
599 1.1 hpeyerl #ifdef DEBUG
600 1.3 hpeyerl if (ccddebug & CCDB_INIT)
601 1.1 hpeyerl printiinfo(cs->sc_itable);
602 1.1 hpeyerl #endif
603 1.1 hpeyerl }
604 1.1 hpeyerl
605 1.11 thorpej /* ARGSUSED */
606 1.97 thorpej static int
607 1.116 christos ccdopen(dev_t dev, int flags, int fmt, struct lwp *l)
608 1.1 hpeyerl {
609 1.1 hpeyerl int unit = ccdunit(dev);
610 1.11 thorpej struct ccd_softc *cs;
611 1.11 thorpej struct disklabel *lp;
612 1.15 thorpej int error = 0, part, pmask;
613 1.1 hpeyerl
614 1.1 hpeyerl #ifdef DEBUG
615 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
616 1.43 fair printf("ccdopen(0x%x, 0x%x)\n", dev, flags);
617 1.1 hpeyerl #endif
618 1.11 thorpej if (unit >= numccd)
619 1.11 thorpej return (ENXIO);
620 1.11 thorpej cs = &ccd_softc[unit];
621 1.15 thorpej
622 1.129.10.1 snj mutex_enter(&cs->sc_dvlock);
623 1.15 thorpej
624 1.23 thorpej lp = cs->sc_dkdev.dk_label;
625 1.11 thorpej
626 1.11 thorpej part = DISKPART(dev);
627 1.11 thorpej pmask = (1 << part);
628 1.11 thorpej
629 1.15 thorpej /*
630 1.15 thorpej * If we're initialized, check to see if there are any other
631 1.15 thorpej * open partitions. If not, then it's safe to update
632 1.87 thorpej * the in-core disklabel. Only read the disklabel if it is
633 1.87 thorpej * not already valid.
634 1.15 thorpej */
635 1.87 thorpej if ((cs->sc_flags & (CCDF_INITED|CCDF_VLABEL)) == CCDF_INITED &&
636 1.87 thorpej cs->sc_dkdev.dk_openmask == 0)
637 1.15 thorpej ccdgetdisklabel(dev);
638 1.15 thorpej
639 1.11 thorpej /* Check that the partition exists. */
640 1.27 thorpej if (part != RAW_PART) {
641 1.27 thorpej if (((cs->sc_flags & CCDF_INITED) == 0) ||
642 1.37 thorpej ((part >= lp->d_npartitions) ||
643 1.27 thorpej (lp->d_partitions[part].p_fstype == FS_UNUSED))) {
644 1.27 thorpej error = ENXIO;
645 1.27 thorpej goto done;
646 1.27 thorpej }
647 1.15 thorpej }
648 1.11 thorpej
649 1.11 thorpej /* Prevent our unit from being unconfigured while open. */
650 1.11 thorpej switch (fmt) {
651 1.11 thorpej case S_IFCHR:
652 1.11 thorpej cs->sc_dkdev.dk_copenmask |= pmask;
653 1.11 thorpej break;
654 1.11 thorpej
655 1.11 thorpej case S_IFBLK:
656 1.11 thorpej cs->sc_dkdev.dk_bopenmask |= pmask;
657 1.11 thorpej break;
658 1.11 thorpej }
659 1.11 thorpej cs->sc_dkdev.dk_openmask =
660 1.11 thorpej cs->sc_dkdev.dk_copenmask | cs->sc_dkdev.dk_bopenmask;
661 1.11 thorpej
662 1.15 thorpej done:
663 1.129.10.1 snj mutex_exit(&cs->sc_dvlock);
664 1.33 thorpej return (error);
665 1.7 cgd }
666 1.7 cgd
667 1.11 thorpej /* ARGSUSED */
668 1.97 thorpej static int
669 1.116 christos ccdclose(dev_t dev, int flags, int fmt, struct lwp *l)
670 1.7 cgd {
671 1.11 thorpej int unit = ccdunit(dev);
672 1.11 thorpej struct ccd_softc *cs;
673 1.117 ad int part;
674 1.11 thorpej
675 1.7 cgd #ifdef DEBUG
676 1.7 cgd if (ccddebug & CCDB_FOLLOW)
677 1.43 fair printf("ccdclose(0x%x, 0x%x)\n", dev, flags);
678 1.7 cgd #endif
679 1.11 thorpej
680 1.11 thorpej if (unit >= numccd)
681 1.11 thorpej return (ENXIO);
682 1.11 thorpej cs = &ccd_softc[unit];
683 1.15 thorpej
684 1.129.10.1 snj mutex_enter(&cs->sc_dvlock);
685 1.15 thorpej
686 1.11 thorpej part = DISKPART(dev);
687 1.11 thorpej
688 1.11 thorpej /* ...that much closer to allowing unconfiguration... */
689 1.11 thorpej switch (fmt) {
690 1.11 thorpej case S_IFCHR:
691 1.11 thorpej cs->sc_dkdev.dk_copenmask &= ~(1 << part);
692 1.11 thorpej break;
693 1.11 thorpej
694 1.11 thorpej case S_IFBLK:
695 1.11 thorpej cs->sc_dkdev.dk_bopenmask &= ~(1 << part);
696 1.11 thorpej break;
697 1.11 thorpej }
698 1.11 thorpej cs->sc_dkdev.dk_openmask =
699 1.11 thorpej cs->sc_dkdev.dk_copenmask | cs->sc_dkdev.dk_bopenmask;
700 1.11 thorpej
701 1.87 thorpej if (cs->sc_dkdev.dk_openmask == 0) {
702 1.87 thorpej if ((cs->sc_flags & CCDF_KLABEL) == 0)
703 1.87 thorpej cs->sc_flags &= ~CCDF_VLABEL;
704 1.87 thorpej }
705 1.87 thorpej
706 1.129.10.1 snj mutex_exit(&cs->sc_dvlock);
707 1.7 cgd return (0);
708 1.1 hpeyerl }
709 1.1 hpeyerl
710 1.129.10.1 snj static bool
711 1.129.10.1 snj ccdbackoff(struct ccd_softc *cs)
712 1.129.10.1 snj {
713 1.129.10.1 snj
714 1.129.10.1 snj /* XXX Arbitrary, should be a uvm call. */
715 1.129.10.1 snj return uvmexp.free < (uvmexp.freemin >> 1) &&
716 1.129.10.1 snj disk_isbusy(&cs->sc_dkdev);
717 1.129.10.1 snj }
718 1.129.10.1 snj
719 1.129.10.1 snj static void
720 1.129.10.1 snj ccdthread(void *cookie)
721 1.129.10.1 snj {
722 1.129.10.1 snj struct ccd_softc *cs;
723 1.129.10.1 snj
724 1.129.10.1 snj cs = cookie;
725 1.129.10.1 snj
726 1.129.10.1 snj #ifdef DEBUG
727 1.129.10.1 snj if (ccddebug & CCDB_FOLLOW)
728 1.129.10.1 snj printf("ccdthread: hello\n");
729 1.129.10.1 snj #endif
730 1.129.10.1 snj
731 1.129.10.1 snj mutex_enter(cs->sc_iolock);
732 1.129.10.1 snj while (__predict_true(!cs->sc_zap)) {
733 1.129.10.1 snj if (bufq_peek(cs->sc_bufq) == NULL) {
734 1.129.10.1 snj /* Nothing to do. */
735 1.129.10.1 snj cv_wait(&cs->sc_push, cs->sc_iolock);
736 1.129.10.1 snj continue;
737 1.129.10.1 snj }
738 1.129.10.1 snj if (ccdbackoff(cs)) {
739 1.129.10.1 snj /* Wait for memory to become available. */
740 1.129.10.1 snj (void)cv_timedwait(&cs->sc_push, cs->sc_iolock, 1);
741 1.129.10.1 snj continue;
742 1.129.10.1 snj }
743 1.129.10.1 snj #ifdef DEBUG
744 1.129.10.1 snj if (ccddebug & CCDB_FOLLOW)
745 1.129.10.1 snj printf("ccdthread: dispatching I/O\n");
746 1.129.10.1 snj #endif
747 1.129.10.1 snj ccdstart(cs);
748 1.129.10.1 snj mutex_enter(cs->sc_iolock);
749 1.129.10.1 snj }
750 1.129.10.1 snj cs->sc_thread = NULL;
751 1.129.10.1 snj mutex_exit(cs->sc_iolock);
752 1.129.10.1 snj #ifdef DEBUG
753 1.129.10.1 snj if (ccddebug & CCDB_FOLLOW)
754 1.129.10.1 snj printf("ccdthread: goodbye\n");
755 1.129.10.1 snj #endif
756 1.129.10.1 snj kthread_exit(0);
757 1.129.10.1 snj }
758 1.129.10.1 snj
759 1.97 thorpej static void
760 1.97 thorpej ccdstrategy(struct buf *bp)
761 1.1 hpeyerl {
762 1.68 augustss int unit = ccdunit(bp->b_dev);
763 1.68 augustss struct ccd_softc *cs = &ccd_softc[unit];
764 1.129.10.1 snj
765 1.129.10.1 snj /* Must be open or reading label. */
766 1.129.10.1 snj KASSERT(cs->sc_dkdev.dk_openmask != 0 ||
767 1.129.10.1 snj (cs->sc_flags & CCDF_RLABEL) != 0);
768 1.129.10.1 snj
769 1.129.10.1 snj mutex_enter(cs->sc_iolock);
770 1.129.10.1 snj /* Synchronize with device init/uninit. */
771 1.129.10.1 snj if (__predict_false((cs->sc_flags & CCDF_INITED) == 0)) {
772 1.129.10.1 snj mutex_exit(cs->sc_iolock);
773 1.129.10.1 snj #ifdef DEBUG
774 1.129.10.1 snj if (ccddebug & CCDB_FOLLOW)
775 1.129.10.1 snj printf("ccdstrategy: unit %d: not inited\n", unit);
776 1.129.10.1 snj #endif
777 1.129.10.1 snj bp->b_error = ENXIO;
778 1.129.10.1 snj bp->b_resid = bp->b_bcount;
779 1.129.10.1 snj biodone(bp);
780 1.129.10.1 snj return;
781 1.129.10.1 snj }
782 1.129.10.1 snj
783 1.129.10.1 snj /* Defer to thread if system is low on memory. */
784 1.129.10.1 snj bufq_put(cs->sc_bufq, bp);
785 1.129.10.1 snj if (__predict_false(ccdbackoff(cs))) {
786 1.129.10.1 snj mutex_exit(cs->sc_iolock);
787 1.129.10.1 snj #ifdef DEBUG
788 1.129.10.1 snj if (ccddebug & CCDB_FOLLOW)
789 1.129.10.1 snj printf("ccdstrategy: holding off on I/O\n");
790 1.129.10.1 snj #endif
791 1.129.10.1 snj return;
792 1.129.10.1 snj }
793 1.129.10.1 snj ccdstart(cs);
794 1.129.10.1 snj }
795 1.129.10.1 snj
796 1.129.10.1 snj static void
797 1.129.10.1 snj ccdstart(struct ccd_softc *cs)
798 1.129.10.1 snj {
799 1.88 thorpej daddr_t blkno;
800 1.11 thorpej int wlabel;
801 1.15 thorpej struct disklabel *lp;
802 1.129.10.1 snj long bcount, rcount;
803 1.129.10.1 snj struct ccdbuf *cbp;
804 1.129.10.1 snj char *addr;
805 1.129.10.1 snj daddr_t bn;
806 1.129.10.1 snj vnode_t *vp;
807 1.129.10.1 snj buf_t *bp;
808 1.129.10.1 snj
809 1.129.10.1 snj KASSERT(mutex_owned(cs->sc_iolock));
810 1.129.10.1 snj
811 1.129.10.1 snj disk_busy(&cs->sc_dkdev);
812 1.129.10.1 snj bp = bufq_get(cs->sc_bufq);
813 1.129.10.1 snj KASSERT(bp != NULL);
814 1.1 hpeyerl
815 1.1 hpeyerl #ifdef DEBUG
816 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
817 1.129.10.1 snj printf("ccdstart(%s, %p)\n", cs->sc_xname, bp);
818 1.59 thorpej #endif
819 1.11 thorpej
820 1.11 thorpej /* If it's a nil transfer, wake up the top half now. */
821 1.11 thorpej if (bp->b_bcount == 0)
822 1.11 thorpej goto done;
823 1.11 thorpej
824 1.23 thorpej lp = cs->sc_dkdev.dk_label;
825 1.15 thorpej
826 1.11 thorpej /*
827 1.17 thorpej * Do bounds checking and adjust transfer. If there's an
828 1.88 thorpej * error, the bounds check will flag that for us. Convert
829 1.88 thorpej * the partition relative block number to an absolute.
830 1.11 thorpej */
831 1.88 thorpej blkno = bp->b_blkno;
832 1.11 thorpej wlabel = cs->sc_flags & (CCDF_WLABEL|CCDF_LABELLING);
833 1.88 thorpej if (DISKPART(bp->b_dev) != RAW_PART) {
834 1.86 thorpej if (bounds_check_with_label(&cs->sc_dkdev, bp, wlabel) <= 0)
835 1.1 hpeyerl goto done;
836 1.88 thorpej blkno += lp->d_partitions[DISKPART(bp->b_dev)].p_offset;
837 1.88 thorpej }
838 1.129.10.1 snj mutex_exit(cs->sc_iolock);
839 1.88 thorpej bp->b_rawblkno = blkno;
840 1.11 thorpej
841 1.129.10.1 snj /* Allocate the component buffers and start I/O! */
842 1.129.10.1 snj bp->b_resid = bp->b_bcount;
843 1.129.10.1 snj bn = bp->b_rawblkno;
844 1.129.10.1 snj addr = bp->b_data;
845 1.129.10.1 snj for (bcount = bp->b_bcount; bcount > 0; bcount -= rcount) {
846 1.129.10.1 snj cbp = ccdbuffer(cs, bp, bn, addr, bcount);
847 1.129.10.1 snj rcount = cbp->cb_buf.b_bcount;
848 1.129.10.1 snj bn += btodb(rcount);
849 1.129.10.1 snj addr += rcount;
850 1.129.10.1 snj vp = cbp->cb_buf.b_vp;
851 1.129.10.1 snj if ((cbp->cb_buf.b_flags & B_READ) == 0) {
852 1.129.10.1 snj mutex_enter(&vp->v_interlock);
853 1.129.10.1 snj vp->v_numoutput++;
854 1.129.10.1 snj mutex_exit(&vp->v_interlock);
855 1.129.10.1 snj }
856 1.129.10.1 snj (void)VOP_STRATEGY(vp, &cbp->cb_buf);
857 1.129.10.1 snj }
858 1.1 hpeyerl return;
859 1.88 thorpej
860 1.88 thorpej done:
861 1.129.10.1 snj disk_unbusy(&cs->sc_dkdev, 0, 0);
862 1.129.10.1 snj cv_broadcast(&cs->sc_stop);
863 1.129.10.1 snj cv_broadcast(&cs->sc_push);
864 1.129.10.1 snj mutex_exit(cs->sc_iolock);
865 1.88 thorpej bp->b_resid = bp->b_bcount;
866 1.1 hpeyerl biodone(bp);
867 1.1 hpeyerl }
868 1.1 hpeyerl
869 1.1 hpeyerl /*
870 1.1 hpeyerl * Build a component buffer header.
871 1.1 hpeyerl */
872 1.55 thorpej static struct ccdbuf *
873 1.118 christos ccdbuffer(struct ccd_softc *cs, struct buf *bp, daddr_t bn, void *addr,
874 1.97 thorpej long bcount)
875 1.1 hpeyerl {
876 1.68 augustss struct ccdcinfo *ci;
877 1.68 augustss struct ccdbuf *cbp;
878 1.68 augustss daddr_t cbn, cboff;
879 1.68 augustss u_int64_t cbc;
880 1.36 thorpej int ccdisk;
881 1.1 hpeyerl
882 1.1 hpeyerl #ifdef DEBUG
883 1.3 hpeyerl if (ccddebug & CCDB_IO)
884 1.81 kleink printf("ccdbuffer(%p, %p, %" PRId64 ", %p, %ld)\n",
885 1.1 hpeyerl cs, bp, bn, addr, bcount);
886 1.1 hpeyerl #endif
887 1.1 hpeyerl /*
888 1.1 hpeyerl * Determine which component bn falls in.
889 1.1 hpeyerl */
890 1.1 hpeyerl cbn = bn;
891 1.1 hpeyerl cboff = 0;
892 1.11 thorpej
893 1.1 hpeyerl /*
894 1.1 hpeyerl * Serially concatenated
895 1.1 hpeyerl */
896 1.1 hpeyerl if (cs->sc_ileave == 0) {
897 1.68 augustss daddr_t sblk;
898 1.1 hpeyerl
899 1.1 hpeyerl sblk = 0;
900 1.36 thorpej for (ccdisk = 0, ci = &cs->sc_cinfo[ccdisk];
901 1.36 thorpej cbn >= sblk + ci->ci_size;
902 1.36 thorpej ccdisk++, ci = &cs->sc_cinfo[ccdisk])
903 1.1 hpeyerl sblk += ci->ci_size;
904 1.1 hpeyerl cbn -= sblk;
905 1.1 hpeyerl }
906 1.1 hpeyerl /*
907 1.1 hpeyerl * Interleaved
908 1.1 hpeyerl */
909 1.1 hpeyerl else {
910 1.68 augustss struct ccdiinfo *ii;
911 1.36 thorpej int off;
912 1.1 hpeyerl
913 1.1 hpeyerl cboff = cbn % cs->sc_ileave;
914 1.1 hpeyerl cbn /= cs->sc_ileave;
915 1.1 hpeyerl for (ii = cs->sc_itable; ii->ii_ndisk; ii++)
916 1.1 hpeyerl if (ii->ii_startblk > cbn)
917 1.1 hpeyerl break;
918 1.1 hpeyerl ii--;
919 1.1 hpeyerl off = cbn - ii->ii_startblk;
920 1.1 hpeyerl if (ii->ii_ndisk == 1) {
921 1.1 hpeyerl ccdisk = ii->ii_index[0];
922 1.1 hpeyerl cbn = ii->ii_startoff + off;
923 1.1 hpeyerl } else {
924 1.53 thorpej ccdisk = ii->ii_index[off % ii->ii_ndisk];
925 1.53 thorpej cbn = ii->ii_startoff + off / ii->ii_ndisk;
926 1.1 hpeyerl }
927 1.1 hpeyerl cbn *= cs->sc_ileave;
928 1.1 hpeyerl ci = &cs->sc_cinfo[ccdisk];
929 1.1 hpeyerl }
930 1.11 thorpej
931 1.1 hpeyerl /*
932 1.1 hpeyerl * Fill in the component buf structure.
933 1.1 hpeyerl */
934 1.63 thorpej cbp = CCD_GETBUF();
935 1.129.10.1 snj KASSERT(cbp != NULL);
936 1.126 ad buf_init(&cbp->cb_buf);
937 1.126 ad cbp->cb_buf.b_flags = bp->b_flags;
938 1.126 ad cbp->cb_buf.b_oflags = bp->b_oflags;
939 1.126 ad cbp->cb_buf.b_cflags = bp->b_cflags;
940 1.29 christos cbp->cb_buf.b_iodone = ccdiodone;
941 1.6 cgd cbp->cb_buf.b_proc = bp->b_proc;
942 1.95 hannken cbp->cb_buf.b_dev = ci->ci_dev;
943 1.6 cgd cbp->cb_buf.b_blkno = cbn + cboff;
944 1.6 cgd cbp->cb_buf.b_data = addr;
945 1.11 thorpej cbp->cb_buf.b_vp = ci->ci_vp;
946 1.127 hannken cbp->cb_buf.b_objlock = &ci->ci_vp->v_interlock;
947 1.1 hpeyerl if (cs->sc_ileave == 0)
948 1.50 thorpej cbc = dbtob((u_int64_t)(ci->ci_size - cbn));
949 1.1 hpeyerl else
950 1.50 thorpej cbc = dbtob((u_int64_t)(cs->sc_ileave - cboff));
951 1.50 thorpej cbp->cb_buf.b_bcount = cbc < bcount ? cbc : bcount;
952 1.6 cgd
953 1.1 hpeyerl /*
954 1.6 cgd * context for ccdiodone
955 1.1 hpeyerl */
956 1.6 cgd cbp->cb_obp = bp;
957 1.59 thorpej cbp->cb_sc = cs;
958 1.36 thorpej cbp->cb_comp = ccdisk;
959 1.6 cgd
960 1.94 yamt BIO_COPYPRIO(&cbp->cb_buf, bp);
961 1.94 yamt
962 1.1 hpeyerl #ifdef DEBUG
963 1.3 hpeyerl if (ccddebug & CCDB_IO)
964 1.81 kleink printf(" dev 0x%x(u%lu): cbp %p bn %" PRId64 " addr %p"
965 1.99 yamt " bcnt %d\n",
966 1.62 mjacob ci->ci_dev, (unsigned long) (ci-cs->sc_cinfo), cbp,
967 1.62 mjacob cbp->cb_buf.b_blkno, cbp->cb_buf.b_data,
968 1.62 mjacob cbp->cb_buf.b_bcount);
969 1.1 hpeyerl #endif
970 1.55 thorpej
971 1.55 thorpej return (cbp);
972 1.1 hpeyerl }
973 1.1 hpeyerl
974 1.1 hpeyerl /*
975 1.11 thorpej * Called at interrupt time.
976 1.1 hpeyerl * Mark the component as done and if all components are done,
977 1.1 hpeyerl * take a ccd interrupt.
978 1.1 hpeyerl */
979 1.97 thorpej static void
980 1.97 thorpej ccdiodone(struct buf *vbp)
981 1.1 hpeyerl {
982 1.29 christos struct ccdbuf *cbp = (struct ccdbuf *) vbp;
983 1.59 thorpej struct buf *bp = cbp->cb_obp;
984 1.59 thorpej struct ccd_softc *cs = cbp->cb_sc;
985 1.129.10.1 snj int count;
986 1.1 hpeyerl
987 1.1 hpeyerl #ifdef DEBUG
988 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
989 1.35 christos printf("ccdiodone(%p)\n", cbp);
990 1.3 hpeyerl if (ccddebug & CCDB_IO) {
991 1.99 yamt printf("ccdiodone: bp %p bcount %d resid %d\n",
992 1.53 thorpej bp, bp->b_bcount, bp->b_resid);
993 1.81 kleink printf(" dev 0x%x(u%d), cbp %p bn %" PRId64 " addr %p"
994 1.99 yamt " bcnt %d\n",
995 1.6 cgd cbp->cb_buf.b_dev, cbp->cb_comp, cbp,
996 1.6 cgd cbp->cb_buf.b_blkno, cbp->cb_buf.b_data,
997 1.6 cgd cbp->cb_buf.b_bcount);
998 1.1 hpeyerl }
999 1.1 hpeyerl #endif
1000 1.1 hpeyerl
1001 1.122 ad if (cbp->cb_buf.b_error != 0) {
1002 1.122 ad bp->b_error = cbp->cb_buf.b_error;
1003 1.53 thorpej printf("%s: error %d on component %d\n",
1004 1.53 thorpej cs->sc_xname, bp->b_error, cbp->cb_comp);
1005 1.1 hpeyerl }
1006 1.6 cgd count = cbp->cb_buf.b_bcount;
1007 1.126 ad buf_destroy(&cbp->cb_buf);
1008 1.63 thorpej CCD_PUTBUF(cbp);
1009 1.1 hpeyerl
1010 1.1 hpeyerl /*
1011 1.1 hpeyerl * If all done, "interrupt".
1012 1.53 thorpej */
1013 1.129.10.1 snj mutex_enter(cs->sc_iolock);
1014 1.53 thorpej bp->b_resid -= count;
1015 1.53 thorpej if (bp->b_resid < 0)
1016 1.53 thorpej panic("ccdiodone: count");
1017 1.129.10.1 snj if (bp->b_resid == 0) {
1018 1.129.10.1 snj /*
1019 1.129.10.1 snj * Request is done for better or worse, wakeup the top half.
1020 1.129.10.1 snj */
1021 1.129.10.1 snj if (bp->b_error != 0)
1022 1.129.10.1 snj bp->b_resid = bp->b_bcount;
1023 1.129.10.1 snj disk_unbusy(&cs->sc_dkdev, (bp->b_bcount - bp->b_resid),
1024 1.129.10.1 snj (bp->b_flags & B_READ));
1025 1.129.10.1 snj if (!disk_isbusy(&cs->sc_dkdev)) {
1026 1.129.10.1 snj if (bufq_peek(cs->sc_bufq) != NULL) {
1027 1.129.10.1 snj cv_broadcast(&cs->sc_push);
1028 1.129.10.1 snj }
1029 1.129.10.1 snj cv_broadcast(&cs->sc_stop);
1030 1.129.10.1 snj }
1031 1.129.10.1 snj mutex_exit(cs->sc_iolock);
1032 1.129.10.1 snj biodone(bp);
1033 1.129.10.1 snj } else
1034 1.129.10.1 snj mutex_exit(cs->sc_iolock);
1035 1.1 hpeyerl }
1036 1.1 hpeyerl
1037 1.11 thorpej /* ARGSUSED */
1038 1.97 thorpej static int
1039 1.116 christos ccdread(dev_t dev, struct uio *uio, int flags)
1040 1.3 hpeyerl {
1041 1.11 thorpej int unit = ccdunit(dev);
1042 1.11 thorpej struct ccd_softc *cs;
1043 1.3 hpeyerl
1044 1.3 hpeyerl #ifdef DEBUG
1045 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
1046 1.43 fair printf("ccdread(0x%x, %p)\n", dev, uio);
1047 1.3 hpeyerl #endif
1048 1.11 thorpej if (unit >= numccd)
1049 1.11 thorpej return (ENXIO);
1050 1.11 thorpej cs = &ccd_softc[unit];
1051 1.11 thorpej
1052 1.129.10.1 snj /* Unlocked advisory check, ccdstrategy check is synchronous. */
1053 1.11 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1054 1.11 thorpej return (ENXIO);
1055 1.11 thorpej
1056 1.10 mycroft return (physio(ccdstrategy, NULL, dev, B_READ, minphys, uio));
1057 1.3 hpeyerl }
1058 1.3 hpeyerl
1059 1.11 thorpej /* ARGSUSED */
1060 1.97 thorpej static int
1061 1.116 christos ccdwrite(dev_t dev, struct uio *uio, int flags)
1062 1.3 hpeyerl {
1063 1.11 thorpej int unit = ccdunit(dev);
1064 1.11 thorpej struct ccd_softc *cs;
1065 1.3 hpeyerl
1066 1.3 hpeyerl #ifdef DEBUG
1067 1.3 hpeyerl if (ccddebug & CCDB_FOLLOW)
1068 1.43 fair printf("ccdwrite(0x%x, %p)\n", dev, uio);
1069 1.3 hpeyerl #endif
1070 1.11 thorpej if (unit >= numccd)
1071 1.11 thorpej return (ENXIO);
1072 1.11 thorpej cs = &ccd_softc[unit];
1073 1.11 thorpej
1074 1.129.10.1 snj /* Unlocked advisory check, ccdstrategy check is synchronous. */
1075 1.11 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1076 1.11 thorpej return (ENXIO);
1077 1.11 thorpej
1078 1.10 mycroft return (physio(ccdstrategy, NULL, dev, B_WRITE, minphys, uio));
1079 1.3 hpeyerl }
1080 1.3 hpeyerl
1081 1.97 thorpej static int
1082 1.118 christos ccdioctl(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
1083 1.1 hpeyerl {
1084 1.11 thorpej int unit = ccdunit(dev);
1085 1.129.10.1 snj int i, j, lookedup = 0, error = 0;
1086 1.39 mycroft int part, pmask;
1087 1.11 thorpej struct ccd_softc *cs;
1088 1.11 thorpej struct ccd_ioctl *ccio = (struct ccd_ioctl *)data;
1089 1.110 elad kauth_cred_t uc;
1090 1.11 thorpej char **cpp;
1091 1.11 thorpej struct vnode **vpp;
1092 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1093 1.70 fvdl struct disklabel newlabel;
1094 1.70 fvdl #endif
1095 1.11 thorpej
1096 1.11 thorpej if (unit >= numccd)
1097 1.11 thorpej return (ENXIO);
1098 1.11 thorpej cs = &ccd_softc[unit];
1099 1.129.10.1 snj uc = kauth_cred_get();
1100 1.109 jld
1101 1.129.10.2 msaitoh /*
1102 1.129.10.2 msaitoh * Compat code must not be called if on a platform where
1103 1.129.10.2 msaitoh * sizeof (size_t) == sizeof (uint64_t) as CCDIOCSET will
1104 1.129.10.2 msaitoh * be the same as CCDIOCSET_60
1105 1.129.10.2 msaitoh */
1106 1.129.10.2 msaitoh #ifndef _LP64
1107 1.129.10.2 msaitoh switch (cmd) {
1108 1.129.10.2 msaitoh case CCDIOCSET_60: {
1109 1.129.10.2 msaitoh struct ccd_ioctl ccionew;
1110 1.129.10.2 msaitoh struct ccd_ioctl_60 *ccio60 =
1111 1.129.10.2 msaitoh (struct ccd_ioctl_60 *)data;
1112 1.129.10.2 msaitoh ccionew.ccio_disks = ccio->ccio_disks;
1113 1.129.10.2 msaitoh ccionew.ccio_ndisks = ccio->ccio_ndisks;
1114 1.129.10.2 msaitoh ccionew.ccio_ileave = ccio->ccio_ileave;
1115 1.129.10.2 msaitoh ccionew.ccio_flags = ccio->ccio_flags;
1116 1.129.10.2 msaitoh ccionew.ccio_unit = ccio->ccio_unit;
1117 1.129.10.2 msaitoh error = ccdioctl(dev, CCDIOCSET, &ccionew, flag, l);
1118 1.129.10.2 msaitoh if (!error) {
1119 1.129.10.2 msaitoh /* Copy data back, adjust types if necessary */
1120 1.129.10.2 msaitoh ccio60->ccio_disks = ccionew.ccio_disks;
1121 1.129.10.2 msaitoh ccio60->ccio_ndisks = ccionew.ccio_ndisks;
1122 1.129.10.2 msaitoh ccio60->ccio_ileave = ccionew.ccio_ileave;
1123 1.129.10.2 msaitoh ccio60->ccio_flags = ccionew.ccio_flags;
1124 1.129.10.2 msaitoh ccio60->ccio_unit = ccionew.ccio_unit;
1125 1.129.10.2 msaitoh ccio60->ccio_size = (size_t)ccionew.ccio_size;
1126 1.129.10.2 msaitoh }
1127 1.129.10.2 msaitoh return error;
1128 1.129.10.2 msaitoh }
1129 1.129.10.2 msaitoh break;
1130 1.129.10.2 msaitoh
1131 1.129.10.2 msaitoh case CCDIOCCLR_60:
1132 1.129.10.2 msaitoh /*
1133 1.129.10.2 msaitoh * ccio_size member not used, so existing struct OK
1134 1.129.10.2 msaitoh * drop through to existing non-compat version
1135 1.129.10.2 msaitoh */
1136 1.129.10.2 msaitoh cmd = CCDIOCCLR;
1137 1.129.10.2 msaitoh break;
1138 1.129.10.2 msaitoh }
1139 1.129.10.2 msaitoh #endif /* !_LP64*/
1140 1.129.10.2 msaitoh
1141 1.41 thorpej /* Must be open for writes for these commands... */
1142 1.41 thorpej switch (cmd) {
1143 1.41 thorpej case CCDIOCSET:
1144 1.41 thorpej case CCDIOCCLR:
1145 1.41 thorpej case DIOCSDINFO:
1146 1.41 thorpej case DIOCWDINFO:
1147 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1148 1.70 fvdl case ODIOCSDINFO:
1149 1.70 fvdl case ODIOCWDINFO:
1150 1.70 fvdl #endif
1151 1.87 thorpej case DIOCKLABEL:
1152 1.41 thorpej case DIOCWLABEL:
1153 1.41 thorpej if ((flag & FWRITE) == 0)
1154 1.41 thorpej return (EBADF);
1155 1.41 thorpej }
1156 1.41 thorpej
1157 1.129.10.1 snj mutex_enter(&cs->sc_dvlock);
1158 1.57 thorpej
1159 1.41 thorpej /* Must be initialized for these... */
1160 1.41 thorpej switch (cmd) {
1161 1.41 thorpej case CCDIOCCLR:
1162 1.42 kleink case DIOCGDINFO:
1163 1.100 thorpej case DIOCCACHESYNC:
1164 1.42 kleink case DIOCSDINFO:
1165 1.42 kleink case DIOCWDINFO:
1166 1.42 kleink case DIOCGPART:
1167 1.41 thorpej case DIOCWLABEL:
1168 1.87 thorpej case DIOCKLABEL:
1169 1.44 thorpej case DIOCGDEFLABEL:
1170 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1171 1.70 fvdl case ODIOCGDINFO:
1172 1.70 fvdl case ODIOCSDINFO:
1173 1.70 fvdl case ODIOCWDINFO:
1174 1.70 fvdl case ODIOCGDEFLABEL:
1175 1.70 fvdl #endif
1176 1.57 thorpej if ((cs->sc_flags & CCDF_INITED) == 0) {
1177 1.57 thorpej error = ENXIO;
1178 1.57 thorpej goto out;
1179 1.57 thorpej }
1180 1.41 thorpej }
1181 1.41 thorpej
1182 1.11 thorpej switch (cmd) {
1183 1.11 thorpej case CCDIOCSET:
1184 1.57 thorpej if (cs->sc_flags & CCDF_INITED) {
1185 1.57 thorpej error = EBUSY;
1186 1.57 thorpej goto out;
1187 1.57 thorpej }
1188 1.54 thorpej
1189 1.54 thorpej /* Validate the flags. */
1190 1.57 thorpej if ((ccio->ccio_flags & CCDF_USERMASK) != ccio->ccio_flags) {
1191 1.57 thorpej error = EINVAL;
1192 1.57 thorpej goto out;
1193 1.57 thorpej }
1194 1.15 thorpej
1195 1.129.10.1 snj if (ccio->ccio_ndisks > CCD_MAXNDISKS ||
1196 1.129.10.1 snj ccio->ccio_ndisks == 0) {
1197 1.73 jdolecek error = EINVAL;
1198 1.73 jdolecek goto out;
1199 1.73 jdolecek }
1200 1.102 perry
1201 1.11 thorpej /* Fill in some important bits. */
1202 1.57 thorpej cs->sc_ileave = ccio->ccio_ileave;
1203 1.57 thorpej cs->sc_nccdisks = ccio->ccio_ndisks;
1204 1.57 thorpej cs->sc_flags = ccio->ccio_flags & CCDF_USERMASK;
1205 1.11 thorpej
1206 1.11 thorpej /*
1207 1.11 thorpej * Allocate space for and copy in the array of
1208 1.129.10.2 msaitoh * component pathnames and device numbers.
1209 1.11 thorpej */
1210 1.129.10.1 snj cpp = kmem_alloc(ccio->ccio_ndisks * sizeof(*cpp), KM_SLEEP);
1211 1.129.10.1 snj vpp = kmem_alloc(ccio->ccio_ndisks * sizeof(*vpp), KM_SLEEP);
1212 1.84 dsl error = copyin(ccio->ccio_disks, cpp,
1213 1.129.10.1 snj ccio->ccio_ndisks * sizeof(*cpp));
1214 1.11 thorpej if (error) {
1215 1.129.10.1 snj kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1216 1.129.10.1 snj kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1217 1.57 thorpej goto out;
1218 1.11 thorpej }
1219 1.11 thorpej
1220 1.11 thorpej #ifdef DEBUG
1221 1.11 thorpej if (ccddebug & CCDB_INIT)
1222 1.11 thorpej for (i = 0; i < ccio->ccio_ndisks; ++i)
1223 1.104 christos printf("ccdioctl: component %d: %p\n",
1224 1.11 thorpej i, cpp[i]);
1225 1.11 thorpej #endif
1226 1.11 thorpej
1227 1.11 thorpej for (i = 0; i < ccio->ccio_ndisks; ++i) {
1228 1.11 thorpej #ifdef DEBUG
1229 1.11 thorpej if (ccddebug & CCDB_INIT)
1230 1.35 christos printf("ccdioctl: lookedup = %d\n", lookedup);
1231 1.11 thorpej #endif
1232 1.120 cube if ((error = dk_lookup(cpp[i], l, &vpp[i],
1233 1.120 cube UIO_USERSPACE)) != 0) {
1234 1.11 thorpej for (j = 0; j < lookedup; ++j)
1235 1.12 thorpej (void)vn_close(vpp[j], FREAD|FWRITE,
1236 1.128 ad uc);
1237 1.129.10.1 snj kmem_free(vpp, ccio->ccio_ndisks *
1238 1.129.10.1 snj sizeof(*vpp));
1239 1.129.10.1 snj kmem_free(cpp, ccio->ccio_ndisks *
1240 1.129.10.1 snj sizeof(*cpp));
1241 1.57 thorpej goto out;
1242 1.11 thorpej }
1243 1.11 thorpej ++lookedup;
1244 1.11 thorpej }
1245 1.11 thorpej
1246 1.129.10.1 snj /* Attach the disk. */
1247 1.129.10.1 snj disk_attach(&cs->sc_dkdev);
1248 1.129.10.1 snj bufq_alloc(&cs->sc_bufq, "fcfs", 0);
1249 1.129.10.1 snj
1250 1.11 thorpej /*
1251 1.11 thorpej * Initialize the ccd. Fills in the softc for us.
1252 1.11 thorpej */
1253 1.107 christos if ((error = ccdinit(cs, cpp, vpp, l)) != 0) {
1254 1.11 thorpej for (j = 0; j < lookedup; ++j)
1255 1.18 thorpej (void)vn_close(vpp[j], FREAD|FWRITE,
1256 1.128 ad uc);
1257 1.129.10.1 snj kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1258 1.129.10.1 snj kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1259 1.129.10.1 snj disk_detach(&cs->sc_dkdev);
1260 1.129.10.1 snj bufq_free(cs->sc_bufq);
1261 1.57 thorpej goto out;
1262 1.11 thorpej }
1263 1.11 thorpej
1264 1.57 thorpej /* We can free the temporary variables now. */
1265 1.129.10.1 snj kmem_free(vpp, ccio->ccio_ndisks * sizeof(*vpp));
1266 1.129.10.1 snj kmem_free(cpp, ccio->ccio_ndisks * sizeof(*cpp));
1267 1.57 thorpej
1268 1.11 thorpej /*
1269 1.11 thorpej * The ccd has been successfully initialized, so
1270 1.23 thorpej * we can place it into the array. Don't try to
1271 1.23 thorpej * read the disklabel until the disk has been attached,
1272 1.23 thorpej * because space for the disklabel is allocated
1273 1.23 thorpej * in disk_attach();
1274 1.11 thorpej */
1275 1.11 thorpej ccio->ccio_unit = unit;
1276 1.11 thorpej ccio->ccio_size = cs->sc_size;
1277 1.23 thorpej
1278 1.23 thorpej /* Try and read the disklabel. */
1279 1.11 thorpej ccdgetdisklabel(dev);
1280 1.11 thorpej break;
1281 1.11 thorpej
1282 1.11 thorpej case CCDIOCCLR:
1283 1.11 thorpej /*
1284 1.11 thorpej * Don't unconfigure if any other partitions are open
1285 1.11 thorpej * or if both the character and block flavors of this
1286 1.11 thorpej * partition are open.
1287 1.11 thorpej */
1288 1.11 thorpej part = DISKPART(dev);
1289 1.11 thorpej pmask = (1 << part);
1290 1.11 thorpej if ((cs->sc_dkdev.dk_openmask & ~pmask) ||
1291 1.11 thorpej ((cs->sc_dkdev.dk_bopenmask & pmask) &&
1292 1.15 thorpej (cs->sc_dkdev.dk_copenmask & pmask))) {
1293 1.57 thorpej error = EBUSY;
1294 1.57 thorpej goto out;
1295 1.15 thorpej }
1296 1.88 thorpej
1297 1.129.10.1 snj /* Stop new I/O, wait for in-flight I/O to complete. */
1298 1.129.10.1 snj mutex_enter(cs->sc_iolock);
1299 1.129.10.1 snj cs->sc_flags &= ~(CCDF_INITED|CCDF_VLABEL);
1300 1.129.10.1 snj cs->sc_zap = true;
1301 1.129.10.1 snj while (disk_isbusy(&cs->sc_dkdev) ||
1302 1.129.10.1 snj bufq_peek(cs->sc_bufq) != NULL ||
1303 1.129.10.1 snj cs->sc_thread != NULL) {
1304 1.129.10.1 snj cv_broadcast(&cs->sc_push);
1305 1.129.10.1 snj (void)cv_timedwait(&cs->sc_stop, cs->sc_iolock, hz);
1306 1.129.10.1 snj }
1307 1.129.10.1 snj mutex_exit(cs->sc_iolock);
1308 1.11 thorpej
1309 1.11 thorpej /*
1310 1.11 thorpej * Free ccd_softc information and clear entry.
1311 1.11 thorpej */
1312 1.22 thorpej
1313 1.22 thorpej /* Close the components and free their pathnames. */
1314 1.11 thorpej for (i = 0; i < cs->sc_nccdisks; ++i) {
1315 1.11 thorpej /*
1316 1.11 thorpej * XXX: this close could potentially fail and
1317 1.11 thorpej * cause Bad Things. Maybe we need to force
1318 1.11 thorpej * the close to happen?
1319 1.11 thorpej */
1320 1.11 thorpej #ifdef DEBUG
1321 1.11 thorpej if (ccddebug & CCDB_VNODE)
1322 1.11 thorpej vprint("CCDIOCCLR: vnode info",
1323 1.11 thorpej cs->sc_cinfo[i].ci_vp);
1324 1.11 thorpej #endif
1325 1.11 thorpej (void)vn_close(cs->sc_cinfo[i].ci_vp, FREAD|FWRITE,
1326 1.128 ad uc);
1327 1.129.10.1 snj kmem_free(cs->sc_cinfo[i].ci_path,
1328 1.129.10.1 snj cs->sc_cinfo[i].ci_pathlen);
1329 1.38 thorpej }
1330 1.38 thorpej
1331 1.22 thorpej /* Free interleave index. */
1332 1.129.10.1 snj for (i = 0; cs->sc_itable[i].ii_ndisk; ++i) {
1333 1.129.10.1 snj kmem_free(cs->sc_itable[i].ii_index,
1334 1.129.10.1 snj cs->sc_itable[i].ii_indexsz);
1335 1.129.10.1 snj }
1336 1.22 thorpej
1337 1.22 thorpej /* Free component info and interleave table. */
1338 1.129.10.1 snj kmem_free(cs->sc_cinfo, cs->sc_nccdisks *
1339 1.129.10.1 snj sizeof(struct ccdcinfo));
1340 1.129.10.1 snj kmem_free(cs->sc_itable, (cs->sc_nccdisks + 1) *
1341 1.129.10.1 snj sizeof(struct ccdiinfo));
1342 1.15 thorpej
1343 1.129.10.2 msaitoh aprint_normal("%s: detached\n", cs->sc_xname);
1344 1.129.10.2 msaitoh
1345 1.129.10.2 msaitoh /* Detach the disk. */
1346 1.123 ad disk_detach(&cs->sc_dkdev);
1347 1.129.10.1 snj bufq_free(cs->sc_bufq);
1348 1.11 thorpej break;
1349 1.11 thorpej
1350 1.11 thorpej case DIOCGDINFO:
1351 1.23 thorpej *(struct disklabel *)data = *(cs->sc_dkdev.dk_label);
1352 1.11 thorpej break;
1353 1.129.10.1 snj
1354 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1355 1.70 fvdl case ODIOCGDINFO:
1356 1.70 fvdl newlabel = *(cs->sc_dkdev.dk_label);
1357 1.70 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
1358 1.71 fvdl return ENOTTY;
1359 1.70 fvdl memcpy(data, &newlabel, sizeof (struct olddisklabel));
1360 1.70 fvdl break;
1361 1.70 fvdl #endif
1362 1.11 thorpej
1363 1.11 thorpej case DIOCGPART:
1364 1.23 thorpej ((struct partinfo *)data)->disklab = cs->sc_dkdev.dk_label;
1365 1.11 thorpej ((struct partinfo *)data)->part =
1366 1.23 thorpej &cs->sc_dkdev.dk_label->d_partitions[DISKPART(dev)];
1367 1.11 thorpej break;
1368 1.11 thorpej
1369 1.100 thorpej case DIOCCACHESYNC:
1370 1.100 thorpej /*
1371 1.100 thorpej * XXX Do we really need to care about having a writable
1372 1.100 thorpej * file descriptor here?
1373 1.100 thorpej */
1374 1.100 thorpej if ((flag & FWRITE) == 0)
1375 1.100 thorpej return (EBADF);
1376 1.100 thorpej
1377 1.100 thorpej /*
1378 1.100 thorpej * We pass this call down to all components and report
1379 1.100 thorpej * the first error we encounter.
1380 1.100 thorpej */
1381 1.100 thorpej for (error = 0, i = 0; i < cs->sc_nccdisks; i++) {
1382 1.100 thorpej j = VOP_IOCTL(cs->sc_cinfo[i].ci_vp, cmd, data,
1383 1.124 pooka flag, uc);
1384 1.100 thorpej if (j != 0 && error == 0)
1385 1.100 thorpej error = j;
1386 1.100 thorpej }
1387 1.100 thorpej break;
1388 1.100 thorpej
1389 1.11 thorpej case DIOCWDINFO:
1390 1.11 thorpej case DIOCSDINFO:
1391 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1392 1.70 fvdl case ODIOCWDINFO:
1393 1.70 fvdl case ODIOCSDINFO:
1394 1.70 fvdl #endif
1395 1.70 fvdl {
1396 1.70 fvdl struct disklabel *lp;
1397 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1398 1.70 fvdl if (cmd == ODIOCSDINFO || cmd == ODIOCWDINFO) {
1399 1.70 fvdl memset(&newlabel, 0, sizeof newlabel);
1400 1.70 fvdl memcpy(&newlabel, data, sizeof (struct olddisklabel));
1401 1.70 fvdl lp = &newlabel;
1402 1.70 fvdl } else
1403 1.70 fvdl #endif
1404 1.70 fvdl lp = (struct disklabel *)data;
1405 1.70 fvdl
1406 1.11 thorpej cs->sc_flags |= CCDF_LABELLING;
1407 1.11 thorpej
1408 1.23 thorpej error = setdisklabel(cs->sc_dkdev.dk_label,
1409 1.70 fvdl lp, 0, cs->sc_dkdev.dk_cpulabel);
1410 1.11 thorpej if (error == 0) {
1411 1.70 fvdl if (cmd == DIOCWDINFO
1412 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1413 1.70 fvdl || cmd == ODIOCWDINFO
1414 1.70 fvdl #endif
1415 1.70 fvdl )
1416 1.11 thorpej error = writedisklabel(CCDLABELDEV(dev),
1417 1.23 thorpej ccdstrategy, cs->sc_dkdev.dk_label,
1418 1.23 thorpej cs->sc_dkdev.dk_cpulabel);
1419 1.11 thorpej }
1420 1.11 thorpej
1421 1.11 thorpej cs->sc_flags &= ~CCDF_LABELLING;
1422 1.11 thorpej break;
1423 1.70 fvdl }
1424 1.11 thorpej
1425 1.87 thorpej case DIOCKLABEL:
1426 1.87 thorpej if (*(int *)data != 0)
1427 1.87 thorpej cs->sc_flags |= CCDF_KLABEL;
1428 1.87 thorpej else
1429 1.87 thorpej cs->sc_flags &= ~CCDF_KLABEL;
1430 1.87 thorpej break;
1431 1.87 thorpej
1432 1.11 thorpej case DIOCWLABEL:
1433 1.11 thorpej if (*(int *)data != 0)
1434 1.11 thorpej cs->sc_flags |= CCDF_WLABEL;
1435 1.11 thorpej else
1436 1.11 thorpej cs->sc_flags &= ~CCDF_WLABEL;
1437 1.11 thorpej break;
1438 1.11 thorpej
1439 1.44 thorpej case DIOCGDEFLABEL:
1440 1.44 thorpej ccdgetdefaultlabel(cs, (struct disklabel *)data);
1441 1.44 thorpej break;
1442 1.70 fvdl
1443 1.70 fvdl #ifdef __HAVE_OLD_DISKLABEL
1444 1.70 fvdl case ODIOCGDEFLABEL:
1445 1.70 fvdl ccdgetdefaultlabel(cs, &newlabel);
1446 1.70 fvdl if (newlabel.d_npartitions > OLDMAXPARTITIONS)
1447 1.71 fvdl return ENOTTY;
1448 1.70 fvdl memcpy(data, &newlabel, sizeof (struct olddisklabel));
1449 1.70 fvdl break;
1450 1.70 fvdl #endif
1451 1.44 thorpej
1452 1.11 thorpej default:
1453 1.57 thorpej error = ENOTTY;
1454 1.11 thorpej }
1455 1.11 thorpej
1456 1.57 thorpej out:
1457 1.129.10.1 snj mutex_exit(&cs->sc_dvlock);
1458 1.57 thorpej return (error);
1459 1.1 hpeyerl }
1460 1.1 hpeyerl
1461 1.97 thorpej static int
1462 1.97 thorpej ccdsize(dev_t dev)
1463 1.1 hpeyerl {
1464 1.11 thorpej struct ccd_softc *cs;
1465 1.40 thorpej struct disklabel *lp;
1466 1.40 thorpej int part, unit, omask, size;
1467 1.40 thorpej
1468 1.40 thorpej unit = ccdunit(dev);
1469 1.40 thorpej if (unit >= numccd)
1470 1.40 thorpej return (-1);
1471 1.40 thorpej cs = &ccd_softc[unit];
1472 1.11 thorpej
1473 1.40 thorpej if ((cs->sc_flags & CCDF_INITED) == 0)
1474 1.11 thorpej return (-1);
1475 1.11 thorpej
1476 1.11 thorpej part = DISKPART(dev);
1477 1.40 thorpej omask = cs->sc_dkdev.dk_openmask & (1 << part);
1478 1.40 thorpej lp = cs->sc_dkdev.dk_label;
1479 1.11 thorpej
1480 1.107 christos if (omask == 0 && ccdopen(dev, 0, S_IFBLK, curlwp))
1481 1.11 thorpej return (-1);
1482 1.11 thorpej
1483 1.40 thorpej if (lp->d_partitions[part].p_fstype != FS_SWAP)
1484 1.11 thorpej size = -1;
1485 1.11 thorpej else
1486 1.40 thorpej size = lp->d_partitions[part].p_size *
1487 1.40 thorpej (lp->d_secsize / DEV_BSIZE);
1488 1.11 thorpej
1489 1.107 christos if (omask == 0 && ccdclose(dev, 0, S_IFBLK, curlwp))
1490 1.11 thorpej return (-1);
1491 1.1 hpeyerl
1492 1.11 thorpej return (size);
1493 1.1 hpeyerl }
1494 1.1 hpeyerl
1495 1.11 thorpej static void
1496 1.97 thorpej ccdgetdefaultlabel(struct ccd_softc *cs, struct disklabel *lp)
1497 1.11 thorpej {
1498 1.11 thorpej struct ccdgeom *ccg = &cs->sc_geom;
1499 1.11 thorpej
1500 1.72 thorpej memset(lp, 0, sizeof(*lp));
1501 1.11 thorpej
1502 1.11 thorpej lp->d_secperunit = cs->sc_size;
1503 1.11 thorpej lp->d_secsize = ccg->ccg_secsize;
1504 1.11 thorpej lp->d_nsectors = ccg->ccg_nsectors;
1505 1.11 thorpej lp->d_ntracks = ccg->ccg_ntracks;
1506 1.11 thorpej lp->d_ncylinders = ccg->ccg_ncylinders;
1507 1.19 thorpej lp->d_secpercyl = lp->d_ntracks * lp->d_nsectors;
1508 1.11 thorpej
1509 1.11 thorpej strncpy(lp->d_typename, "ccd", sizeof(lp->d_typename));
1510 1.11 thorpej lp->d_type = DTYPE_CCD;
1511 1.11 thorpej strncpy(lp->d_packname, "fictitious", sizeof(lp->d_packname));
1512 1.11 thorpej lp->d_rpm = 3600;
1513 1.11 thorpej lp->d_interleave = 1;
1514 1.11 thorpej lp->d_flags = 0;
1515 1.11 thorpej
1516 1.11 thorpej lp->d_partitions[RAW_PART].p_offset = 0;
1517 1.11 thorpej lp->d_partitions[RAW_PART].p_size = cs->sc_size;
1518 1.11 thorpej lp->d_partitions[RAW_PART].p_fstype = FS_UNUSED;
1519 1.11 thorpej lp->d_npartitions = RAW_PART + 1;
1520 1.11 thorpej
1521 1.11 thorpej lp->d_magic = DISKMAGIC;
1522 1.11 thorpej lp->d_magic2 = DISKMAGIC;
1523 1.23 thorpej lp->d_checksum = dkcksum(cs->sc_dkdev.dk_label);
1524 1.44 thorpej }
1525 1.44 thorpej
1526 1.44 thorpej /*
1527 1.44 thorpej * Read the disklabel from the ccd. If one is not present, fake one
1528 1.44 thorpej * up.
1529 1.44 thorpej */
1530 1.44 thorpej static void
1531 1.97 thorpej ccdgetdisklabel(dev_t dev)
1532 1.44 thorpej {
1533 1.44 thorpej int unit = ccdunit(dev);
1534 1.44 thorpej struct ccd_softc *cs = &ccd_softc[unit];
1535 1.85 dsl const char *errstring;
1536 1.44 thorpej struct disklabel *lp = cs->sc_dkdev.dk_label;
1537 1.44 thorpej struct cpu_disklabel *clp = cs->sc_dkdev.dk_cpulabel;
1538 1.44 thorpej
1539 1.129.10.1 snj KASSERT(mutex_owned(&cs->sc_dvlock));
1540 1.129.10.1 snj
1541 1.72 thorpej memset(clp, 0, sizeof(*clp));
1542 1.44 thorpej
1543 1.44 thorpej ccdgetdefaultlabel(cs, lp);
1544 1.11 thorpej
1545 1.11 thorpej /*
1546 1.11 thorpej * Call the generic disklabel extraction routine.
1547 1.11 thorpej */
1548 1.129.10.1 snj cs->sc_flags |= CCDF_RLABEL;
1549 1.92 lukem if ((cs->sc_flags & CCDF_NOLABEL) != 0)
1550 1.92 lukem errstring = "CCDF_NOLABEL set; ignoring on-disk label";
1551 1.92 lukem else
1552 1.92 lukem errstring = readdisklabel(CCDLABELDEV(dev), ccdstrategy,
1553 1.92 lukem cs->sc_dkdev.dk_label, cs->sc_dkdev.dk_cpulabel);
1554 1.29 christos if (errstring)
1555 1.11 thorpej ccdmakedisklabel(cs);
1556 1.47 enami else {
1557 1.47 enami int i;
1558 1.47 enami struct partition *pp;
1559 1.47 enami
1560 1.47 enami /*
1561 1.47 enami * Sanity check whether the found disklabel is valid.
1562 1.47 enami *
1563 1.47 enami * This is necessary since total size of ccd may vary
1564 1.47 enami * when an interleave is changed even though exactly
1565 1.47 enami * same componets are used, and old disklabel may used
1566 1.47 enami * if that is found.
1567 1.47 enami */
1568 1.47 enami if (lp->d_secperunit != cs->sc_size)
1569 1.47 enami printf("WARNING: %s: "
1570 1.129.10.2 msaitoh "total sector size in disklabel (%ju) != "
1571 1.129.10.2 msaitoh "the size of ccd (%ju)\n", cs->sc_xname,
1572 1.129.10.2 msaitoh (uintmax_t)lp->d_secperunit,
1573 1.129.10.2 msaitoh (uintmax_t)cs->sc_size);
1574 1.47 enami for (i = 0; i < lp->d_npartitions; i++) {
1575 1.47 enami pp = &lp->d_partitions[i];
1576 1.47 enami if (pp->p_offset + pp->p_size > cs->sc_size)
1577 1.48 enami printf("WARNING: %s: end of partition `%c' "
1578 1.129.10.2 msaitoh "exceeds the size of ccd (%ju)\n",
1579 1.129.10.2 msaitoh cs->sc_xname, 'a' + i, (uintmax_t)cs->sc_size);
1580 1.47 enami }
1581 1.47 enami }
1582 1.11 thorpej
1583 1.11 thorpej #ifdef DEBUG
1584 1.11 thorpej /* It's actually extremely common to have unlabeled ccds. */
1585 1.11 thorpej if (ccddebug & CCDB_LABEL)
1586 1.11 thorpej if (errstring != NULL)
1587 1.35 christos printf("%s: %s\n", cs->sc_xname, errstring);
1588 1.11 thorpej #endif
1589 1.87 thorpej
1590 1.87 thorpej /* In-core label now valid. */
1591 1.129.10.1 snj cs->sc_flags = (cs->sc_flags | CCDF_VLABEL) & ~CCDF_RLABEL;
1592 1.11 thorpej }
1593 1.11 thorpej
1594 1.11 thorpej /*
1595 1.11 thorpej * Take care of things one might want to take care of in the event
1596 1.11 thorpej * that a disklabel isn't present.
1597 1.11 thorpej */
1598 1.11 thorpej static void
1599 1.97 thorpej ccdmakedisklabel(struct ccd_softc *cs)
1600 1.11 thorpej {
1601 1.23 thorpej struct disklabel *lp = cs->sc_dkdev.dk_label;
1602 1.11 thorpej
1603 1.11 thorpej /*
1604 1.11 thorpej * For historical reasons, if there's no disklabel present
1605 1.11 thorpej * the raw partition must be marked FS_BSDFFS.
1606 1.11 thorpej */
1607 1.11 thorpej lp->d_partitions[RAW_PART].p_fstype = FS_BSDFFS;
1608 1.11 thorpej
1609 1.11 thorpej strncpy(lp->d_packname, "default label", sizeof(lp->d_packname));
1610 1.44 thorpej
1611 1.44 thorpej lp->d_checksum = dkcksum(lp);
1612 1.11 thorpej }
1613 1.11 thorpej
1614 1.11 thorpej #ifdef DEBUG
1615 1.11 thorpej static void
1616 1.97 thorpej printiinfo(struct ccdiinfo *ii)
1617 1.11 thorpej {
1618 1.68 augustss int ix, i;
1619 1.11 thorpej
1620 1.11 thorpej for (ix = 0; ii->ii_ndisk; ix++, ii++) {
1621 1.81 kleink printf(" itab[%d]: #dk %d sblk %" PRId64 " soff %" PRId64,
1622 1.34 christos ix, ii->ii_ndisk, ii->ii_startblk, ii->ii_startoff);
1623 1.11 thorpej for (i = 0; i < ii->ii_ndisk; i++)
1624 1.35 christos printf(" %d", ii->ii_index[i]);
1625 1.35 christos printf("\n");
1626 1.11 thorpej }
1627 1.1 hpeyerl }
1628 1.1 hpeyerl #endif
1629