Home | History | Annotate | Line # | Download | only in raidframe
rf_netbsdkintf.c revision 1.10
      1  1.10     oster /*	$NetBSD: rf_netbsdkintf.c,v 1.10 1999/02/11 01:23:32 oster Exp $	*/
      2   1.1     oster /*-
      3   1.1     oster  * Copyright (c) 1996, 1997, 1998 The NetBSD Foundation, Inc.
      4   1.1     oster  * All rights reserved.
      5   1.1     oster  *
      6   1.1     oster  * This code is derived from software contributed to The NetBSD Foundation
      7   1.1     oster  * by Greg Oster; Jason R. Thorpe.
      8   1.1     oster  *
      9   1.1     oster  * Redistribution and use in source and binary forms, with or without
     10   1.1     oster  * modification, are permitted provided that the following conditions
     11   1.1     oster  * are met:
     12   1.1     oster  * 1. Redistributions of source code must retain the above copyright
     13   1.1     oster  *    notice, this list of conditions and the following disclaimer.
     14   1.1     oster  * 2. Redistributions in binary form must reproduce the above copyright
     15   1.1     oster  *    notice, this list of conditions and the following disclaimer in the
     16   1.1     oster  *    documentation and/or other materials provided with the distribution.
     17   1.1     oster  * 3. All advertising materials mentioning features or use of this software
     18   1.1     oster  *    must display the following acknowledgement:
     19   1.1     oster  *        This product includes software developed by the NetBSD
     20   1.1     oster  *        Foundation, Inc. and its contributors.
     21   1.1     oster  * 4. Neither the name of The NetBSD Foundation nor the names of its
     22   1.1     oster  *    contributors may be used to endorse or promote products derived
     23   1.1     oster  *    from this software without specific prior written permission.
     24   1.1     oster  *
     25   1.1     oster  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     26   1.1     oster  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     27   1.1     oster  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     28   1.1     oster  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     29   1.1     oster  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     30   1.1     oster  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     31   1.1     oster  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     32   1.1     oster  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     33   1.1     oster  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     34   1.1     oster  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     35   1.1     oster  * POSSIBILITY OF SUCH DAMAGE.
     36   1.1     oster  */
     37   1.1     oster 
     38   1.1     oster /*
     39   1.1     oster  * Copyright (c) 1988 University of Utah.
     40   1.1     oster  * Copyright (c) 1990, 1993
     41   1.1     oster  *      The Regents of the University of California.  All rights reserved.
     42   1.1     oster  *
     43   1.1     oster  * This code is derived from software contributed to Berkeley by
     44   1.1     oster  * the Systems Programming Group of the University of Utah Computer
     45   1.1     oster  * Science Department.
     46   1.1     oster  *
     47   1.1     oster  * Redistribution and use in source and binary forms, with or without
     48   1.1     oster  * modification, are permitted provided that the following conditions
     49   1.1     oster  * are met:
     50   1.1     oster  * 1. Redistributions of source code must retain the above copyright
     51   1.1     oster  *    notice, this list of conditions and the following disclaimer.
     52   1.1     oster  * 2. Redistributions in binary form must reproduce the above copyright
     53   1.1     oster  *    notice, this list of conditions and the following disclaimer in the
     54   1.1     oster  *    documentation and/or other materials provided with the distribution.
     55   1.1     oster  * 3. All advertising materials mentioning features or use of this software
     56   1.1     oster  *    must display the following acknowledgement:
     57   1.1     oster  *      This product includes software developed by the University of
     58   1.1     oster  *      California, Berkeley and its contributors.
     59   1.1     oster  * 4. Neither the name of the University nor the names of its contributors
     60   1.1     oster  *    may be used to endorse or promote products derived from this software
     61   1.1     oster  *    without specific prior written permission.
     62   1.1     oster  *
     63   1.1     oster  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     64   1.1     oster  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     65   1.1     oster  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     66   1.1     oster  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     67   1.1     oster  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     68   1.1     oster  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     69   1.1     oster  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     70   1.1     oster  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     71   1.1     oster  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     72   1.1     oster  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     73   1.1     oster  * SUCH DAMAGE.
     74   1.1     oster  *
     75   1.1     oster  * from: Utah $Hdr: cd.c 1.6 90/11/28$
     76   1.1     oster  *
     77   1.1     oster  *      @(#)cd.c        8.2 (Berkeley) 11/16/93
     78   1.1     oster  */
     79   1.1     oster 
     80   1.1     oster 
     81   1.1     oster 
     82   1.1     oster 
     83   1.1     oster /*
     84   1.1     oster  * Copyright (c) 1995 Carnegie-Mellon University.
     85   1.1     oster  * All rights reserved.
     86   1.1     oster  *
     87   1.1     oster  * Authors: Mark Holland, Jim Zelenka
     88   1.1     oster  *
     89   1.1     oster  * Permission to use, copy, modify and distribute this software and
     90   1.1     oster  * its documentation is hereby granted, provided that both the copyright
     91   1.1     oster  * notice and this permission notice appear in all copies of the
     92   1.1     oster  * software, derivative works or modified versions, and any portions
     93   1.1     oster  * thereof, and that both notices appear in supporting documentation.
     94   1.1     oster  *
     95   1.1     oster  * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
     96   1.1     oster  * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
     97   1.1     oster  * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
     98   1.1     oster  *
     99   1.1     oster  * Carnegie Mellon requests users of this software to return to
    100   1.1     oster  *
    101   1.1     oster  *  Software Distribution Coordinator  or  Software.Distribution (at) CS.CMU.EDU
    102   1.1     oster  *  School of Computer Science
    103   1.1     oster  *  Carnegie Mellon University
    104   1.1     oster  *  Pittsburgh PA 15213-3890
    105   1.1     oster  *
    106   1.1     oster  * any improvements or extensions that they make and grant Carnegie the
    107   1.1     oster  * rights to redistribute these changes.
    108   1.1     oster  */
    109   1.1     oster 
    110   1.1     oster /***********************************************************
    111   1.1     oster  *
    112   1.1     oster  * rf_kintf.c -- the kernel interface routines for RAIDframe
    113   1.1     oster  *
    114   1.1     oster  ***********************************************************/
    115   1.1     oster 
    116   1.1     oster #include <sys/errno.h>
    117   1.1     oster #include <sys/param.h>
    118   1.1     oster #include <sys/pool.h>
    119   1.1     oster #include <sys/queue.h>
    120   1.1     oster #include <sys/disk.h>
    121   1.1     oster #include <sys/device.h>
    122   1.1     oster #include <sys/stat.h>
    123   1.1     oster #include <sys/ioctl.h>
    124   1.1     oster #include <sys/fcntl.h>
    125   1.1     oster #include <sys/systm.h>
    126   1.1     oster #include <sys/namei.h>
    127   1.1     oster #include <sys/vnode.h>
    128   1.1     oster #include <sys/param.h>
    129   1.1     oster #include <sys/types.h>
    130   1.1     oster #include <machine/types.h>
    131   1.1     oster #include <sys/disklabel.h>
    132   1.1     oster #include <sys/conf.h>
    133   1.1     oster #include <sys/lock.h>
    134   1.1     oster #include <sys/buf.h>
    135   1.1     oster #include <sys/user.h>
    136   1.8     oster 
    137   1.8     oster #include "raid.h"
    138   1.1     oster #include "rf_raid.h"
    139   1.1     oster #include "rf_raidframe.h"
    140   1.1     oster #include "rf_dag.h"
    141   1.1     oster #include "rf_dagflags.h"
    142   1.1     oster #include "rf_diskqueue.h"
    143   1.1     oster #include "rf_acctrace.h"
    144   1.1     oster #include "rf_etimer.h"
    145   1.1     oster #include "rf_general.h"
    146   1.1     oster #include "rf_debugMem.h"
    147   1.1     oster #include "rf_kintf.h"
    148   1.1     oster #include "rf_options.h"
    149   1.1     oster #include "rf_driver.h"
    150   1.1     oster #include "rf_parityscan.h"
    151   1.1     oster #include "rf_debugprint.h"
    152   1.1     oster #include "rf_threadstuff.h"
    153   1.1     oster 
    154   1.9     oster int     rf_kdebug_level = 0;
    155   1.1     oster 
    156   1.1     oster #define RFK_BOOT_NONE 0
    157   1.1     oster #define RFK_BOOT_GOOD 1
    158   1.1     oster #define RFK_BOOT_BAD  2
    159   1.1     oster static int rf_kbooted = RFK_BOOT_NONE;
    160   1.1     oster 
    161   1.1     oster #ifdef DEBUG
    162   1.1     oster #define db0_printf(a) printf a
    163   1.1     oster #define db_printf(a) if (rf_kdebug_level > 0) printf a
    164   1.1     oster #define db1_printf(a) if (rf_kdebug_level > 0) printf a
    165   1.1     oster #define db2_printf(a) if (rf_kdebug_level > 1) printf a
    166   1.1     oster #define db3_printf(a) if (rf_kdebug_level > 2) printf a
    167   1.1     oster #define db4_printf(a) if (rf_kdebug_level > 3) printf a
    168   1.1     oster #define db5_printf(a) if (rf_kdebug_level > 4) printf a
    169   1.9     oster #else				/* DEBUG */
    170   1.1     oster #define db0_printf(a) printf a
    171   1.1     oster #define db1_printf(a) { }
    172   1.1     oster #define db2_printf(a) { }
    173   1.1     oster #define db3_printf(a) { }
    174   1.1     oster #define db4_printf(a) { }
    175   1.1     oster #define db5_printf(a) { }
    176   1.9     oster #endif				/* DEBUG */
    177   1.1     oster 
    178   1.9     oster static RF_Raid_t **raidPtrs;	/* global raid device descriptors */
    179   1.1     oster 
    180   1.1     oster static int rf_pending_testaccs;
    181   1.1     oster 
    182   1.1     oster RF_DECLARE_STATIC_MUTEX(rf_sparet_wait_mutex)
    183   1.1     oster RF_DECLARE_STATIC_MUTEX(rf_async_done_q_mutex)
    184  1.10     oster static RF_SparetWait_t *rf_sparet_wait_queue;	/* requests to install a
    185  1.10     oster 						 * spare table */
    186  1.10     oster static RF_SparetWait_t *rf_sparet_resp_queue;	/* responses from
    187  1.10     oster 						 * installation process */
    188  1.10     oster static struct rf_test_acc *rf_async_done_qh, *rf_async_done_qt;
    189  1.10     oster 
    190  1.10     oster static struct rf_recon_req *recon_queue = NULL;	/* used to communicate
    191  1.10     oster 						 * reconstruction
    192  1.10     oster 						 * requests */
    193   1.1     oster 
    194   1.1     oster 
    195   1.9     oster decl_simple_lock_data(, recon_queue_mutex)
    196   1.1     oster #define LOCK_RECON_Q_MUTEX() simple_lock(&recon_queue_mutex)
    197   1.1     oster #define UNLOCK_RECON_Q_MUTEX() simple_unlock(&recon_queue_mutex)
    198   1.1     oster 
    199   1.1     oster /* prototypes */
    200  1.10     oster static void KernelWakeupFunc(struct buf * bp);
    201  1.10     oster static void InitBP(struct buf * bp, struct vnode *, unsigned rw_flag,
    202  1.10     oster 		   dev_t dev, RF_SectorNum_t startSect,
    203  1.10     oster 		   RF_SectorCount_t numSect, caddr_t buf,
    204  1.10     oster 		   void (*cbFunc) (struct buf *), void *cbArg,
    205  1.10     oster 		   int logBytesPerSector, struct proc * b_proc);
    206   1.1     oster 
    207   1.1     oster #define Dprintf0(s)       if (rf_queueDebug) rf_debug_printf(s,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL)
    208   1.1     oster #define Dprintf1(s,a)     if (rf_queueDebug) rf_debug_printf(s,a,NULL,NULL,NULL,NULL,NULL,NULL,NULL)
    209   1.1     oster #define Dprintf2(s,a,b)   if (rf_queueDebug) rf_debug_printf(s,a,b,NULL,NULL,NULL,NULL,NULL,NULL)
    210   1.1     oster #define Dprintf3(s,a,b,c) if (rf_queueDebug) rf_debug_printf(s,a,b,c,NULL,NULL,NULL,NULL,NULL)
    211   1.1     oster 
    212   1.1     oster 
    213   1.1     oster /* this is so that we can compile under 2.0 as well as 3.2 */
    214   1.1     oster #ifndef proc_to_task
    215   1.1     oster #define proc_to_task(x) ((x)->task)
    216   1.9     oster #endif				/* !proc_to_task */
    217   1.1     oster 
    218  1.10     oster void raidattach __P((int));
    219  1.10     oster int raidsize __P((dev_t));
    220   1.1     oster 
    221  1.10     oster void    rf_DiskIOComplete(RF_DiskQueue_t *, RF_DiskQueueData_t *, int);
    222  1.10     oster void    rf_CopybackReconstructedData(RF_Raid_t * raidPtr);
    223  1.10     oster static int raidinit __P((dev_t, RF_Raid_t *, int));
    224  1.10     oster 
    225  1.10     oster int raidopen __P((dev_t, int, int, struct proc *));
    226  1.10     oster int raidclose __P((dev_t, int, int, struct proc *));
    227  1.10     oster int raidioctl __P((dev_t, u_long, caddr_t, int, struct proc *));
    228  1.10     oster int raidwrite __P((dev_t, struct uio *, int));
    229  1.10     oster int raidread __P((dev_t, struct uio *, int));
    230  1.10     oster void raidstrategy __P((struct buf *));
    231  1.10     oster int raiddump __P((dev_t, daddr_t, caddr_t, size_t));
    232   1.1     oster 
    233   1.1     oster /*
    234   1.1     oster  * Pilfered from ccd.c
    235   1.1     oster  */
    236   1.1     oster 
    237  1.10     oster struct raidbuf {
    238  1.10     oster 	struct buf rf_buf;	/* new I/O buf.  MUST BE FIRST!!! */
    239  1.10     oster 	struct buf *rf_obp;	/* ptr. to original I/O buf */
    240  1.10     oster 	int     rf_flags;	/* misc. flags */
    241  1.10     oster 	RF_DiskQueueData_t *req;	/* the request that this was
    242  1.10     oster 					 * part of.. */
    243  1.10     oster };
    244   1.1     oster 
    245   1.1     oster 
    246   1.1     oster #define RAIDGETBUF(rs) pool_get(&(rs)->sc_cbufpool, PR_NOWAIT)
    247   1.1     oster #define	RAIDPUTBUF(rs, cbp) pool_put(&(rs)->sc_cbufpool, cbp)
    248   1.1     oster 
    249   1.9     oster /* XXX Not sure if the following should be replacing the raidPtrs above,
    250  1.10     oster    or if it should be used in conjunction with that... */
    251   1.1     oster 
    252  1.10     oster struct raid_softc {
    253  1.10     oster 	int     sc_unit;/* logical unit number */
    254  1.10     oster 	int     sc_flags;	/* flags */
    255  1.10     oster 	int     sc_cflags;	/* configuration flags */
    256  1.10     oster 	size_t  sc_size;/* size of the raid device */
    257  1.10     oster 	dev_t   sc_dev;	/* our device.. */
    258  1.10     oster 	char    sc_xname[20];	/* XXX external name */
    259  1.10     oster 	struct disk sc_dkdev;	/* generic disk device info */
    260  1.10     oster 	struct pool sc_cbufpool;	/* component buffer pool */
    261  1.10     oster };
    262   1.1     oster /* sc_flags */
    263   1.1     oster #define RAIDF_INITED	0x01	/* unit has been initialized */
    264   1.1     oster #define RAIDF_WLABEL	0x02	/* label area is writable */
    265   1.1     oster #define RAIDF_LABELLING	0x04	/* unit is currently being labelled */
    266   1.1     oster #define RAIDF_WANTED	0x40	/* someone is waiting to obtain a lock */
    267   1.1     oster #define RAIDF_LOCKED	0x80	/* unit is locked */
    268   1.1     oster 
    269   1.1     oster #define	raidunit(x)	DISKUNIT(x)
    270  1.10     oster static int numraid = 0;
    271   1.1     oster 
    272   1.1     oster #define RAIDLABELDEV(dev)	\
    273   1.1     oster 	(MAKEDISKDEV(major((dev)), raidunit((dev)), RAW_PART))
    274   1.1     oster 
    275   1.1     oster /* declared here, and made public, for the benefit of KVM stuff.. */
    276  1.10     oster struct raid_softc *raid_softc;
    277   1.9     oster 
    278  1.10     oster static void raidgetdefaultlabel __P((RF_Raid_t *, struct raid_softc *,
    279  1.10     oster 				     struct disklabel *));
    280  1.10     oster static void raidgetdisklabel __P((dev_t));
    281  1.10     oster static void raidmakedisklabel __P((struct raid_softc *));
    282   1.1     oster 
    283  1.10     oster static int raidlock __P((struct raid_softc *));
    284  1.10     oster static void raidunlock __P((struct raid_softc *));
    285  1.10     oster int raidlookup __P((char *, struct proc * p, struct vnode **));
    286   1.1     oster 
    287   1.1     oster 
    288  1.10     oster void
    289  1.10     oster raidattach(num)
    290   1.9     oster 	int     num;
    291   1.1     oster {
    292   1.9     oster 	int     raidID;
    293   1.1     oster 
    294   1.1     oster #ifdef DEBUG
    295   1.9     oster 	printf("raidattach: Asked for %d units\n", num);
    296   1.1     oster #endif
    297   1.1     oster 
    298   1.1     oster 	if (num <= 0) {
    299   1.1     oster #ifdef DIAGNOSTIC
    300   1.1     oster 		panic("raidattach: count <= 0");
    301   1.1     oster #endif
    302   1.1     oster 		return;
    303   1.1     oster 	}
    304   1.9     oster 	/* This is where all the initialization stuff gets done. */
    305   1.1     oster 
    306   1.1     oster 	/* Make some space for requested number of units... */
    307   1.1     oster 
    308   1.1     oster 	RF_Calloc(raidPtrs, num, sizeof(RF_Raid_t *), (RF_Raid_t **));
    309   1.1     oster 	if (raidPtrs == NULL) {
    310   1.1     oster 		panic("raidPtrs is NULL!!\n");
    311   1.1     oster 	}
    312   1.1     oster 	rf_kbooted = rf_boot();
    313   1.1     oster 	if (rf_kbooted) {
    314   1.1     oster 		panic("Serious error booting RAID!!\n");
    315   1.1     oster 	}
    316   1.9     oster 	rf_kbooted = RFK_BOOT_GOOD;
    317   1.9     oster 
    318   1.9     oster 	/* put together some datastructures like the CCD device does.. This
    319   1.9     oster 	 * lets us lock the device and what-not when it gets opened. */
    320   1.1     oster 
    321   1.1     oster 	raid_softc = (struct raid_softc *)
    322   1.9     oster 	    malloc(num * sizeof(struct raid_softc),
    323   1.9     oster 	    M_RAIDFRAME, M_NOWAIT);
    324   1.1     oster 	if (raid_softc == NULL) {
    325   1.1     oster 		printf("WARNING: no memory for RAIDframe driver\n");
    326   1.1     oster 		return;
    327   1.1     oster 	}
    328   1.1     oster 	numraid = num;
    329   1.1     oster 	bzero(raid_softc, num * sizeof(struct raid_softc));
    330   1.1     oster 
    331   1.9     oster 	for (raidID = 0; raidID < num; raidID++) {
    332   1.9     oster 		RF_Calloc(raidPtrs[raidID], 1, sizeof(RF_Raid_t),
    333   1.9     oster 		    (RF_Raid_t *));
    334   1.9     oster 		if (raidPtrs[raidID] == NULL) {
    335   1.9     oster 			printf("raidPtrs[%d] is NULL\n", raidID);
    336   1.1     oster 		}
    337   1.1     oster 	}
    338   1.1     oster }
    339   1.1     oster 
    340   1.1     oster 
    341   1.1     oster int
    342   1.1     oster raidsize(dev)
    343   1.9     oster 	dev_t   dev;
    344   1.1     oster {
    345   1.1     oster 	struct raid_softc *rs;
    346   1.1     oster 	struct disklabel *lp;
    347   1.9     oster 	int     part, unit, omask, size;
    348   1.1     oster 
    349   1.1     oster 	unit = raidunit(dev);
    350   1.1     oster 	if (unit >= numraid)
    351   1.1     oster 		return (-1);
    352   1.1     oster 	rs = &raid_softc[unit];
    353   1.1     oster 
    354   1.1     oster 	if ((rs->sc_flags & RAIDF_INITED) == 0)
    355   1.1     oster 		return (-1);
    356   1.1     oster 
    357   1.1     oster 	part = DISKPART(dev);
    358   1.1     oster 	omask = rs->sc_dkdev.dk_openmask & (1 << part);
    359   1.1     oster 	lp = rs->sc_dkdev.dk_label;
    360   1.1     oster 
    361   1.1     oster 	if (omask == 0 && raidopen(dev, 0, S_IFBLK, curproc))
    362   1.1     oster 		return (-1);
    363   1.1     oster 
    364   1.1     oster 	if (lp->d_partitions[part].p_fstype != FS_SWAP)
    365   1.1     oster 		size = -1;
    366   1.1     oster 	else
    367   1.1     oster 		size = lp->d_partitions[part].p_size *
    368   1.1     oster 		    (lp->d_secsize / DEV_BSIZE);
    369   1.1     oster 
    370   1.1     oster 	if (omask == 0 && raidclose(dev, 0, S_IFBLK, curproc))
    371   1.1     oster 		return (-1);
    372   1.1     oster 
    373   1.1     oster 	return (size);
    374   1.1     oster 
    375   1.1     oster }
    376   1.1     oster 
    377   1.1     oster int
    378   1.1     oster raiddump(dev, blkno, va, size)
    379   1.9     oster 	dev_t   dev;
    380   1.1     oster 	daddr_t blkno;
    381   1.1     oster 	caddr_t va;
    382   1.9     oster 	size_t  size;
    383   1.1     oster {
    384   1.1     oster 	/* Not implemented. */
    385   1.1     oster 	return ENXIO;
    386   1.1     oster }
    387   1.1     oster /* ARGSUSED */
    388   1.1     oster int
    389   1.1     oster raidopen(dev, flags, fmt, p)
    390   1.9     oster 	dev_t   dev;
    391   1.9     oster 	int     flags, fmt;
    392   1.1     oster 	struct proc *p;
    393   1.1     oster {
    394   1.9     oster 	int     unit = raidunit(dev);
    395   1.1     oster 	struct raid_softc *rs;
    396   1.1     oster 	struct disklabel *lp;
    397   1.9     oster 	int     part, pmask;
    398   1.1     oster 	unsigned int raidID;
    399   1.9     oster 	int     rc;
    400   1.9     oster 	int     error = 0;
    401   1.9     oster 
    402   1.9     oster 	/* This whole next chunk of code is somewhat suspect... Not sure it's
    403   1.9     oster 	 * needed here at all... XXX */
    404   1.1     oster 
    405   1.9     oster 	if (rf_kbooted == RFK_BOOT_NONE) {
    406   1.1     oster 		printf("Doing restart on raidopen.\n");
    407   1.1     oster 		rf_kbooted = RFK_BOOT_GOOD;
    408   1.1     oster 		rc = rf_boot();
    409   1.1     oster 		if (rc) {
    410   1.1     oster 			rf_kbooted = RFK_BOOT_BAD;
    411   1.1     oster 			printf("Someone is unhappy...\n");
    412   1.9     oster 			return (rc);
    413   1.1     oster 		}
    414   1.1     oster 	}
    415   1.1     oster 	if (unit >= numraid)
    416   1.1     oster 		return (ENXIO);
    417   1.1     oster 	rs = &raid_softc[unit];
    418   1.1     oster 
    419   1.1     oster 	if ((error = raidlock(rs)) != 0)
    420   1.9     oster 		return (error);
    421   1.1     oster 	lp = rs->sc_dkdev.dk_label;
    422   1.1     oster 
    423   1.1     oster 	raidID = raidunit(dev);
    424   1.1     oster 
    425   1.1     oster 	part = DISKPART(dev);
    426   1.1     oster 	pmask = (1 << part);
    427   1.1     oster 
    428   1.1     oster 	db1_printf(("Opening raid device number: %d partition: %d\n",
    429   1.9     oster 		raidID, part));
    430   1.1     oster 
    431   1.1     oster 
    432   1.1     oster 	if ((rs->sc_flags & RAIDF_INITED) &&
    433   1.1     oster 	    (rs->sc_dkdev.dk_openmask == 0))
    434   1.9     oster 		raidgetdisklabel(dev);
    435   1.1     oster 
    436   1.1     oster 	/* make sure that this partition exists */
    437   1.1     oster 
    438   1.1     oster 	if (part != RAW_PART) {
    439   1.1     oster 		db1_printf(("Not a raw partition..\n"));
    440   1.1     oster 		if (((rs->sc_flags & RAIDF_INITED) == 0) ||
    441   1.1     oster 		    ((part >= lp->d_npartitions) ||
    442   1.9     oster 			(lp->d_partitions[part].p_fstype == FS_UNUSED))) {
    443   1.1     oster 			error = ENXIO;
    444   1.1     oster 			raidunlock(rs);
    445   1.1     oster 			db1_printf(("Bailing out...\n"));
    446   1.9     oster 			return (error);
    447   1.1     oster 		}
    448   1.1     oster 	}
    449   1.1     oster 	/* Prevent this unit from being unconfigured while open. */
    450   1.1     oster 	switch (fmt) {
    451   1.1     oster 	case S_IFCHR:
    452   1.1     oster 		rs->sc_dkdev.dk_copenmask |= pmask;
    453   1.1     oster 		break;
    454   1.1     oster 
    455   1.1     oster 	case S_IFBLK:
    456   1.1     oster 		rs->sc_dkdev.dk_bopenmask |= pmask;
    457   1.1     oster 		break;
    458   1.1     oster 	}
    459   1.1     oster 	rs->sc_dkdev.dk_openmask =
    460   1.1     oster 	    rs->sc_dkdev.dk_copenmask | rs->sc_dkdev.dk_bopenmask;
    461   1.1     oster 
    462   1.1     oster 	raidunlock(rs);
    463   1.1     oster 
    464   1.9     oster 	return (error);
    465   1.1     oster 
    466   1.1     oster 
    467   1.1     oster }
    468   1.1     oster /* ARGSUSED */
    469   1.1     oster int
    470   1.1     oster raidclose(dev, flags, fmt, p)
    471   1.9     oster 	dev_t   dev;
    472   1.9     oster 	int     flags, fmt;
    473   1.1     oster 	struct proc *p;
    474   1.1     oster {
    475   1.9     oster 	int     unit = raidunit(dev);
    476   1.1     oster 	struct raid_softc *rs;
    477   1.9     oster 	int     error = 0;
    478   1.9     oster 	int     part;
    479   1.1     oster 
    480   1.1     oster 	if (unit >= numraid)
    481   1.1     oster 		return (ENXIO);
    482   1.1     oster 	rs = &raid_softc[unit];
    483   1.1     oster 
    484   1.1     oster 	if ((error = raidlock(rs)) != 0)
    485   1.1     oster 		return (error);
    486   1.1     oster 
    487   1.1     oster 	part = DISKPART(dev);
    488   1.1     oster 
    489   1.1     oster 	/* ...that much closer to allowing unconfiguration... */
    490   1.1     oster 	switch (fmt) {
    491   1.1     oster 	case S_IFCHR:
    492   1.1     oster 		rs->sc_dkdev.dk_copenmask &= ~(1 << part);
    493   1.1     oster 		break;
    494   1.1     oster 
    495   1.1     oster 	case S_IFBLK:
    496   1.1     oster 		rs->sc_dkdev.dk_bopenmask &= ~(1 << part);
    497   1.1     oster 		break;
    498   1.1     oster 	}
    499   1.1     oster 	rs->sc_dkdev.dk_openmask =
    500   1.1     oster 	    rs->sc_dkdev.dk_copenmask | rs->sc_dkdev.dk_bopenmask;
    501   1.1     oster 
    502   1.1     oster 	raidunlock(rs);
    503   1.1     oster 	return (0);
    504   1.1     oster 
    505   1.1     oster }
    506   1.1     oster 
    507   1.1     oster void
    508   1.1     oster raidstrategy(bp)
    509   1.1     oster 	register struct buf *bp;
    510   1.1     oster {
    511   1.1     oster 	register int s;
    512   1.1     oster 
    513   1.1     oster 	unsigned int raidID = raidunit(bp->b_dev);
    514   1.1     oster 	RF_Raid_t *raidPtr;
    515   1.1     oster 	struct raid_softc *rs = &raid_softc[raidID];
    516   1.1     oster 	struct disklabel *lp;
    517   1.9     oster 	int     wlabel;
    518   1.1     oster 
    519   1.5     oster #if 0
    520   1.9     oster 	db1_printf(("Strategy: 0x%x 0x%x\n", bp, bp->b_data));
    521   1.9     oster 	db1_printf(("Strategy(2): bp->b_bufsize%d\n", (int) bp->b_bufsize));
    522   1.9     oster 	db1_printf(("bp->b_count=%d\n", (int) bp->b_bcount));
    523   1.9     oster 	db1_printf(("bp->b_resid=%d\n", (int) bp->b_resid));
    524   1.9     oster 	db1_printf(("bp->b_blkno=%d\n", (int) bp->b_blkno));
    525   1.5     oster 
    526   1.9     oster 	if (bp->b_flags & B_READ)
    527   1.1     oster 		db1_printf(("READ\n"));
    528   1.1     oster 	else
    529   1.1     oster 		db1_printf(("WRITE\n"));
    530   1.1     oster #endif
    531   1.1     oster 	if (rf_kbooted != RFK_BOOT_GOOD)
    532   1.1     oster 		return;
    533   1.1     oster 	if (raidID >= numraid || !raidPtrs[raidID]) {
    534   1.1     oster 		bp->b_error = ENODEV;
    535   1.1     oster 		bp->b_flags |= B_ERROR;
    536   1.1     oster 		bp->b_resid = bp->b_bcount;
    537   1.1     oster 		biodone(bp);
    538   1.1     oster 		return;
    539   1.1     oster 	}
    540   1.1     oster 	raidPtr = raidPtrs[raidID];
    541   1.1     oster 	if (!raidPtr->valid) {
    542   1.1     oster 		bp->b_error = ENODEV;
    543   1.1     oster 		bp->b_flags |= B_ERROR;
    544   1.1     oster 		bp->b_resid = bp->b_bcount;
    545   1.1     oster 		biodone(bp);
    546   1.1     oster 		return;
    547   1.1     oster 	}
    548   1.1     oster 	if (bp->b_bcount == 0) {
    549   1.1     oster 		db1_printf(("b_bcount is zero..\n"));
    550   1.1     oster 		biodone(bp);
    551   1.1     oster 		return;
    552   1.1     oster 	}
    553   1.1     oster 	lp = rs->sc_dkdev.dk_label;
    554   1.1     oster 
    555   1.1     oster 	/*
    556   1.1     oster 	 * Do bounds checking and adjust transfer.  If there's an
    557   1.1     oster 	 * error, the bounds check will flag that for us.
    558   1.1     oster 	 */
    559   1.1     oster 
    560   1.9     oster 	wlabel = rs->sc_flags & (RAIDF_WLABEL | RAIDF_LABELLING);
    561   1.1     oster 	if (DISKPART(bp->b_dev) != RAW_PART)
    562   1.1     oster 		if (bounds_check_with_label(bp, lp, wlabel) <= 0) {
    563   1.1     oster 			db1_printf(("Bounds check failed!!:%d %d\n",
    564   1.9     oster 				(int) bp->b_blkno, (int) wlabel));
    565   1.1     oster 			biodone(bp);
    566   1.1     oster 			return;
    567   1.1     oster 		}
    568   1.9     oster 	s = splbio();		/* XXX Needed? */
    569   1.9     oster 	db1_printf(("Beginning strategy...\n"));
    570   1.1     oster 
    571   1.1     oster 	bp->b_resid = 0;
    572   1.9     oster 	bp->b_error = rf_DoAccessKernel(raidPtrs[raidID], bp,
    573   1.9     oster 	    NULL, NULL, NULL);
    574   1.1     oster 	if (bp->b_error) {
    575   1.1     oster 		bp->b_flags |= B_ERROR;
    576   1.1     oster 		db1_printf(("bp->b_flags HAS B_ERROR SET!!!: %d\n",
    577   1.9     oster 			bp->b_error));
    578   1.1     oster 	}
    579   1.1     oster 	splx(s);
    580   1.5     oster #if 0
    581   1.1     oster 	db1_printf(("Strategy exiting: 0x%x 0x%x %d %d\n",
    582   1.9     oster 		bp, bp->b_data,
    583   1.9     oster 		(int) bp->b_bcount, (int) bp->b_resid));
    584   1.5     oster #endif
    585   1.1     oster }
    586   1.1     oster /* ARGSUSED */
    587   1.1     oster int
    588   1.1     oster raidread(dev, uio, flags)
    589   1.9     oster 	dev_t   dev;
    590   1.1     oster 	struct uio *uio;
    591   1.9     oster 	int     flags;
    592   1.1     oster {
    593   1.9     oster 	int     unit = raidunit(dev);
    594   1.1     oster 	struct raid_softc *rs;
    595   1.9     oster 	int     result;
    596   1.9     oster 	int     part;
    597   1.1     oster 
    598   1.1     oster 	if (unit >= numraid)
    599   1.1     oster 		return (ENXIO);
    600   1.1     oster 	rs = &raid_softc[unit];
    601   1.1     oster 
    602   1.1     oster 	if ((rs->sc_flags & RAIDF_INITED) == 0)
    603   1.1     oster 		return (ENXIO);
    604   1.1     oster 	part = DISKPART(dev);
    605   1.1     oster 
    606   1.9     oster 	db1_printf(("raidread: unit: %d partition: %d\n", unit, part));
    607   1.1     oster 
    608   1.1     oster #if 0
    609   1.1     oster 	return (physio(raidstrategy, NULL, dev, B_READ, minphys, uio));
    610   1.1     oster #endif
    611   1.9     oster 	result = physio(raidstrategy, NULL, dev, B_READ, minphys, uio);
    612   1.1     oster 	db1_printf(("raidread done.  Result is %d %d\n",
    613   1.9     oster 		result, uio->uio_resid));
    614   1.9     oster 	return (result);
    615   1.1     oster 
    616   1.1     oster }
    617   1.1     oster /* ARGSUSED */
    618   1.1     oster int
    619   1.1     oster raidwrite(dev, uio, flags)
    620   1.9     oster 	dev_t   dev;
    621   1.1     oster 	struct uio *uio;
    622   1.9     oster 	int     flags;
    623   1.1     oster {
    624   1.9     oster 	int     unit = raidunit(dev);
    625   1.1     oster 	struct raid_softc *rs;
    626   1.1     oster 
    627   1.1     oster 	if (unit >= numraid)
    628   1.1     oster 		return (ENXIO);
    629   1.1     oster 	rs = &raid_softc[unit];
    630   1.1     oster 
    631   1.1     oster 	if ((rs->sc_flags & RAIDF_INITED) == 0)
    632   1.1     oster 		return (ENXIO);
    633   1.1     oster 	db1_printf(("raidwrite\n"));
    634   1.1     oster 	return (physio(raidstrategy, NULL, dev, B_WRITE, minphys, uio));
    635   1.1     oster 
    636   1.1     oster 
    637   1.1     oster }
    638   1.1     oster 
    639   1.1     oster int
    640   1.1     oster raidioctl(dev, cmd, data, flag, p)
    641   1.9     oster 	dev_t   dev;
    642   1.9     oster 	u_long  cmd;
    643   1.1     oster 	caddr_t data;
    644   1.9     oster 	int     flag;
    645   1.1     oster 	struct proc *p;
    646   1.1     oster {
    647   1.9     oster 	int     unit = raidunit(dev);
    648   1.9     oster 	int     error = 0;
    649   1.9     oster 	int     part, pmask;
    650   1.1     oster 	struct raid_softc *rs;
    651   1.1     oster #if 0
    652   1.9     oster 	int     r, c;
    653   1.1     oster #endif
    654   1.9     oster 	/* struct raid_ioctl *ccio = (struct ccd_ioctl *)data; */
    655   1.1     oster 
    656   1.9     oster 	/* struct ccdbuf *cbp; */
    657   1.9     oster 	/* struct raidbuf *raidbp; */
    658   1.1     oster 	RF_Config_t *k_cfg, *u_cfg;
    659   1.1     oster 	u_char *specific_buf;
    660   1.9     oster 	int     retcode = 0;
    661   1.1     oster 
    662   1.9     oster 	int     row;
    663   1.1     oster 	struct rf_recon_req *rrcopy, *rr;
    664   1.1     oster #if 0
    665   1.9     oster 	int     nbytes, spl, rw, row;
    666   1.1     oster 	struct rf_test_acc *ta;
    667   1.1     oster 	struct buf *bp;
    668   1.1     oster 	RF_SparetWait_t *waitreq;
    669   1.1     oster 	struct rf_test_acc *ta_p, *ta_copy;
    670   1.1     oster #endif
    671   1.1     oster 
    672   1.1     oster 	if (unit >= numraid)
    673   1.1     oster 		return (ENXIO);
    674   1.1     oster 	rs = &raid_softc[unit];
    675   1.1     oster 
    676   1.9     oster 	db1_printf(("raidioctl: %d %d %d %d\n", (int) dev,
    677   1.9     oster 		(int) DISKPART(dev), (int) unit, (int) cmd));
    678   1.1     oster 
    679   1.1     oster 	/* Must be open for writes for these commands... */
    680   1.1     oster 	switch (cmd) {
    681   1.1     oster 	case DIOCSDINFO:
    682   1.1     oster 	case DIOCWDINFO:
    683   1.1     oster 	case DIOCWLABEL:
    684   1.1     oster 		if ((flag & FWRITE) == 0)
    685   1.1     oster 			return (EBADF);
    686   1.1     oster 	}
    687   1.1     oster 
    688   1.1     oster 	/* Must be initialized for these... */
    689   1.1     oster 	switch (cmd) {
    690   1.1     oster 	case DIOCGDINFO:
    691   1.1     oster 	case DIOCSDINFO:
    692   1.1     oster 	case DIOCWDINFO:
    693   1.1     oster 	case DIOCGPART:
    694   1.1     oster 	case DIOCWLABEL:
    695   1.1     oster 	case DIOCGDEFLABEL:
    696   1.1     oster 	case RAIDFRAME_SHUTDOWN:
    697   1.1     oster 	case RAIDFRAME_REWRITEPARITY:
    698   1.1     oster 	case RAIDFRAME_GET_INFO:
    699   1.1     oster 	case RAIDFRAME_RESET_ACCTOTALS:
    700   1.1     oster 	case RAIDFRAME_GET_ACCTOTALS:
    701   1.1     oster 	case RAIDFRAME_KEEP_ACCTOTALS:
    702   1.1     oster 	case RAIDFRAME_GET_SIZE:
    703   1.1     oster 	case RAIDFRAME_FAIL_DISK:
    704   1.1     oster 	case RAIDFRAME_COPYBACK:
    705   1.1     oster 	case RAIDFRAME_CHECKRECON:
    706   1.1     oster 		if ((rs->sc_flags & RAIDF_INITED) == 0)
    707   1.1     oster 			return (ENXIO);
    708   1.1     oster 	}
    709   1.9     oster 
    710   1.1     oster 	switch (cmd) {
    711   1.1     oster 
    712   1.1     oster 
    713   1.1     oster 		/* configure the system */
    714   1.1     oster 	case RAIDFRAME_CONFIGURE:
    715   1.1     oster 
    716   1.1     oster 		db3_printf(("rf_ioctl: RAIDFRAME_CONFIGURE\n"));
    717   1.1     oster 		/* copy-in the configuration information */
    718   1.1     oster 		/* data points to a pointer to the configuration structure */
    719   1.9     oster 		u_cfg = *((RF_Config_t **) data);
    720   1.9     oster 		RF_Malloc(k_cfg, sizeof(RF_Config_t), (RF_Config_t *));
    721   1.1     oster 		if (k_cfg == NULL) {
    722   1.1     oster 			db3_printf(("rf_ioctl: ENOMEM for config. Code is %d\n", retcode));
    723   1.9     oster 			return (ENOMEM);
    724   1.1     oster 		}
    725   1.9     oster 		retcode = copyin((caddr_t) u_cfg, (caddr_t) k_cfg,
    726   1.9     oster 		    sizeof(RF_Config_t));
    727   1.1     oster 		if (retcode) {
    728   1.9     oster 			db3_printf(("rf_ioctl: retcode=%d copyin.1\n",
    729   1.9     oster 				retcode));
    730   1.9     oster 			return (retcode);
    731   1.1     oster 		}
    732   1.9     oster 		/* allocate a buffer for the layout-specific data, and copy it
    733   1.9     oster 		 * in */
    734   1.1     oster 		if (k_cfg->layoutSpecificSize) {
    735   1.9     oster 			if (k_cfg->layoutSpecificSize > 10000) {
    736   1.1     oster 				/* sanity check */
    737   1.1     oster 				db3_printf(("rf_ioctl: EINVAL %d\n", retcode));
    738   1.9     oster 				return (EINVAL);
    739   1.1     oster 			}
    740   1.9     oster 			RF_Malloc(specific_buf, k_cfg->layoutSpecificSize,
    741   1.9     oster 			    (u_char *));
    742   1.1     oster 			if (specific_buf == NULL) {
    743   1.9     oster 				RF_Free(k_cfg, sizeof(RF_Config_t));
    744   1.1     oster 				db3_printf(("rf_ioctl: ENOMEM %d\n", retcode));
    745   1.9     oster 				return (ENOMEM);
    746   1.1     oster 			}
    747   1.9     oster 			retcode = copyin(k_cfg->layoutSpecific,
    748   1.9     oster 			    (caddr_t) specific_buf,
    749   1.9     oster 			    k_cfg->layoutSpecificSize);
    750   1.1     oster 			if (retcode) {
    751   1.1     oster 				db3_printf(("rf_ioctl: retcode=%d copyin.2\n",
    752   1.9     oster 					retcode));
    753   1.9     oster 				return (retcode);
    754   1.1     oster 			}
    755   1.9     oster 		} else
    756   1.9     oster 			specific_buf = NULL;
    757   1.1     oster 		k_cfg->layoutSpecific = specific_buf;
    758   1.9     oster 
    759   1.9     oster 		/* should do some kind of sanity check on the configuration.
    760   1.9     oster 		 * Store the sum of all the bytes in the last byte? */
    761   1.1     oster 
    762   1.5     oster #if 0
    763   1.1     oster 		db1_printf(("Considering configuring the system.:%d 0x%x\n",
    764   1.9     oster 			unit, p));
    765   1.5     oster #endif
    766   1.1     oster 
    767   1.9     oster 		/* We need the pointer to this a little deeper, so stash it
    768   1.9     oster 		 * here... */
    769   1.1     oster 
    770   1.1     oster 		raidPtrs[unit]->proc = p;
    771   1.1     oster 
    772   1.1     oster 		/* configure the system */
    773   1.1     oster 		rf_pending_testaccs = 0;
    774   1.1     oster 
    775   1.1     oster 
    776   1.1     oster 		raidPtrs[unit]->raidid = unit;
    777   1.1     oster 		retcode = rf_Configure(raidPtrs[unit], k_cfg);
    778   1.1     oster 
    779   1.9     oster 
    780   1.1     oster 		if (retcode == 0) {
    781   1.9     oster 			retcode = raidinit(dev, raidPtrs[unit], unit);
    782   1.9     oster 		}
    783   1.1     oster 		/* free the buffers.  No return code here. */
    784   1.1     oster 		if (k_cfg->layoutSpecificSize) {
    785   1.9     oster 			RF_Free(specific_buf, k_cfg->layoutSpecificSize);
    786   1.1     oster 		}
    787   1.9     oster 		RF_Free(k_cfg, sizeof(RF_Config_t));
    788   1.9     oster 
    789   1.9     oster 		db3_printf(("rf_ioctl: retcode=%d RAIDFRAME_CONFIGURE\n",
    790   1.9     oster 			retcode));
    791   1.9     oster 		return (retcode);
    792   1.9     oster 
    793   1.9     oster 		/* shutdown the system */
    794   1.1     oster 	case RAIDFRAME_SHUTDOWN:
    795   1.9     oster 
    796   1.9     oster 		if ((error = raidlock(rs)) != 0)
    797   1.9     oster 			return (error);
    798   1.1     oster 
    799   1.1     oster 		/*
    800   1.1     oster 		 * If somebody has a partition mounted, we shouldn't
    801   1.1     oster 		 * shutdown.
    802   1.1     oster 		 */
    803   1.1     oster 
    804   1.1     oster 		part = DISKPART(dev);
    805   1.1     oster 		pmask = (1 << part);
    806   1.9     oster 		if ((rs->sc_dkdev.dk_openmask & ~pmask) ||
    807   1.9     oster 		    ((rs->sc_dkdev.dk_bopenmask & pmask) &&
    808   1.9     oster 			(rs->sc_dkdev.dk_copenmask & pmask))) {
    809   1.9     oster 			raidunlock(rs);
    810   1.9     oster 			return (EBUSY);
    811   1.9     oster 		}
    812   1.1     oster 		/* the intention here was to disallow shutdowns while
    813   1.9     oster 		 * raidframe is mounted, but it doesn't work because the
    814   1.9     oster 		 * shutdown ioctl calls rf_open */
    815   1.1     oster 		if (rf_pending_testaccs > 0) {
    816   1.1     oster 			printf("RAIDFRAME:  Can't shutdown because there are %d pending test accs\n",
    817   1.9     oster 			    rf_pending_testaccs);
    818   1.9     oster 			return (EINVAL);
    819   1.1     oster 		}
    820   1.1     oster 		if (rf_debugKernelAccess) {
    821   1.1     oster 			printf("call shutdown\n");
    822   1.1     oster 		}
    823   1.9     oster 		raidPtrs[unit]->proc = p;	/* XXX  necessary evil */
    824   1.1     oster 		retcode = rf_Shutdown(raidPtrs[unit]);
    825   1.1     oster 
    826   1.3   hubertf 		db1_printf(("Done main shutdown\n"));
    827   1.1     oster 
    828   1.1     oster 		pool_destroy(&rs->sc_cbufpool);
    829   1.3   hubertf 		db1_printf(("Done freeing component buffer freelist\n"));
    830   1.1     oster 
    831   1.1     oster 		/* It's no longer initialized... */
    832   1.1     oster 		rs->sc_flags &= ~RAIDF_INITED;
    833   1.1     oster 
    834   1.9     oster 		/* Detach the disk. */
    835   1.9     oster 		disk_detach(&rs->sc_dkdev);
    836   1.1     oster 
    837   1.1     oster 		raidunlock(rs);
    838   1.1     oster 
    839   1.9     oster 		return (retcode);
    840   1.9     oster 
    841   1.1     oster 		/* initialize all parity */
    842   1.1     oster 	case RAIDFRAME_REWRITEPARITY:
    843   1.1     oster 
    844   1.9     oster 		if (raidPtrs[unit]->Layout.map->faultsTolerated == 0)
    845   1.9     oster 			return (EINVAL);
    846   1.1     oster 		/* borrow the thread of the requesting process */
    847   1.9     oster 		raidPtrs[unit]->proc = p;	/* Blah... :-p GO */
    848   1.1     oster 		retcode = rf_RewriteParity(raidPtrs[unit]);
    849   1.9     oster 		/* return I/O Error if the parity rewrite fails */
    850   1.1     oster 
    851   1.9     oster 		if (retcode)
    852   1.9     oster 			retcode = EIO;
    853   1.9     oster 		return (retcode);
    854   1.9     oster 
    855   1.9     oster 		/* issue a test-unit-ready through raidframe to the indicated
    856   1.9     oster 		 * device */
    857   1.9     oster #if 0				/* XXX not supported yet (ever?) */
    858   1.1     oster 	case RAIDFRAME_TUR:
    859   1.1     oster 		/* debug only */
    860   1.9     oster 		retcode = rf_SCSI_DoTUR(0, 0, 0, 0, *(dev_t *) data);
    861   1.9     oster 		return (retcode);
    862   1.1     oster #endif
    863   1.1     oster 	case RAIDFRAME_GET_INFO:
    864   1.1     oster 		{
    865   1.1     oster 			RF_Raid_t *raid = raidPtrs[unit];
    866   1.1     oster 			RF_DeviceConfig_t *cfg, **ucfgp;
    867   1.9     oster 			int     i, j, d;
    868   1.9     oster 
    869   1.1     oster 			if (!raid->valid)
    870   1.9     oster 				return (ENODEV);
    871   1.9     oster 			ucfgp = (RF_DeviceConfig_t **) data;
    872   1.9     oster 			RF_Malloc(cfg, sizeof(RF_DeviceConfig_t),
    873   1.9     oster 			    (RF_DeviceConfig_t *));
    874   1.1     oster 			if (cfg == NULL)
    875   1.9     oster 				return (ENOMEM);
    876   1.9     oster 			bzero((char *) cfg, sizeof(RF_DeviceConfig_t));
    877   1.1     oster 			cfg->rows = raid->numRow;
    878   1.1     oster 			cfg->cols = raid->numCol;
    879   1.1     oster 			cfg->ndevs = raid->numRow * raid->numCol;
    880   1.1     oster 			if (cfg->ndevs >= RF_MAX_DISKS) {
    881   1.1     oster 				cfg->ndevs = 0;
    882   1.9     oster 				return (ENOMEM);
    883   1.1     oster 			}
    884   1.1     oster 			cfg->nspares = raid->numSpare;
    885   1.1     oster 			if (cfg->nspares >= RF_MAX_DISKS) {
    886   1.1     oster 				cfg->nspares = 0;
    887   1.9     oster 				return (ENOMEM);
    888   1.1     oster 			}
    889   1.1     oster 			cfg->maxqdepth = raid->maxQueueDepth;
    890   1.1     oster 			d = 0;
    891   1.9     oster 			for (i = 0; i < cfg->rows; i++) {
    892   1.9     oster 				for (j = 0; j < cfg->cols; j++) {
    893   1.1     oster 					cfg->devs[d] = raid->Disks[i][j];
    894   1.1     oster 					d++;
    895   1.1     oster 				}
    896   1.1     oster 			}
    897   1.9     oster 			for (j = cfg->cols, i = 0; i < cfg->nspares; i++, j++) {
    898   1.1     oster 				cfg->spares[i] = raid->Disks[0][j];
    899   1.1     oster 			}
    900   1.9     oster 			retcode = copyout((caddr_t) cfg, (caddr_t) * ucfgp,
    901   1.9     oster 			    sizeof(RF_DeviceConfig_t));
    902   1.9     oster 			RF_Free(cfg, sizeof(RF_DeviceConfig_t));
    903   1.9     oster 
    904   1.9     oster 			return (retcode);
    905   1.1     oster 		}
    906   1.9     oster 		break;
    907   1.9     oster 
    908   1.1     oster 	case RAIDFRAME_RESET_ACCTOTALS:
    909   1.1     oster 		{
    910   1.1     oster 			RF_Raid_t *raid = raidPtrs[unit];
    911   1.9     oster 
    912   1.1     oster 			bzero(&raid->acc_totals, sizeof(raid->acc_totals));
    913   1.9     oster 			return (0);
    914   1.1     oster 		}
    915   1.9     oster 		break;
    916   1.9     oster 
    917   1.1     oster 	case RAIDFRAME_GET_ACCTOTALS:
    918   1.1     oster 		{
    919   1.9     oster 			RF_AccTotals_t *totals = (RF_AccTotals_t *) data;
    920   1.1     oster 			RF_Raid_t *raid = raidPtrs[unit];
    921   1.9     oster 
    922   1.1     oster 			*totals = raid->acc_totals;
    923   1.9     oster 			return (0);
    924   1.1     oster 		}
    925   1.9     oster 		break;
    926   1.9     oster 
    927   1.1     oster 	case RAIDFRAME_KEEP_ACCTOTALS:
    928   1.1     oster 		{
    929   1.1     oster 			RF_Raid_t *raid = raidPtrs[unit];
    930   1.9     oster 			int    *keep = (int *) data;
    931   1.9     oster 
    932   1.1     oster 			raid->keep_acc_totals = *keep;
    933   1.9     oster 			return (0);
    934   1.1     oster 		}
    935   1.9     oster 		break;
    936   1.9     oster 
    937   1.1     oster 	case RAIDFRAME_GET_SIZE:
    938   1.1     oster 		*(int *) data = raidPtrs[unit]->totalSectors;
    939   1.9     oster 		return (0);
    940   1.1     oster 
    941   1.1     oster #define RAIDFRAME_RECON 1
    942   1.1     oster 		/* XXX The above should probably be set somewhere else!! GO */
    943   1.1     oster #if RAIDFRAME_RECON > 0
    944   1.1     oster 
    945   1.1     oster 		/* fail a disk & optionally start reconstruction */
    946   1.1     oster 	case RAIDFRAME_FAIL_DISK:
    947   1.1     oster 		rr = (struct rf_recon_req *) data;
    948   1.9     oster 
    949   1.9     oster 		if (rr->row < 0 || rr->row >= raidPtrs[unit]->numRow
    950   1.1     oster 		    || rr->col < 0 || rr->col >= raidPtrs[unit]->numCol)
    951   1.9     oster 			return (EINVAL);
    952   1.1     oster 
    953   1.9     oster 		printf("Failing the disk: row: %d col: %d\n", rr->row, rr->col);
    954   1.9     oster 
    955   1.9     oster 		/* make a copy of the recon request so that we don't rely on
    956   1.9     oster 		 * the user's buffer */
    957   1.1     oster 		RF_Malloc(rrcopy, sizeof(*rrcopy), (struct rf_recon_req *));
    958   1.1     oster 		bcopy(rr, rrcopy, sizeof(*rr));
    959   1.1     oster 		rrcopy->raidPtr = (void *) raidPtrs[unit];
    960   1.1     oster 
    961   1.1     oster 		LOCK_RECON_Q_MUTEX();
    962   1.1     oster 		rrcopy->next = recon_queue;
    963   1.1     oster 		recon_queue = rrcopy;
    964   1.1     oster 		wakeup(&recon_queue);
    965   1.1     oster 		UNLOCK_RECON_Q_MUTEX();
    966   1.9     oster 
    967   1.9     oster 		return (0);
    968   1.9     oster 
    969   1.9     oster 		/* invoke a copyback operation after recon on whatever disk
    970   1.9     oster 		 * needs it, if any */
    971   1.9     oster 	case RAIDFRAME_COPYBACK:
    972   1.1     oster 		/* borrow the current thread to get this done */
    973   1.9     oster 		raidPtrs[unit]->proc = p;	/* ICK.. but needed :-p  GO */
    974   1.1     oster 		rf_CopybackReconstructedData(raidPtrs[unit]);
    975   1.9     oster 		return (0);
    976   1.9     oster 
    977   1.1     oster 		/* return the percentage completion of reconstruction */
    978   1.1     oster 	case RAIDFRAME_CHECKRECON:
    979   1.1     oster 		row = *(int *) data;
    980   1.1     oster 		if (row < 0 || row >= raidPtrs[unit]->numRow)
    981   1.9     oster 			return (EINVAL);
    982   1.9     oster 		if (raidPtrs[unit]->status[row] != rf_rs_reconstructing)
    983   1.1     oster 			*(int *) data = 100;
    984   1.9     oster 		else
    985   1.1     oster 			*(int *) data = raidPtrs[unit]->reconControl[row]->percentComplete;
    986   1.9     oster 		return (0);
    987   1.9     oster 
    988   1.9     oster 		/* the sparetable daemon calls this to wait for the kernel to
    989   1.9     oster 		 * need a spare table. this ioctl does not return until a
    990   1.9     oster 		 * spare table is needed. XXX -- calling mpsleep here in the
    991   1.9     oster 		 * ioctl code is almost certainly wrong and evil. -- XXX XXX
    992   1.9     oster 		 * -- I should either compute the spare table in the kernel,
    993   1.9     oster 		 * or have a different -- XXX XXX -- interface (a different
    994   1.9     oster 		 * character device) for delivering the table          -- XXX */
    995   1.1     oster #if 0
    996   1.1     oster 	case RAIDFRAME_SPARET_WAIT:
    997   1.1     oster 		RF_LOCK_MUTEX(rf_sparet_wait_mutex);
    998   1.9     oster 		while (!rf_sparet_wait_queue)
    999   1.9     oster 			mpsleep(&rf_sparet_wait_queue, (PZERO + 1) | PCATCH, "sparet wait", 0, (void *) simple_lock_addr(rf_sparet_wait_mutex), MS_LOCK_SIMPLE);
   1000   1.1     oster 		waitreq = rf_sparet_wait_queue;
   1001   1.1     oster 		rf_sparet_wait_queue = rf_sparet_wait_queue->next;
   1002   1.1     oster 		RF_UNLOCK_MUTEX(rf_sparet_wait_mutex);
   1003   1.9     oster 
   1004   1.9     oster 		*((RF_SparetWait_t *) data) = *waitreq;	/* structure assignment */
   1005   1.9     oster 
   1006   1.1     oster 		RF_Free(waitreq, sizeof(*waitreq));
   1007   1.9     oster 		return (0);
   1008   1.9     oster 
   1009   1.9     oster 
   1010   1.9     oster 		/* wakes up a process waiting on SPARET_WAIT and puts an error
   1011   1.9     oster 		 * code in it that will cause the dameon to exit */
   1012   1.1     oster 	case RAIDFRAME_ABORT_SPARET_WAIT:
   1013   1.1     oster 		RF_Malloc(waitreq, sizeof(*waitreq), (RF_SparetWait_t *));
   1014   1.1     oster 		waitreq->fcol = -1;
   1015   1.1     oster 		RF_LOCK_MUTEX(rf_sparet_wait_mutex);
   1016   1.1     oster 		waitreq->next = rf_sparet_wait_queue;
   1017   1.1     oster 		rf_sparet_wait_queue = waitreq;
   1018   1.1     oster 		RF_UNLOCK_MUTEX(rf_sparet_wait_mutex);
   1019   1.1     oster 		wakeup(&rf_sparet_wait_queue);
   1020   1.9     oster 		return (0);
   1021   1.1     oster 
   1022   1.9     oster 		/* used by the spare table daemon to deliver a spare table
   1023   1.9     oster 		 * into the kernel */
   1024   1.1     oster 	case RAIDFRAME_SEND_SPARET:
   1025   1.9     oster 
   1026   1.1     oster 		/* install the spare table */
   1027   1.9     oster 		retcode = rf_SetSpareTable(raidPtrs[unit], *(void **) data);
   1028   1.9     oster 
   1029   1.9     oster 		/* respond to the requestor.  the return status of the spare
   1030   1.9     oster 		 * table installation is passed in the "fcol" field */
   1031   1.1     oster 		RF_Malloc(waitreq, sizeof(*waitreq), (RF_SparetWait_t *));
   1032   1.1     oster 		waitreq->fcol = retcode;
   1033   1.1     oster 		RF_LOCK_MUTEX(rf_sparet_wait_mutex);
   1034   1.1     oster 		waitreq->next = rf_sparet_resp_queue;
   1035   1.1     oster 		rf_sparet_resp_queue = waitreq;
   1036   1.1     oster 		wakeup(&rf_sparet_resp_queue);
   1037   1.1     oster 		RF_UNLOCK_MUTEX(rf_sparet_wait_mutex);
   1038   1.9     oster 
   1039   1.9     oster 		return (retcode);
   1040   1.1     oster #endif
   1041   1.1     oster 
   1042   1.1     oster 
   1043   1.9     oster #endif				/* RAIDFRAME_RECON > 0 */
   1044   1.9     oster 
   1045   1.9     oster 	default:
   1046   1.9     oster 		break;		/* fall through to the os-specific code below */
   1047   1.1     oster 
   1048   1.1     oster 	}
   1049   1.9     oster 
   1050   1.1     oster 	if (!raidPtrs[unit]->valid)
   1051   1.9     oster 		return (EINVAL);
   1052   1.9     oster 
   1053   1.1     oster 	/*
   1054   1.1     oster 	 * Add support for "regular" device ioctls here.
   1055   1.1     oster 	 */
   1056   1.9     oster 
   1057   1.1     oster 	switch (cmd) {
   1058   1.1     oster 	case DIOCGDINFO:
   1059   1.9     oster 		db1_printf(("DIOCGDINFO %d %d\n", (int) dev, (int) DISKPART(dev)));
   1060   1.9     oster 		*(struct disklabel *) data = *(rs->sc_dkdev.dk_label);
   1061   1.1     oster 		break;
   1062   1.1     oster 
   1063   1.1     oster 	case DIOCGPART:
   1064   1.9     oster 		db1_printf(("DIOCGPART: %d %d\n", (int) dev, (int) DISKPART(dev)));
   1065   1.9     oster 		((struct partinfo *) data)->disklab = rs->sc_dkdev.dk_label;
   1066   1.9     oster 		((struct partinfo *) data)->part =
   1067   1.1     oster 		    &rs->sc_dkdev.dk_label->d_partitions[DISKPART(dev)];
   1068   1.1     oster 		break;
   1069   1.1     oster 
   1070   1.1     oster 	case DIOCWDINFO:
   1071   1.1     oster 		db1_printf(("DIOCWDINFO\n"));
   1072   1.1     oster 	case DIOCSDINFO:
   1073   1.1     oster 		db1_printf(("DIOCSDINFO\n"));
   1074   1.1     oster 		if ((error = raidlock(rs)) != 0)
   1075   1.1     oster 			return (error);
   1076   1.1     oster 
   1077   1.1     oster 		rs->sc_flags |= RAIDF_LABELLING;
   1078   1.1     oster 
   1079   1.1     oster 		error = setdisklabel(rs->sc_dkdev.dk_label,
   1080   1.9     oster 		    (struct disklabel *) data, 0, rs->sc_dkdev.dk_cpulabel);
   1081   1.1     oster 		if (error == 0) {
   1082   1.1     oster 			if (cmd == DIOCWDINFO)
   1083   1.1     oster 				error = writedisklabel(RAIDLABELDEV(dev),
   1084   1.1     oster 				    raidstrategy, rs->sc_dkdev.dk_label,
   1085   1.1     oster 				    rs->sc_dkdev.dk_cpulabel);
   1086   1.1     oster 		}
   1087   1.1     oster 		rs->sc_flags &= ~RAIDF_LABELLING;
   1088   1.1     oster 
   1089   1.1     oster 		raidunlock(rs);
   1090   1.1     oster 
   1091   1.1     oster 		if (error)
   1092   1.1     oster 			return (error);
   1093   1.1     oster 		break;
   1094   1.1     oster 
   1095   1.1     oster 	case DIOCWLABEL:
   1096   1.1     oster 		db1_printf(("DIOCWLABEL\n"));
   1097   1.9     oster 		if (*(int *) data != 0)
   1098   1.1     oster 			rs->sc_flags |= RAIDF_WLABEL;
   1099   1.1     oster 		else
   1100   1.1     oster 			rs->sc_flags &= ~RAIDF_WLABEL;
   1101   1.1     oster 		break;
   1102   1.1     oster 
   1103   1.1     oster 	case DIOCGDEFLABEL:
   1104   1.1     oster 		db1_printf(("DIOCGDEFLABEL\n"));
   1105   1.1     oster 		raidgetdefaultlabel(raidPtrs[unit], rs,
   1106   1.9     oster 		    (struct disklabel *) data);
   1107   1.1     oster 		break;
   1108   1.1     oster 
   1109   1.1     oster 	default:
   1110   1.9     oster 		retcode = ENOTTY;	/* XXXX ?? OR EINVAL ? */
   1111   1.1     oster 	}
   1112   1.9     oster 	return (retcode);
   1113   1.1     oster 
   1114   1.1     oster }
   1115   1.1     oster 
   1116   1.1     oster 
   1117   1.9     oster /* raidinit -- complete the rest of the initialization for the
   1118   1.1     oster    RAIDframe device.  */
   1119   1.1     oster 
   1120   1.1     oster 
   1121   1.1     oster static int
   1122   1.9     oster raidinit(dev, raidPtr, unit)
   1123   1.9     oster 	dev_t   dev;
   1124   1.1     oster 	RF_Raid_t *raidPtr;
   1125   1.9     oster 	int     unit;
   1126   1.1     oster {
   1127   1.9     oster 	int     retcode;
   1128   1.9     oster 	/* int ix; */
   1129   1.9     oster 	/* struct raidbuf *raidbp; */
   1130   1.1     oster 	struct raid_softc *rs;
   1131   1.1     oster 
   1132   1.1     oster 	retcode = 0;
   1133   1.1     oster 
   1134   1.1     oster 	rs = &raid_softc[unit];
   1135   1.1     oster 	pool_init(&rs->sc_cbufpool, sizeof(struct raidbuf), 0,
   1136   1.9     oster 	    0, 0, "raidpl", 0, NULL, NULL, M_RAIDFRAME);
   1137   1.9     oster 
   1138   1.1     oster 
   1139   1.1     oster 	/* XXX should check return code first... */
   1140   1.1     oster 	rs->sc_flags |= RAIDF_INITED;
   1141   1.1     oster 
   1142   1.9     oster 	sprintf(rs->sc_xname, "raid%d", unit);	/* XXX doesn't check bounds. */
   1143   1.1     oster 
   1144   1.9     oster 	rs->sc_dkdev.dk_name = rs->sc_xname;
   1145   1.1     oster 	/* disk_attach actually creates space for the CPU disklabel, among
   1146   1.9     oster 	 * other things, so it's critical to call this *BEFORE* we try putzing
   1147   1.9     oster 	 * with disklabels. */
   1148   1.1     oster 	disk_attach(&rs->sc_dkdev);
   1149   1.1     oster 
   1150   1.1     oster 	/* XXX There may be a weird interaction here between this, and
   1151   1.9     oster 	 * protectedSectors, as used in RAIDframe.  */
   1152   1.9     oster 	rs->sc_size = raidPtr->totalSectors;
   1153   1.1     oster 	rs->sc_dev = dev;
   1154   1.9     oster 	return (retcode);
   1155   1.1     oster }
   1156   1.1     oster 
   1157   1.1     oster 
   1158   1.1     oster /*********************************************************
   1159   1.1     oster  *
   1160   1.1     oster  * initialization code called at boot time (startup.c)
   1161   1.1     oster  *
   1162   1.1     oster  ********************************************************/
   1163   1.9     oster int
   1164   1.9     oster rf_boot()
   1165   1.1     oster {
   1166   1.9     oster 	int     i, rc;
   1167   1.1     oster 
   1168   1.9     oster 	rc = rf_mutex_init(&rf_sparet_wait_mutex);
   1169   1.9     oster 	if (rc) {
   1170   1.9     oster 		RF_PANIC();
   1171   1.9     oster 	}
   1172   1.9     oster 	rc = rf_mutex_init(&rf_async_done_q_mutex);
   1173   1.9     oster 	if (rc) {
   1174   1.9     oster 		RF_PANIC();
   1175   1.9     oster 	}
   1176   1.9     oster 	rf_sparet_wait_queue = rf_sparet_resp_queue = NULL;
   1177   1.9     oster 	recon_queue = NULL;
   1178   1.9     oster 	rf_async_done_qh = rf_async_done_qt = NULL;
   1179   1.9     oster 	for (i = 0; i < numraid; i++)
   1180   1.9     oster 		raidPtrs[i] = NULL;
   1181   1.9     oster 	rc = rf_BootRaidframe();
   1182   1.9     oster 	if (rc == 0)
   1183   1.9     oster 		printf("Kernelized RAIDframe activated\n");
   1184   1.9     oster 	else
   1185   1.9     oster 		rf_kbooted = RFK_BOOT_BAD;
   1186   1.9     oster 	return (rc);
   1187   1.1     oster }
   1188   1.1     oster /*
   1189   1.1     oster  * This kernel thread never exits.  It is created once, and persists
   1190   1.1     oster  * until the system reboots.
   1191   1.1     oster  */
   1192   1.9     oster void
   1193   1.9     oster rf_ReconKernelThread()
   1194   1.1     oster {
   1195   1.9     oster 	struct rf_recon_req *req;
   1196   1.9     oster 	int     s;
   1197   1.1     oster 
   1198   1.9     oster 	/* XXX not sure what spl() level we should be at here... probably
   1199   1.9     oster 	 * splbio() */
   1200   1.9     oster 	s = splbio();
   1201   1.1     oster 
   1202   1.9     oster 	while (1) {
   1203   1.9     oster 		/* grab the next reconstruction request from the queue */
   1204   1.9     oster 		LOCK_RECON_Q_MUTEX();
   1205   1.9     oster 		while (!recon_queue) {
   1206   1.9     oster 			UNLOCK_RECON_Q_MUTEX();
   1207   1.9     oster 			tsleep(&recon_queue, PRIBIO | PCATCH, "raidframe recon", 0);
   1208   1.9     oster 			LOCK_RECON_Q_MUTEX();
   1209   1.9     oster 		}
   1210   1.9     oster 		req = recon_queue;
   1211   1.9     oster 		recon_queue = recon_queue->next;
   1212   1.9     oster 		UNLOCK_RECON_Q_MUTEX();
   1213   1.9     oster 
   1214   1.9     oster 		/*
   1215   1.9     oster 	         * If flags specifies that we should start recon, this call
   1216   1.9     oster 	         * will not return until reconstruction completes, fails, or is aborted.
   1217   1.9     oster 	         */
   1218   1.9     oster 		rf_FailDisk((RF_Raid_t *) req->raidPtr, req->row, req->col,
   1219   1.9     oster 		    ((req->flags & RF_FDFLAGS_RECON) ? 1 : 0));
   1220   1.1     oster 
   1221   1.9     oster 		RF_Free(req, sizeof(*req));
   1222   1.9     oster 	}
   1223   1.1     oster }
   1224   1.1     oster /* wake up the daemon & tell it to get us a spare table
   1225   1.1     oster  * XXX
   1226   1.9     oster  * the entries in the queues should be tagged with the raidPtr
   1227   1.1     oster  * so that in the extremely rare case that two recons happen at once, we know for
   1228   1.1     oster  * which device were requesting a spare table
   1229   1.1     oster  * XXX
   1230   1.1     oster  */
   1231   1.9     oster int
   1232   1.9     oster rf_GetSpareTableFromDaemon(req)
   1233   1.9     oster 	RF_SparetWait_t *req;
   1234   1.9     oster {
   1235   1.9     oster 	int     retcode;
   1236   1.9     oster 
   1237   1.9     oster 	RF_LOCK_MUTEX(rf_sparet_wait_mutex);
   1238   1.9     oster 	req->next = rf_sparet_wait_queue;
   1239   1.9     oster 	rf_sparet_wait_queue = req;
   1240   1.9     oster 	wakeup(&rf_sparet_wait_queue);
   1241   1.9     oster 
   1242   1.9     oster 	/* mpsleep unlocks the mutex */
   1243   1.9     oster 	while (!rf_sparet_resp_queue) {
   1244   1.9     oster 		tsleep(&rf_sparet_resp_queue, PRIBIO | PCATCH,
   1245   1.9     oster 		    "raidframe getsparetable", 0);
   1246   1.1     oster #if 0
   1247   1.9     oster 		mpsleep(&rf_sparet_resp_queue, PZERO, "sparet resp", 0, (void *) simple_lock_addr(rf_sparet_wait_mutex), MS_LOCK_SIMPLE);
   1248   1.1     oster #endif
   1249   1.9     oster 	}
   1250   1.9     oster 	req = rf_sparet_resp_queue;
   1251   1.9     oster 	rf_sparet_resp_queue = req->next;
   1252   1.9     oster 	RF_UNLOCK_MUTEX(rf_sparet_wait_mutex);
   1253   1.9     oster 
   1254   1.9     oster 	retcode = req->fcol;
   1255   1.9     oster 	RF_Free(req, sizeof(*req));	/* this is not the same req as we
   1256   1.9     oster 					 * alloc'd */
   1257   1.9     oster 	return (retcode);
   1258   1.1     oster }
   1259   1.1     oster /* a wrapper around rf_DoAccess that extracts appropriate info from the bp & passes it down.
   1260   1.1     oster  * any calls originating in the kernel must use non-blocking I/O
   1261   1.1     oster  * do some extra sanity checking to return "appropriate" error values for
   1262   1.1     oster  * certain conditions (to make some standard utilities work)
   1263   1.1     oster  */
   1264   1.9     oster int
   1265   1.9     oster rf_DoAccessKernel(raidPtr, bp, flags, cbFunc, cbArg)
   1266   1.9     oster 	RF_Raid_t *raidPtr;
   1267   1.9     oster 	struct buf *bp;
   1268   1.9     oster 	RF_RaidAccessFlags_t flags;
   1269   1.9     oster 	void    (*cbFunc) (struct buf *);
   1270   1.9     oster 	void   *cbArg;
   1271   1.1     oster {
   1272   1.1     oster 	RF_SectorCount_t num_blocks, pb, sum;
   1273   1.1     oster 	RF_RaidAddr_t raid_addr;
   1274   1.9     oster 	int     retcode;
   1275   1.1     oster 	struct partition *pp;
   1276   1.9     oster 	daddr_t blocknum;
   1277   1.9     oster 	int     unit;
   1278   1.1     oster 	struct raid_softc *rs;
   1279   1.9     oster 	int     do_async;
   1280   1.1     oster 
   1281   1.1     oster 	/* XXX The dev_t used here should be for /dev/[r]raid* !!! */
   1282   1.1     oster 
   1283   1.1     oster 	unit = raidPtr->raidid;
   1284   1.1     oster 	rs = &raid_softc[unit];
   1285   1.1     oster 
   1286   1.1     oster 	/* Ok, for the bp we have here, bp->b_blkno is relative to the
   1287   1.9     oster 	 * partition.. Need to make it absolute to the underlying device.. */
   1288   1.1     oster 
   1289   1.1     oster 	blocknum = bp->b_blkno;
   1290   1.1     oster 	if (DISKPART(bp->b_dev) != RAW_PART) {
   1291   1.1     oster 		pp = &rs->sc_dkdev.dk_label->d_partitions[DISKPART(bp->b_dev)];
   1292   1.1     oster 		blocknum += pp->p_offset;
   1293   1.9     oster 		db1_printf(("updated: %d %d\n", DISKPART(bp->b_dev),
   1294   1.9     oster 			pp->p_offset));
   1295   1.1     oster 	} else {
   1296   1.1     oster 		db1_printf(("Is raw..\n"));
   1297   1.1     oster 	}
   1298   1.1     oster 	db1_printf(("Blocks: %d, %d\n", (int) bp->b_blkno, (int) blocknum));
   1299   1.1     oster 
   1300   1.9     oster 	db1_printf(("bp->b_bcount = %d\n", (int) bp->b_bcount));
   1301   1.9     oster 	db1_printf(("bp->b_resid = %d\n", (int) bp->b_resid));
   1302   1.1     oster 
   1303   1.9     oster 	/* *THIS* is where we adjust what block we're going to... but DO NOT
   1304   1.9     oster 	 * TOUCH bp->b_blkno!!! */
   1305   1.1     oster 	raid_addr = blocknum;
   1306   1.9     oster 
   1307   1.1     oster 	num_blocks = bp->b_bcount >> raidPtr->logBytesPerSector;
   1308   1.9     oster 	pb = (bp->b_bcount & raidPtr->sectorMask) ? 1 : 0;
   1309   1.1     oster 	sum = raid_addr + num_blocks + pb;
   1310   1.1     oster 	if (1 || rf_debugKernelAccess) {
   1311   1.9     oster 		db1_printf(("raid_addr=%d sum=%d num_blocks=%d(+%d) (%d)\n",
   1312   1.9     oster 			(int) raid_addr, (int) sum, (int) num_blocks,
   1313   1.9     oster 			(int) pb, (int) bp->b_resid));
   1314   1.1     oster 	}
   1315   1.1     oster 	if ((sum > raidPtr->totalSectors) || (sum < raid_addr)
   1316   1.9     oster 	    || (sum < num_blocks) || (sum < pb)) {
   1317   1.1     oster 		bp->b_error = ENOSPC;
   1318   1.1     oster 		bp->b_flags |= B_ERROR;
   1319   1.1     oster 		bp->b_resid = bp->b_bcount;
   1320   1.1     oster 		biodone(bp);
   1321   1.9     oster 		return (bp->b_error);
   1322   1.1     oster 	}
   1323   1.1     oster 	/*
   1324   1.1     oster 	 * XXX rf_DoAccess() should do this, not just DoAccessKernel()
   1325   1.1     oster 	 */
   1326   1.1     oster 
   1327   1.1     oster 	if (bp->b_bcount & raidPtr->sectorMask) {
   1328   1.1     oster 		bp->b_error = EINVAL;
   1329   1.1     oster 		bp->b_flags |= B_ERROR;
   1330   1.1     oster 		bp->b_resid = bp->b_bcount;
   1331   1.1     oster 		biodone(bp);
   1332   1.9     oster 		return (bp->b_error);
   1333   1.1     oster 	}
   1334   1.1     oster 	db1_printf(("Calling DoAccess..\n"));
   1335   1.1     oster 
   1336   1.7  explorer 	/*
   1337   1.7  explorer 	 * XXX For now, all writes are sync
   1338   1.7  explorer 	 */
   1339   1.7  explorer 	do_async = 1;
   1340   1.7  explorer 	if ((bp->b_flags & B_READ) == 0)
   1341   1.7  explorer 		do_async = 0;
   1342   1.7  explorer 
   1343   1.9     oster 	/* don't ever condition on bp->b_flags & B_WRITE.  always condition on
   1344   1.9     oster 	 * B_READ instead */
   1345   1.9     oster 	retcode = rf_DoAccess(raidPtr, (bp->b_flags & B_READ) ?
   1346   1.9     oster 	    RF_IO_TYPE_READ : RF_IO_TYPE_WRITE,
   1347   1.9     oster 	    do_async, raid_addr, num_blocks,
   1348   1.9     oster 	    bp->b_un.b_addr,
   1349   1.9     oster 	    bp, NULL, NULL, RF_DAG_NONBLOCKING_IO | flags,
   1350   1.9     oster 	    NULL, cbFunc, cbArg);
   1351   1.5     oster #if 0
   1352   1.9     oster 	db1_printf(("After call to DoAccess: 0x%x 0x%x %d\n", bp,
   1353   1.9     oster 		bp->b_data, (int) bp->b_resid));
   1354   1.5     oster #endif
   1355   1.7  explorer 
   1356   1.7  explorer 	/*
   1357   1.7  explorer 	 * If we requested sync I/O, sleep here.
   1358   1.7  explorer 	 */
   1359   1.7  explorer 	if ((retcode == 0) && (do_async == 0))
   1360   1.7  explorer 		tsleep(bp, PRIBIO, "raidsyncio", 0);
   1361   1.7  explorer 
   1362   1.9     oster 	return (retcode);
   1363   1.1     oster }
   1364   1.1     oster /* invoke an I/O from kernel mode.  Disk queue should be locked upon entry */
   1365   1.1     oster 
   1366   1.9     oster int
   1367   1.9     oster rf_DispatchKernelIO(queue, req)
   1368   1.9     oster 	RF_DiskQueue_t *queue;
   1369   1.9     oster 	RF_DiskQueueData_t *req;
   1370   1.1     oster {
   1371   1.9     oster 	int     op = (req->type == RF_IO_TYPE_READ) ? B_READ : B_WRITE;
   1372   1.1     oster 	struct buf *bp;
   1373   1.9     oster 	struct raidbuf *raidbp = NULL;
   1374   1.1     oster 	struct raid_softc *rs;
   1375   1.9     oster 	int     unit;
   1376   1.9     oster 
   1377   1.1     oster 	/* XXX along with the vnode, we also need the softc associated with
   1378   1.9     oster 	 * this device.. */
   1379   1.9     oster 
   1380   1.1     oster 	req->queue = queue;
   1381   1.9     oster 
   1382   1.1     oster 	unit = queue->raidPtr->raidid;
   1383   1.1     oster 
   1384   1.9     oster 	db1_printf(("DispatchKernelIO unit: %d\n", unit));
   1385   1.1     oster 
   1386   1.9     oster 	if (unit >= numraid) {
   1387   1.9     oster 		printf("Invalid unit number: %d %d\n", unit, numraid);
   1388   1.1     oster 		panic("Invalid Unit number in rf_DispatchKernelIO\n");
   1389   1.1     oster 	}
   1390   1.1     oster 	rs = &raid_softc[unit];
   1391   1.1     oster 
   1392   1.1     oster 	/* XXX is this the right place? */
   1393   1.9     oster 	disk_busy(&rs->sc_dkdev);
   1394   1.1     oster 
   1395   1.1     oster 	bp = req->bp;
   1396   1.1     oster 
   1397   1.9     oster 	/* XXX when there is a physical disk failure, someone is passing us a
   1398   1.9     oster 	 * buffer that contains old stuff!!  Attempt to deal with this problem
   1399   1.9     oster 	 * without taking a performance hit... (not sure where the real bug
   1400   1.9     oster 	 * is.  It's buried in RAIDframe somewhere) :-(  GO ) */
   1401   1.4     oster 
   1402   1.4     oster 	if (bp->b_flags & B_ERROR) {
   1403   1.4     oster 		bp->b_flags &= ~B_ERROR;
   1404   1.4     oster 	}
   1405   1.9     oster 	if (bp->b_error != 0) {
   1406   1.4     oster 		bp->b_error = 0;
   1407   1.4     oster 	}
   1408   1.1     oster 	raidbp = RAIDGETBUF(rs);
   1409   1.1     oster 
   1410   1.9     oster 	raidbp->rf_flags = 0;	/* XXX not really used anywhere... */
   1411   1.1     oster 
   1412   1.1     oster 	/*
   1413   1.1     oster 	 * context for raidiodone
   1414   1.1     oster 	 */
   1415   1.1     oster 	raidbp->rf_obp = bp;
   1416   1.1     oster 	raidbp->req = req;
   1417   1.1     oster 
   1418   1.1     oster 	switch (req->type) {
   1419   1.9     oster 	case RF_IO_TYPE_NOP:	/* used primarily to unlock a locked queue */
   1420   1.9     oster 		/* Dprintf2("rf_DispatchKernelIO: NOP to r %d c %d\n",
   1421   1.9     oster 		 * queue->row, queue->col); */
   1422   1.1     oster 		/* XXX need to do something extra here.. */
   1423   1.9     oster 		/* I'm leaving this in, as I've never actually seen it used,
   1424   1.9     oster 		 * and I'd like folks to report it... GO */
   1425   1.1     oster 		printf(("WAKEUP CALLED\n"));
   1426   1.1     oster 		queue->numOutstanding++;
   1427   1.1     oster 
   1428   1.1     oster 		/* XXX need to glue the original buffer into this??  */
   1429   1.1     oster 
   1430   1.1     oster 		KernelWakeupFunc(&raidbp->rf_buf);
   1431   1.1     oster 		break;
   1432   1.9     oster 
   1433   1.1     oster 	case RF_IO_TYPE_READ:
   1434   1.1     oster 	case RF_IO_TYPE_WRITE:
   1435   1.9     oster 
   1436   1.1     oster 		if (req->tracerec) {
   1437   1.1     oster 			RF_ETIMER_START(req->tracerec->timer);
   1438   1.1     oster 		}
   1439   1.9     oster 		InitBP(&raidbp->rf_buf, queue->rf_cinfo->ci_vp,
   1440   1.9     oster 		    op | bp->b_flags, queue->rf_cinfo->ci_dev,
   1441   1.9     oster 		    req->sectorOffset, req->numSector,
   1442   1.9     oster 		    req->buf, KernelWakeupFunc, (void *) req,
   1443   1.9     oster 		    queue->raidPtr->logBytesPerSector, req->b_proc);
   1444   1.1     oster 
   1445   1.1     oster 		if (rf_debugKernelAccess) {
   1446   1.9     oster 			db1_printf(("dispatch: bp->b_blkno = %ld\n",
   1447   1.9     oster 				(long) bp->b_blkno));
   1448   1.1     oster 		}
   1449   1.1     oster 		queue->numOutstanding++;
   1450   1.1     oster 		queue->last_deq_sector = req->sectorOffset;
   1451   1.9     oster 		/* acc wouldn't have been let in if there were any pending
   1452   1.9     oster 		 * reqs at any other priority */
   1453   1.1     oster 		queue->curPriority = req->priority;
   1454   1.9     oster 		/* Dprintf3("rf_DispatchKernelIO: %c to row %d col %d\n",
   1455   1.9     oster 		 * req->type, queue->row, queue->col); */
   1456   1.1     oster 
   1457   1.1     oster 		db1_printf(("Going for %c to unit %d row %d col %d\n",
   1458   1.9     oster 			req->type, unit, queue->row, queue->col));
   1459   1.1     oster 		db1_printf(("sector %d count %d (%d bytes) %d\n",
   1460   1.9     oster 			(int) req->sectorOffset, (int) req->numSector,
   1461   1.9     oster 			(int) (req->numSector <<
   1462   1.9     oster 			    queue->raidPtr->logBytesPerSector),
   1463   1.9     oster 			(int) queue->raidPtr->logBytesPerSector));
   1464   1.1     oster 		if ((raidbp->rf_buf.b_flags & B_READ) == 0) {
   1465   1.1     oster 			raidbp->rf_buf.b_vp->v_numoutput++;
   1466   1.1     oster 		}
   1467   1.9     oster 		VOP_STRATEGY(&raidbp->rf_buf);
   1468   1.1     oster 
   1469   1.1     oster 		break;
   1470   1.9     oster 
   1471   1.1     oster 	default:
   1472   1.1     oster 		panic("bad req->type in rf_DispatchKernelIO");
   1473   1.1     oster 	}
   1474   1.1     oster 	db1_printf(("Exiting from DispatchKernelIO\n"));
   1475   1.9     oster 	return (0);
   1476   1.1     oster }
   1477   1.9     oster /* this is the callback function associated with a I/O invoked from
   1478   1.1     oster    kernel code.
   1479   1.1     oster  */
   1480   1.9     oster static void
   1481   1.9     oster KernelWakeupFunc(vbp)
   1482   1.9     oster 	struct buf *vbp;
   1483   1.9     oster {
   1484   1.9     oster 	RF_DiskQueueData_t *req = NULL;
   1485   1.9     oster 	RF_DiskQueue_t *queue;
   1486   1.9     oster 	struct raidbuf *raidbp = (struct raidbuf *) vbp;
   1487   1.9     oster 	struct buf *bp;
   1488   1.9     oster 	struct raid_softc *rs;
   1489   1.9     oster 	int     unit;
   1490   1.9     oster 	register int s;
   1491   1.9     oster 
   1492   1.9     oster 	s = splbio();		/* XXX */
   1493   1.9     oster 	db1_printf(("recovering the request queue:\n"));
   1494   1.9     oster 	req = raidbp->req;
   1495   1.1     oster 
   1496   1.9     oster 	bp = raidbp->rf_obp;
   1497   1.5     oster #if 0
   1498   1.9     oster 	db1_printf(("bp=0x%x\n", bp));
   1499   1.5     oster #endif
   1500   1.1     oster 
   1501   1.9     oster 	queue = (RF_DiskQueue_t *) req->queue;
   1502   1.1     oster 
   1503   1.9     oster 	if (raidbp->rf_buf.b_flags & B_ERROR) {
   1504   1.1     oster #if 0
   1505   1.9     oster 		printf("Setting bp->b_flags!!! %d\n", raidbp->rf_buf.b_error);
   1506   1.1     oster #endif
   1507   1.9     oster 		bp->b_flags |= B_ERROR;
   1508   1.9     oster 		bp->b_error = raidbp->rf_buf.b_error ?
   1509   1.9     oster 		    raidbp->rf_buf.b_error : EIO;
   1510   1.9     oster 	}
   1511   1.5     oster #if 0
   1512   1.9     oster 	db1_printf(("raidbp->rf_buf.b_bcount=%d\n", (int) raidbp->rf_buf.b_bcount));
   1513   1.9     oster 	db1_printf(("raidbp->rf_buf.b_bufsize=%d\n", (int) raidbp->rf_buf.b_bufsize));
   1514   1.9     oster 	db1_printf(("raidbp->rf_buf.b_resid=%d\n", (int) raidbp->rf_buf.b_resid));
   1515   1.9     oster 	db1_printf(("raidbp->rf_buf.b_data=0x%x\n", raidbp->rf_buf.b_data));
   1516   1.5     oster #endif
   1517   1.1     oster 
   1518   1.9     oster 	/* XXX methinks this could be wrong... */
   1519   1.1     oster #if 1
   1520   1.9     oster 	bp->b_resid = raidbp->rf_buf.b_resid;
   1521   1.1     oster #endif
   1522   1.1     oster 
   1523   1.9     oster 	if (req->tracerec) {
   1524   1.9     oster 		RF_ETIMER_STOP(req->tracerec->timer);
   1525   1.9     oster 		RF_ETIMER_EVAL(req->tracerec->timer);
   1526   1.9     oster 		RF_LOCK_MUTEX(rf_tracing_mutex);
   1527   1.9     oster 		req->tracerec->diskwait_us += RF_ETIMER_VAL_US(req->tracerec->timer);
   1528   1.9     oster 		req->tracerec->phys_io_us += RF_ETIMER_VAL_US(req->tracerec->timer);
   1529   1.9     oster 		req->tracerec->num_phys_ios++;
   1530   1.9     oster 		RF_UNLOCK_MUTEX(rf_tracing_mutex);
   1531   1.9     oster 	}
   1532   1.9     oster 	bp->b_bcount = raidbp->rf_buf.b_bcount;	/* XXXX ?? */
   1533   1.1     oster 
   1534   1.9     oster 	unit = queue->raidPtr->raidid;	/* *Much* simpler :-> */
   1535   1.1     oster 
   1536   1.1     oster 
   1537   1.9     oster 	/* XXX Ok, let's get aggressive... If B_ERROR is set, let's go
   1538   1.9     oster 	 * ballistic, and mark the component as hosed... */
   1539   1.9     oster #if 1
   1540   1.9     oster 	if (bp->b_flags & B_ERROR) {
   1541   1.9     oster 		/* Mark the disk as dead */
   1542   1.9     oster 		/* but only mark it once... */
   1543   1.9     oster 		if (queue->raidPtr->Disks[queue->row][queue->col].status ==
   1544   1.9     oster 		    rf_ds_optimal) {
   1545   1.9     oster 			printf("raid%d: IO Error.  Marking %s as failed.\n",
   1546   1.9     oster 			    unit, queue->raidPtr->Disks[queue->row][queue->col].devname);
   1547   1.9     oster 			queue->raidPtr->Disks[queue->row][queue->col].status =
   1548   1.9     oster 			    rf_ds_failed;
   1549   1.9     oster 			queue->raidPtr->status[queue->row] = rf_rs_degraded;
   1550   1.9     oster 			queue->raidPtr->numFailures++;
   1551   1.9     oster 		} else {	/* Disk is already dead... */
   1552   1.9     oster 			/* printf("Disk already marked as dead!\n"); */
   1553   1.9     oster 		}
   1554   1.4     oster 
   1555   1.9     oster 	}
   1556   1.4     oster #endif
   1557   1.4     oster 
   1558   1.9     oster 	rs = &raid_softc[unit];
   1559   1.9     oster 	RAIDPUTBUF(rs, raidbp);
   1560   1.9     oster 
   1561   1.4     oster 
   1562   1.9     oster 	if (bp->b_resid == 0) {
   1563   1.9     oster 		db1_printf(("Disk is no longer busy for this buffer... %d %ld %ld\n",
   1564   1.9     oster 			unit, bp->b_resid, bp->b_bcount));
   1565   1.9     oster 		/* XXX is this the right place for a disk_unbusy()??!??!?!? */
   1566   1.9     oster 		disk_unbusy(&rs->sc_dkdev, (bp->b_bcount - bp->b_resid));
   1567   1.9     oster 	} else {
   1568   1.9     oster 		db1_printf(("b_resid is still %ld\n", bp->b_resid));
   1569   1.9     oster 	}
   1570   1.1     oster 
   1571   1.9     oster 	rf_DiskIOComplete(queue, req, (bp->b_flags & B_ERROR) ? 1 : 0);
   1572   1.9     oster 	(req->CompleteFunc) (req->argument, (bp->b_flags & B_ERROR) ? 1 : 0);
   1573   1.9     oster 	/* printf("Exiting KernelWakeupFunc\n"); */
   1574   1.1     oster 
   1575   1.9     oster 	splx(s);		/* XXX */
   1576   1.1     oster }
   1577   1.1     oster 
   1578   1.1     oster 
   1579   1.1     oster 
   1580   1.1     oster /*
   1581   1.1     oster  * initialize a buf structure for doing an I/O in the kernel.
   1582   1.1     oster  */
   1583   1.9     oster static void
   1584   1.9     oster InitBP(
   1585   1.9     oster     struct buf * bp,
   1586   1.9     oster     struct vnode * b_vp,
   1587   1.9     oster     unsigned rw_flag,
   1588   1.9     oster     dev_t dev,
   1589   1.9     oster     RF_SectorNum_t startSect,
   1590   1.9     oster     RF_SectorCount_t numSect,
   1591   1.9     oster     caddr_t buf,
   1592   1.9     oster     void (*cbFunc) (struct buf *),
   1593   1.9     oster     void *cbArg,
   1594   1.9     oster     int logBytesPerSector,
   1595   1.9     oster     struct proc * b_proc)
   1596   1.9     oster {
   1597   1.9     oster 	/* bp->b_flags       = B_PHYS | rw_flag; */
   1598   1.9     oster 	bp->b_flags = B_CALL | rw_flag;	/* XXX need B_PHYS here too??? */
   1599   1.9     oster 	bp->b_bcount = numSect << logBytesPerSector;
   1600   1.9     oster 	bp->b_bufsize = bp->b_bcount;
   1601   1.9     oster 	bp->b_error = 0;
   1602   1.9     oster 	bp->b_dev = dev;
   1603   1.1     oster 	db1_printf(("bp->b_dev is %d\n", dev));
   1604   1.9     oster 	bp->b_un.b_addr = buf;
   1605   1.5     oster #if 0
   1606   1.9     oster 	db1_printf(("bp->b_data=0x%x\n", bp->b_data));
   1607   1.5     oster #endif
   1608   1.1     oster 
   1609   1.9     oster 	bp->b_blkno = startSect;
   1610   1.9     oster 	bp->b_resid = bp->b_bcount;	/* XXX is this right!??!?!! */
   1611   1.9     oster 	db1_printf(("b_bcount is: %d\n", (int) bp->b_bcount));
   1612   1.1     oster 	if (bp->b_bcount == 0) {
   1613   1.1     oster 		panic("bp->b_bcount is zero in InitBP!!\n");
   1614   1.1     oster 	}
   1615   1.9     oster 	bp->b_proc = b_proc;
   1616   1.9     oster 	bp->b_iodone = cbFunc;
   1617   1.9     oster 	bp->b_vp = b_vp;
   1618   1.9     oster 
   1619   1.1     oster }
   1620   1.1     oster /* Extras... */
   1621   1.1     oster 
   1622   1.9     oster unsigned int
   1623   1.9     oster rpcc()
   1624   1.1     oster {
   1625   1.9     oster 	/* XXX no clue what this is supposed to do.. my guess is that it's
   1626   1.9     oster 	 * supposed to read the CPU cycle counter... */
   1627   1.9     oster 	/* db1_printf("this is supposed to do something useful too!??\n"); */
   1628   1.9     oster 	return (0);
   1629   1.1     oster }
   1630   1.1     oster #if 0
   1631   1.9     oster int
   1632   1.9     oster rf_GetSpareTableFromDaemon(req)
   1633   1.9     oster 	RF_SparetWait_t *req;
   1634   1.1     oster {
   1635   1.9     oster 	int     retcode = 1;
   1636   1.9     oster 	printf("This is supposed to do something useful!!\n");	/* XXX */
   1637   1.9     oster 
   1638   1.9     oster 	return (retcode);
   1639   1.1     oster 
   1640   1.1     oster }
   1641   1.1     oster #endif
   1642   1.1     oster 
   1643   1.1     oster static void
   1644   1.1     oster raidgetdefaultlabel(raidPtr, rs, lp)
   1645   1.1     oster 	RF_Raid_t *raidPtr;
   1646   1.1     oster 	struct raid_softc *rs;
   1647   1.1     oster 	struct disklabel *lp;
   1648   1.1     oster {
   1649   1.1     oster 	db1_printf(("Building a default label...\n"));
   1650   1.1     oster 	bzero(lp, sizeof(*lp));
   1651   1.1     oster 
   1652   1.1     oster 	/* fabricate a label... */
   1653   1.1     oster 	lp->d_secperunit = raidPtr->totalSectors;
   1654   1.1     oster 	lp->d_secsize = raidPtr->bytesPerSector;
   1655   1.1     oster 	lp->d_nsectors = 1024 * (1024 / raidPtr->bytesPerSector);
   1656   1.1     oster 	lp->d_ntracks = 1;
   1657   1.1     oster 	lp->d_ncylinders = raidPtr->totalSectors / lp->d_nsectors;
   1658   1.1     oster 	lp->d_secpercyl = lp->d_ntracks * lp->d_nsectors;
   1659   1.1     oster 
   1660   1.1     oster 	strncpy(lp->d_typename, "raid", sizeof(lp->d_typename));
   1661   1.9     oster 	lp->d_type = DTYPE_RAID;
   1662   1.1     oster 	strncpy(lp->d_packname, "fictitious", sizeof(lp->d_packname));
   1663   1.1     oster 	lp->d_rpm = 3600;
   1664   1.1     oster 	lp->d_interleave = 1;
   1665   1.1     oster 	lp->d_flags = 0;
   1666   1.1     oster 
   1667   1.1     oster 	lp->d_partitions[RAW_PART].p_offset = 0;
   1668   1.1     oster 	lp->d_partitions[RAW_PART].p_size = raidPtr->totalSectors;
   1669   1.1     oster 	lp->d_partitions[RAW_PART].p_fstype = FS_UNUSED;
   1670   1.1     oster 	lp->d_npartitions = RAW_PART + 1;
   1671   1.1     oster 
   1672   1.1     oster 	lp->d_magic = DISKMAGIC;
   1673   1.1     oster 	lp->d_magic2 = DISKMAGIC;
   1674   1.1     oster 	lp->d_checksum = dkcksum(rs->sc_dkdev.dk_label);
   1675   1.1     oster 
   1676   1.1     oster }
   1677   1.1     oster /*
   1678   1.1     oster  * Read the disklabel from the raid device.  If one is not present, fake one
   1679   1.1     oster  * up.
   1680   1.1     oster  */
   1681   1.1     oster static void
   1682   1.1     oster raidgetdisklabel(dev)
   1683   1.9     oster 	dev_t   dev;
   1684   1.1     oster {
   1685   1.9     oster 	int     unit = raidunit(dev);
   1686   1.1     oster 	struct raid_softc *rs = &raid_softc[unit];
   1687   1.9     oster 	char   *errstring;
   1688   1.1     oster 	struct disklabel *lp = rs->sc_dkdev.dk_label;
   1689   1.1     oster 	struct cpu_disklabel *clp = rs->sc_dkdev.dk_cpulabel;
   1690   1.1     oster 	RF_Raid_t *raidPtr;
   1691   1.1     oster 
   1692   1.1     oster 	db1_printf(("Getting the disklabel...\n"));
   1693   1.1     oster 
   1694   1.1     oster 	bzero(clp, sizeof(*clp));
   1695   1.1     oster 
   1696   1.1     oster 	raidPtr = raidPtrs[unit];
   1697   1.1     oster 
   1698   1.1     oster 	raidgetdefaultlabel(raidPtr, rs, lp);
   1699   1.1     oster 
   1700   1.1     oster 	/*
   1701   1.1     oster 	 * Call the generic disklabel extraction routine.
   1702   1.1     oster 	 */
   1703   1.1     oster 	errstring = readdisklabel(RAIDLABELDEV(dev), raidstrategy,
   1704   1.1     oster 	    rs->sc_dkdev.dk_label, rs->sc_dkdev.dk_cpulabel);
   1705   1.9     oster 	if (errstring)
   1706   1.1     oster 		raidmakedisklabel(rs);
   1707   1.1     oster 	else {
   1708   1.9     oster 		int     i;
   1709   1.1     oster 		struct partition *pp;
   1710   1.1     oster 
   1711   1.1     oster 		/*
   1712   1.1     oster 		 * Sanity check whether the found disklabel is valid.
   1713   1.1     oster 		 *
   1714   1.1     oster 		 * This is necessary since total size of the raid device
   1715   1.1     oster 		 * may vary when an interleave is changed even though exactly
   1716   1.1     oster 		 * same componets are used, and old disklabel may used
   1717   1.1     oster 		 * if that is found.
   1718   1.1     oster 		 */
   1719   1.1     oster 		if (lp->d_secperunit != rs->sc_size)
   1720   1.1     oster 			printf("WARNING: %s: "
   1721   1.1     oster 			    "total sector size in disklabel (%d) != "
   1722   1.1     oster 			    "the size of raid (%d)\n", rs->sc_xname,
   1723   1.1     oster 			    lp->d_secperunit, rs->sc_size);
   1724   1.1     oster 		for (i = 0; i < lp->d_npartitions; i++) {
   1725   1.1     oster 			pp = &lp->d_partitions[i];
   1726   1.1     oster 			if (pp->p_offset + pp->p_size > rs->sc_size)
   1727   1.1     oster 				printf("WARNING: %s: end of partition `%c' "
   1728   1.1     oster 				    "exceeds the size of raid (%d)\n",
   1729   1.1     oster 				    rs->sc_xname, 'a' + i, rs->sc_size);
   1730   1.1     oster 		}
   1731   1.1     oster 	}
   1732   1.1     oster 
   1733   1.1     oster }
   1734   1.1     oster /*
   1735   1.1     oster  * Take care of things one might want to take care of in the event
   1736   1.1     oster  * that a disklabel isn't present.
   1737   1.1     oster  */
   1738   1.1     oster static void
   1739   1.1     oster raidmakedisklabel(rs)
   1740   1.1     oster 	struct raid_softc *rs;
   1741   1.1     oster {
   1742   1.1     oster 	struct disklabel *lp = rs->sc_dkdev.dk_label;
   1743   1.1     oster 	db1_printf(("Making a label..\n"));
   1744   1.1     oster 
   1745   1.1     oster 	/*
   1746   1.1     oster 	 * For historical reasons, if there's no disklabel present
   1747   1.1     oster 	 * the raw partition must be marked FS_BSDFFS.
   1748   1.1     oster 	 */
   1749   1.1     oster 
   1750   1.1     oster 	lp->d_partitions[RAW_PART].p_fstype = FS_BSDFFS;
   1751   1.1     oster 
   1752   1.1     oster 	strncpy(lp->d_packname, "default label", sizeof(lp->d_packname));
   1753   1.1     oster 
   1754   1.1     oster 	lp->d_checksum = dkcksum(lp);
   1755   1.1     oster }
   1756   1.1     oster /*
   1757   1.1     oster  * Lookup the provided name in the filesystem.  If the file exists,
   1758   1.1     oster  * is a valid block device, and isn't being used by anyone else,
   1759   1.1     oster  * set *vpp to the file's vnode.
   1760   1.9     oster  * You'll find the original of this in ccd.c
   1761   1.1     oster  */
   1762   1.1     oster int
   1763   1.1     oster raidlookup(path, p, vpp)
   1764   1.9     oster 	char   *path;
   1765   1.1     oster 	struct proc *p;
   1766   1.1     oster 	struct vnode **vpp;	/* result */
   1767   1.1     oster {
   1768   1.1     oster 	struct nameidata nd;
   1769   1.1     oster 	struct vnode *vp;
   1770   1.1     oster 	struct vattr va;
   1771   1.9     oster 	int     error;
   1772   1.1     oster 
   1773   1.1     oster 	NDINIT(&nd, LOOKUP, FOLLOW, UIO_SYSSPACE, path, p);
   1774   1.9     oster 	if ((error = vn_open(&nd, FREAD | FWRITE, 0)) != 0) {
   1775   1.1     oster #ifdef DEBUG
   1776   1.9     oster 		printf("RAIDframe: vn_open returned %d\n", error);
   1777   1.1     oster #endif
   1778   1.1     oster 		return (error);
   1779   1.1     oster 	}
   1780   1.1     oster 	vp = nd.ni_vp;
   1781   1.1     oster 	if (vp->v_usecount > 1) {
   1782   1.1     oster 		VOP_UNLOCK(vp, 0);
   1783   1.9     oster 		(void) vn_close(vp, FREAD | FWRITE, p->p_ucred, p);
   1784   1.1     oster 		return (EBUSY);
   1785   1.1     oster 	}
   1786   1.1     oster 	if ((error = VOP_GETATTR(vp, &va, p->p_ucred, p)) != 0) {
   1787   1.1     oster 		VOP_UNLOCK(vp, 0);
   1788   1.9     oster 		(void) vn_close(vp, FREAD | FWRITE, p->p_ucred, p);
   1789   1.1     oster 		return (error);
   1790   1.1     oster 	}
   1791   1.1     oster 	/* XXX: eventually we should handle VREG, too. */
   1792   1.1     oster 	if (va.va_type != VBLK) {
   1793   1.1     oster 		VOP_UNLOCK(vp, 0);
   1794   1.9     oster 		(void) vn_close(vp, FREAD | FWRITE, p->p_ucred, p);
   1795   1.1     oster 		return (ENOTBLK);
   1796   1.1     oster 	}
   1797   1.1     oster 	VOP_UNLOCK(vp, 0);
   1798   1.1     oster 	*vpp = vp;
   1799   1.1     oster 	return (0);
   1800   1.1     oster }
   1801   1.1     oster /*
   1802   1.1     oster  * Wait interruptibly for an exclusive lock.
   1803   1.1     oster  *
   1804   1.1     oster  * XXX
   1805   1.1     oster  * Several drivers do this; it should be abstracted and made MP-safe.
   1806   1.1     oster  * (Hmm... where have we seen this warning before :->  GO )
   1807   1.1     oster  */
   1808   1.1     oster static int
   1809   1.1     oster raidlock(rs)
   1810   1.1     oster 	struct raid_softc *rs;
   1811   1.1     oster {
   1812   1.9     oster 	int     error;
   1813   1.1     oster 
   1814   1.1     oster 	while ((rs->sc_flags & RAIDF_LOCKED) != 0) {
   1815   1.1     oster 		rs->sc_flags |= RAIDF_WANTED;
   1816   1.9     oster 		if ((error =
   1817   1.9     oster 			tsleep(rs, PRIBIO | PCATCH, "raidlck", 0)) != 0)
   1818   1.1     oster 			return (error);
   1819   1.1     oster 	}
   1820   1.1     oster 	rs->sc_flags |= RAIDF_LOCKED;
   1821   1.1     oster 	return (0);
   1822   1.1     oster }
   1823   1.1     oster /*
   1824   1.1     oster  * Unlock and wake up any waiters.
   1825   1.1     oster  */
   1826   1.1     oster static void
   1827   1.1     oster raidunlock(rs)
   1828   1.1     oster 	struct raid_softc *rs;
   1829   1.1     oster {
   1830   1.1     oster 
   1831   1.1     oster 	rs->sc_flags &= ~RAIDF_LOCKED;
   1832   1.1     oster 	if ((rs->sc_flags & RAIDF_WANTED) != 0) {
   1833   1.1     oster 		rs->sc_flags &= ~RAIDF_WANTED;
   1834   1.1     oster 		wakeup(rs);
   1835   1.1     oster 	}
   1836   1.1     oster }
   1837