Home | History | Annotate | Line # | Download | only in ata
ld_ataraid.c revision 1.39
      1  1.39       tls /*	$NetBSD: ld_ataraid.c,v 1.39 2012/02/02 19:43:02 tls Exp $	*/
      2   1.1   thorpej 
      3   1.1   thorpej /*
      4   1.1   thorpej  * Copyright (c) 2003 Wasabi Systems, Inc.
      5   1.1   thorpej  * All rights reserved.
      6   1.1   thorpej  *
      7   1.1   thorpej  * Written by Jason R. Thorpe for Wasabi Systems, Inc.
      8   1.1   thorpej  *
      9   1.1   thorpej  * Redistribution and use in source and binary forms, with or without
     10   1.1   thorpej  * modification, are permitted provided that the following conditions
     11   1.1   thorpej  * are met:
     12   1.1   thorpej  * 1. Redistributions of source code must retain the above copyright
     13   1.1   thorpej  *    notice, this list of conditions and the following disclaimer.
     14   1.1   thorpej  * 2. Redistributions in binary form must reproduce the above copyright
     15   1.1   thorpej  *    notice, this list of conditions and the following disclaimer in the
     16   1.1   thorpej  *    documentation and/or other materials provided with the distribution.
     17   1.1   thorpej  * 3. All advertising materials mentioning features or use of this software
     18   1.1   thorpej  *    must display the following acknowledgement:
     19   1.1   thorpej  *	This product includes software developed for the NetBSD Project by
     20   1.1   thorpej  *	Wasabi Systems, Inc.
     21   1.1   thorpej  * 4. The name of Wasabi Systems, Inc. may not be used to endorse
     22   1.1   thorpej  *    or promote products derived from this software without specific prior
     23   1.1   thorpej  *    written permission.
     24   1.1   thorpej  *
     25   1.1   thorpej  * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
     26   1.1   thorpej  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     27   1.1   thorpej  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     28   1.1   thorpej  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL WASABI SYSTEMS, INC
     29   1.1   thorpej  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     30   1.1   thorpej  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     31   1.1   thorpej  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     32   1.1   thorpej  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     33   1.1   thorpej  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     34   1.1   thorpej  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     35   1.1   thorpej  * POSSIBILITY OF SUCH DAMAGE.
     36   1.1   thorpej  */
     37   1.1   thorpej 
     38   1.1   thorpej /*
     39   1.1   thorpej  * Support for ATA RAID logical disks.
     40   1.1   thorpej  *
     41   1.1   thorpej  * Note that all the RAID happens in software here; the ATA RAID
     42   1.1   thorpej  * controllers we're dealing with (Promise, etc.) only support
     43   1.1   thorpej  * configuration data on the component disks, with the BIOS supporting
     44   1.1   thorpej  * booting from the RAID volumes.
     45  1.33  wrstuden  *
     46  1.30      tron  * bio(4) support was written by Juan Romero Pardines <xtraeme (at) gmail.com>.
     47   1.1   thorpej  */
     48   1.8     lukem 
     49   1.8     lukem #include <sys/cdefs.h>
     50  1.39       tls __KERNEL_RCSID(0, "$NetBSD: ld_ataraid.c,v 1.39 2012/02/02 19:43:02 tls Exp $");
     51   1.1   thorpej 
     52  1.30      tron #include "bio.h"
     53  1.39       tls 
     54   1.1   thorpej 
     55   1.1   thorpej #include <sys/param.h>
     56   1.1   thorpej #include <sys/systm.h>
     57   1.1   thorpej #include <sys/conf.h>
     58   1.1   thorpej #include <sys/kernel.h>
     59   1.1   thorpej #include <sys/device.h>
     60   1.1   thorpej #include <sys/buf.h>
     61  1.13      yamt #include <sys/bufq.h>
     62   1.1   thorpej #include <sys/dkio.h>
     63   1.1   thorpej #include <sys/disk.h>
     64   1.1   thorpej #include <sys/disklabel.h>
     65   1.1   thorpej #include <sys/fcntl.h>
     66   1.1   thorpej #include <sys/malloc.h>
     67   1.1   thorpej #include <sys/vnode.h>
     68  1.16      elad #include <sys/kauth.h>
     69   1.1   thorpej #include <sys/rnd.h>
     70  1.30      tron #if NBIO > 0
     71  1.30      tron #include <dev/ata/atavar.h>
     72  1.30      tron #include <dev/ata/atareg.h>
     73  1.30      tron #include <dev/ata/wdvar.h>
     74  1.30      tron #include <dev/biovar.h>
     75  1.30      tron #include <dev/scsipi/scsipiconf.h> /* for scsipi_strvis() */
     76  1.30      tron #endif
     77   1.1   thorpej 
     78   1.1   thorpej #include <miscfs/specfs/specdev.h>
     79   1.1   thorpej 
     80   1.1   thorpej #include <dev/ldvar.h>
     81   1.1   thorpej 
     82   1.1   thorpej #include <dev/ata/ata_raidvar.h>
     83   1.1   thorpej 
/*
 * Per-instance state for an ATA RAID logical disk.
 */
struct ld_ataraid_softc {
	/*
	 * Embedded struct ld_softc.  Keep this first: the start routines
	 * turn a struct ld_softc pointer back into this structure with a
	 * plain cast.
	 */
	struct ld_softc sc_ld;

	/* Array description passed to attach as `aux'; referenced, not copied. */
	struct ataraid_array_info *sc_aai;
	/* Vnode of each component disk, indexed by component number. */
	struct vnode *sc_vnodes[ATA_RAID_MAX_DISKS];

	/* Completion callback installed on every component buf. */
	void	(*sc_iodone)(struct buf *);

	/* Pool cache that struct cbuf objects are allocated from. */
	pool_cache_t sc_cbufpool;

	/* Component bufs queued for the soft interrupt to issue. */
	SIMPLEQ_HEAD(, cbuf) sc_cbufq;

	/* Handle returned by softint_establish(). */
	void	*sc_sih_cookie;
};
     98   1.1   thorpej 
     99  1.35    cegger static int	ld_ataraid_match(device_t, cfdata_t, void *);
    100  1.35    cegger static void	ld_ataraid_attach(device_t, device_t, void *);
    101   1.1   thorpej 
    102   1.1   thorpej static int	ld_ataraid_dump(struct ld_softc *, void *, int, int);
    103   1.1   thorpej 
    104  1.36       bsh static int     cbufpool_ctor(void *, void *, int);
    105  1.36       bsh static void    cbufpool_dtor(void *, void *);
    106  1.36       bsh 
    107  1.36       bsh static void    ld_ataraid_start_vstrategy(void *);
    108   1.1   thorpej static int	ld_ataraid_start_span(struct ld_softc *, struct buf *);
    109   1.1   thorpej 
    110   1.1   thorpej static int	ld_ataraid_start_raid0(struct ld_softc *, struct buf *);
    111   1.1   thorpej static void	ld_ataraid_iodone_raid0(struct buf *);
    112   1.1   thorpej 
    113  1.30      tron #if NBIO > 0
    114  1.30      tron static int	ld_ataraid_bioctl(device_t, u_long, void *);
    115  1.30      tron static int	ld_ataraid_bioinq(struct ld_ataraid_softc *, struct bioc_inq *);
    116  1.30      tron static int	ld_ataraid_biovol(struct ld_ataraid_softc *, struct bioc_vol *);
    117  1.30      tron static int	ld_ataraid_biodisk(struct ld_ataraid_softc *,
    118  1.30      tron 				   struct bioc_disk *);
    119  1.30      tron #endif
    120  1.30      tron 
    121  1.27   xtraeme CFATTACH_DECL_NEW(ld_ataraid, sizeof(struct ld_ataraid_softc),
    122   1.1   thorpej     ld_ataraid_match, ld_ataraid_attach, NULL, NULL);
    123   1.1   thorpej 
/*
 * Component buffer: one per-component I/O carved out of an original
 * request.  cb_buf must stay the first member because the iodone
 * callback receives a struct buf pointer and casts it back to a
 * struct cbuf pointer.
 */
struct cbuf {
	struct buf	cb_buf;		/* new I/O buf */
	struct buf	*cb_obp;	/* ptr. to original I/O buf */
	struct ld_ataraid_softc *cb_sc;	/* pointer to ld softc */
	u_int		cb_comp;	/* target component */
	SIMPLEQ_ENTRY(cbuf) cb_q;	/* fifo of component buffers */
	struct cbuf	*cb_other;	/* other cbuf in case of mirror */
	int		cb_flags;	/* CBUF_* flags below */
#define	CBUF_IODONE	0x00000001	/* I/O is already successfully done */
};
    134   1.1   thorpej 
/*
 * Component buffer allocation helpers.  Both expand to an expression and
 * rely on a variable named `sc' (a struct ld_ataraid_softc pointer) being
 * in scope at the point of use.  CBUF_GET() allocates with PR_NOWAIT and
 * its callers check the result for NULL.
 *
 * Neither macro ends in a semicolon, so they can be used inside larger
 * expressions as well as in statement position.
 */
#define	CBUF_GET()	pool_cache_get(sc->sc_cbufpool, PR_NOWAIT)
#define	CBUF_PUT(cbp)	pool_cache_put(sc->sc_cbufpool, (cbp))
    137   1.1   thorpej 
    138   1.1   thorpej static int
    139  1.27   xtraeme ld_ataraid_match(device_t parent, cfdata_t match, void *aux)
    140   1.1   thorpej {
    141   1.1   thorpej 
    142   1.1   thorpej 	return (1);
    143   1.1   thorpej }
    144   1.1   thorpej 
    145   1.1   thorpej static void
    146  1.27   xtraeme ld_ataraid_attach(device_t parent, device_t self, void *aux)
    147   1.1   thorpej {
    148  1.27   xtraeme 	struct ld_ataraid_softc *sc = device_private(self);
    149   1.1   thorpej 	struct ld_softc *ld = &sc->sc_ld;
    150   1.1   thorpej 	struct ataraid_array_info *aai = aux;
    151  1.32      tron 	struct ataraid_disk_info *adi = NULL;
    152   1.1   thorpej 	const char *level;
    153   1.1   thorpej 	struct vnode *vp;
    154   1.1   thorpej 	char unklev[32];
    155   1.1   thorpej 	u_int i;
    156   1.1   thorpej 
    157  1.29      tron 	ld->sc_dv = self;
    158  1.29      tron 
    159  1.36       bsh        sc->sc_cbufpool = pool_cache_init(sizeof(struct cbuf), 0,
    160  1.36       bsh            0, 0, "ldcbuf", NULL, IPL_BIO, cbufpool_ctor, cbufpool_dtor, sc);
    161  1.36       bsh        sc->sc_sih_cookie = softint_establish(SOFTINT_BIO,
    162  1.36       bsh            ld_ataraid_start_vstrategy, sc);
    163   1.1   thorpej 
    164   1.1   thorpej 	sc->sc_aai = aai;	/* this data persists */
    165   1.1   thorpej 
    166   1.1   thorpej 	ld->sc_maxxfer = MAXPHYS * aai->aai_width;	/* XXX */
    167   1.1   thorpej 	ld->sc_secperunit = aai->aai_capacity;
    168   1.1   thorpej 	ld->sc_secsize = 512;				/* XXX */
    169   1.1   thorpej 	ld->sc_maxqueuecnt = 128;			/* XXX */
    170   1.1   thorpej 	ld->sc_dump = ld_ataraid_dump;
    171   1.1   thorpej 
    172   1.1   thorpej 	switch (aai->aai_level) {
    173   1.1   thorpej 	case AAI_L_SPAN:
    174   1.1   thorpej 		level = "SPAN";
    175   1.1   thorpej 		ld->sc_start = ld_ataraid_start_span;
    176   1.1   thorpej 		sc->sc_iodone = ld_ataraid_iodone_raid0;
    177   1.1   thorpej 		break;
    178   1.1   thorpej 
    179   1.1   thorpej 	case AAI_L_RAID0:
    180   1.9   thorpej 		level = "RAID-0";
    181   1.1   thorpej 		ld->sc_start = ld_ataraid_start_raid0;
    182   1.1   thorpej 		sc->sc_iodone = ld_ataraid_iodone_raid0;
    183   1.1   thorpej 		break;
    184   1.1   thorpej 
    185   1.1   thorpej 	case AAI_L_RAID1:
    186   1.9   thorpej 		level = "RAID-1";
    187  1.12     enami 		ld->sc_start = ld_ataraid_start_raid0;
    188  1.12     enami 		sc->sc_iodone = ld_ataraid_iodone_raid0;
    189   1.1   thorpej 		break;
    190   1.1   thorpej 
    191   1.1   thorpej 	case AAI_L_RAID0 | AAI_L_RAID1:
    192   1.9   thorpej 		level = "RAID-10";
    193  1.12     enami 		ld->sc_start = ld_ataraid_start_raid0;
    194  1.12     enami 		sc->sc_iodone = ld_ataraid_iodone_raid0;
    195   1.1   thorpej 		break;
    196   1.1   thorpej 
    197   1.1   thorpej 	default:
    198  1.11    itojun 		snprintf(unklev, sizeof(unklev), "<unknown level 0x%x>",
    199  1.11    itojun 		    aai->aai_level);
    200   1.1   thorpej 		level = unklev;
    201   1.1   thorpej 	}
    202   1.1   thorpej 
    203   1.1   thorpej 	aprint_naive(": ATA %s array\n", level);
    204   1.1   thorpej 	aprint_normal(": %s ATA %s array\n",
    205   1.1   thorpej 	    ata_raid_type_name(aai->aai_type), level);
    206   1.1   thorpej 
    207   1.1   thorpej 	if (ld->sc_start == NULL) {
    208  1.29      tron 		aprint_error_dev(ld->sc_dv, "unsupported array type\n");
    209   1.1   thorpej 		return;
    210   1.1   thorpej 	}
    211   1.1   thorpej 
    212   1.1   thorpej 	/*
    213   1.1   thorpej 	 * We get a geometry from the device; use it.
    214   1.1   thorpej 	 */
    215   1.1   thorpej 	ld->sc_nheads = aai->aai_heads;
    216   1.1   thorpej 	ld->sc_nsectors = aai->aai_sectors;
    217   1.1   thorpej 	ld->sc_ncylinders = aai->aai_cylinders;
    218   1.1   thorpej 
    219   1.1   thorpej 	/*
    220   1.1   thorpej 	 * Configure all the component disks.
    221   1.1   thorpej 	 */
    222   1.1   thorpej 	for (i = 0; i < aai->aai_ndisks; i++) {
    223  1.32      tron 		adi = &aai->aai_disks[i];
    224  1.32      tron 		vp = ata_raid_disk_vnode_find(adi);
    225  1.32      tron 		if (vp == NULL) {
    226   1.1   thorpej 			/*
    227   1.1   thorpej 			 * XXX This is bogus.  We should just mark the
    228   1.1   thorpej 			 * XXX component as FAILED, and write-back new
    229   1.1   thorpej 			 * XXX config blocks.
    230   1.1   thorpej 			 */
    231   1.3   thorpej 			break;
    232   1.1   thorpej 		}
    233   1.1   thorpej 		sc->sc_vnodes[i] = vp;
    234   1.1   thorpej 	}
    235   1.3   thorpej 	if (i == aai->aai_ndisks) {
    236   1.3   thorpej 		ld->sc_flags = LDF_ENABLED;
    237   1.3   thorpej 		goto finish;
    238   1.3   thorpej 	}
    239   1.1   thorpej 
    240   1.1   thorpej 	for (i = 0; i < aai->aai_ndisks; i++) {
    241   1.1   thorpej 		vp = sc->sc_vnodes[i];
    242   1.1   thorpej 		sc->sc_vnodes[i] = NULL;
    243   1.3   thorpej 		if (vp != NULL)
    244  1.25        ad 			(void) vn_close(vp, FREAD|FWRITE, NOCRED);
    245   1.1   thorpej 	}
    246   1.3   thorpej 
    247   1.3   thorpej  finish:
    248  1.30      tron #if NBIO > 0
    249  1.30      tron 	if (bio_register(self, ld_ataraid_bioctl) != 0)
    250  1.30      tron 		panic("%s: bioctl registration failed\n",
    251  1.30      tron 		    device_xname(ld->sc_dv));
    252  1.30      tron #endif
    253  1.36       bsh        SIMPLEQ_INIT(&sc->sc_cbufq);
    254   1.3   thorpej 	ldattach(ld);
    255   1.1   thorpej }
    256   1.1   thorpej 
    257  1.36       bsh static int
    258  1.36       bsh cbufpool_ctor(void *arg, void *obj, int flags)
    259  1.36       bsh {
    260  1.36       bsh        struct ld_ataraid_softc *sc = arg;
    261  1.36       bsh        struct ld_softc *ld = &sc->sc_ld;
    262  1.36       bsh        struct cbuf *cbp = obj;
    263  1.36       bsh 
    264  1.36       bsh        /* We release/reacquire the spinlock before calling buf_init() */
    265  1.36       bsh        mutex_exit(&ld->sc_mutex);
    266  1.36       bsh        buf_init(&cbp->cb_buf);
    267  1.36       bsh        mutex_enter(&ld->sc_mutex);
    268  1.36       bsh 
    269  1.36       bsh        return 0;
    270  1.36       bsh }
    271  1.36       bsh 
    272  1.36       bsh static void
    273  1.36       bsh cbufpool_dtor(void *arg, void *obj)
    274  1.36       bsh {
    275  1.36       bsh        struct cbuf *cbp = obj;
    276  1.36       bsh 
    277  1.36       bsh        buf_destroy(&cbp->cb_buf);
    278  1.36       bsh }
    279  1.36       bsh 
    280   1.1   thorpej static struct cbuf *
    281   1.1   thorpej ld_ataraid_make_cbuf(struct ld_ataraid_softc *sc, struct buf *bp,
    282  1.19  christos     u_int comp, daddr_t bn, void *addr, long bcount)
    283   1.1   thorpej {
    284   1.1   thorpej 	struct cbuf *cbp;
    285   1.1   thorpej 
    286   1.1   thorpej 	cbp = CBUF_GET();
    287   1.1   thorpej 	if (cbp == NULL)
    288  1.36       bsh                return NULL;
    289  1.23        ad 	cbp->cb_buf.b_flags = bp->b_flags;
    290  1.23        ad 	cbp->cb_buf.b_oflags = bp->b_oflags;
    291  1.23        ad 	cbp->cb_buf.b_cflags = bp->b_cflags;
    292   1.1   thorpej 	cbp->cb_buf.b_iodone = sc->sc_iodone;
    293   1.1   thorpej 	cbp->cb_buf.b_proc = bp->b_proc;
    294   1.1   thorpej 	cbp->cb_buf.b_vp = sc->sc_vnodes[comp];
    295  1.38     rmind 	cbp->cb_buf.b_objlock = sc->sc_vnodes[comp]->v_interlock;
    296   1.1   thorpej 	cbp->cb_buf.b_blkno = bn + sc->sc_aai->aai_offset;
    297   1.1   thorpej 	cbp->cb_buf.b_data = addr;
    298   1.1   thorpej 	cbp->cb_buf.b_bcount = bcount;
    299   1.1   thorpej 
    300   1.1   thorpej 	/* Context for iodone */
    301   1.1   thorpej 	cbp->cb_obp = bp;
    302   1.1   thorpej 	cbp->cb_sc = sc;
    303   1.1   thorpej 	cbp->cb_comp = comp;
    304  1.12     enami 	cbp->cb_other = NULL;
    305  1.12     enami 	cbp->cb_flags = 0;
    306   1.1   thorpej 
    307  1.36       bsh        return cbp;
    308  1.36       bsh }
    309  1.36       bsh 
    310  1.36       bsh static void
    311  1.36       bsh ld_ataraid_start_vstrategy(void *arg)
    312  1.36       bsh {
    313  1.36       bsh        struct ld_ataraid_softc *sc = arg;
    314  1.36       bsh        struct cbuf *cbp;
    315  1.36       bsh 
    316  1.36       bsh        while ((cbp = SIMPLEQ_FIRST(&sc->sc_cbufq)) != NULL) {
    317  1.36       bsh                SIMPLEQ_REMOVE_HEAD(&sc->sc_cbufq, cb_q);
    318  1.36       bsh                if ((cbp->cb_buf.b_flags & B_READ) == 0) {
    319  1.38     rmind                        mutex_enter(cbp->cb_buf.b_vp->v_interlock);
    320  1.36       bsh                        cbp->cb_buf.b_vp->v_numoutput++;
    321  1.38     rmind                        mutex_exit(cbp->cb_buf.b_vp->v_interlock);
    322  1.36       bsh                }
    323  1.36       bsh                VOP_STRATEGY(cbp->cb_buf.b_vp, &cbp->cb_buf);
    324  1.36       bsh        }
    325   1.1   thorpej }
    326   1.1   thorpej 
    327   1.1   thorpej static int
    328   1.1   thorpej ld_ataraid_start_span(struct ld_softc *ld, struct buf *bp)
    329   1.1   thorpej {
    330   1.1   thorpej 	struct ld_ataraid_softc *sc = (void *) ld;
    331   1.1   thorpej 	struct ataraid_array_info *aai = sc->sc_aai;
    332   1.1   thorpej 	struct ataraid_disk_info *adi;
    333   1.1   thorpej 	struct cbuf *cbp;
    334  1.19  christos 	char *addr;
    335   1.1   thorpej 	daddr_t bn;
    336   1.1   thorpej 	long bcount, rcount;
    337   1.1   thorpej 	u_int comp;
    338   1.1   thorpej 
    339   1.1   thorpej 	/* Allocate component buffers. */
    340   1.1   thorpej 	addr = bp->b_data;
    341   1.1   thorpej 
    342   1.1   thorpej 	/* Find the first component. */
    343   1.1   thorpej 	comp = 0;
    344   1.1   thorpej 	adi = &aai->aai_disks[comp];
    345   1.1   thorpej 	bn = bp->b_rawblkno;
    346   1.1   thorpej 	while (bn >= adi->adi_compsize) {
    347   1.1   thorpej 		bn -= adi->adi_compsize;
    348   1.1   thorpej 		adi = &aai->aai_disks[++comp];
    349   1.1   thorpej 	}
    350   1.1   thorpej 
    351   1.1   thorpej 	bp->b_resid = bp->b_bcount;
    352   1.1   thorpej 
    353   1.1   thorpej 	for (bcount = bp->b_bcount; bcount > 0; bcount -= rcount) {
    354   1.1   thorpej 		rcount = bp->b_bcount;
    355   1.1   thorpej 		if ((adi->adi_compsize - bn) < btodb(rcount))
    356   1.1   thorpej 			rcount = dbtob(adi->adi_compsize - bn);
    357   1.1   thorpej 
    358   1.1   thorpej 		cbp = ld_ataraid_make_cbuf(sc, bp, comp, bn, addr, rcount);
    359   1.1   thorpej 		if (cbp == NULL) {
    360   1.1   thorpej 			/* Free the already allocated component buffers. */
    361  1.36       bsh                        while ((cbp = SIMPLEQ_FIRST(&sc->sc_cbufq)) != NULL) {
    362  1.36       bsh                                SIMPLEQ_REMOVE_HEAD(&sc->sc_cbufq, cb_q);
    363   1.1   thorpej 				CBUF_PUT(cbp);
    364   1.1   thorpej 			}
    365  1.36       bsh                        return EAGAIN;
    366   1.1   thorpej 		}
    367   1.1   thorpej 
    368   1.1   thorpej 		/*
    369   1.1   thorpej 		 * For a span, we always know we advance to the next disk,
    370   1.1   thorpej 		 * and always start at offset 0 on that disk.
    371   1.1   thorpej 		 */
    372   1.1   thorpej 		adi = &aai->aai_disks[++comp];
    373   1.1   thorpej 		bn = 0;
    374   1.1   thorpej 
    375  1.36       bsh                SIMPLEQ_INSERT_TAIL(&sc->sc_cbufq, cbp, cb_q);
    376   1.1   thorpej 		addr += rcount;
    377   1.1   thorpej 	}
    378   1.1   thorpej 
    379   1.1   thorpej 	/* Now fire off the requests. */
    380  1.36       bsh        softint_schedule(sc->sc_sih_cookie);
    381   1.1   thorpej 
    382  1.36       bsh        return 0;
    383   1.1   thorpej }
    384   1.1   thorpej 
/*
 * Start routine shared by the RAID-0, RAID-1 and RAID-10 levels.
 *
 * The request is cut at interleave boundaries.  Each piece is mapped to
 * a component (stripe number modulo the array width) and a block on that
 * component, turned into a component buffer, and queued on sc_cbufq; the
 * soft interrupt is then scheduled to issue the queue.
 *
 * When the array level includes RAID1:
 *  - if the chosen component is not online, the component `aai_width'
 *    slots further on is tried instead;
 *  - for writes, a second component buffer is queued for that other
 *    component when it is online, and the two are linked through
 *    cb_other.
 *
 * Returns 0 once everything is queued, EIO if no online component could
 * be found for a piece, or EAGAIN if a component buffer could not be
 * allocated.  On either failure sc_cbufq is drained back into the pool.
 */
static int
ld_ataraid_start_raid0(struct ld_softc *ld, struct buf *bp)
{
	struct ld_ataraid_softc *sc = (void *)ld;
	struct ataraid_array_info *aai = sc->sc_aai;
	struct ataraid_disk_info *adi;
	struct cbuf *cbp, *other_cbp;
	char *addr;
	daddr_t bn, cbn, tbn, off;
	long bcount, rcount;
	u_int comp;
	const int read = bp->b_flags & B_READ;
	const int mirror = aai->aai_level & AAI_L_RAID1;
	int error = 0;

	/* Allocate component buffers. */
	addr = bp->b_data;
	bn = bp->b_rawblkno;

	bp->b_resid = bp->b_bcount;

	for (bcount = bp->b_bcount; bcount > 0; bcount -= rcount) {
		/* tbn: stripe number; off: block offset inside the stripe. */
		tbn = bn / aai->aai_interleave;
		off = bn % aai->aai_interleave;

		if (__predict_false(tbn == aai->aai_capacity /
					   aai->aai_interleave)) {
			/* Last stripe. */
			/*
			 * The blocks left over after the last full stripe
			 * are divided evenly between the components.
			 * NOTE(review): sz is 0 when fewer than aai_width
			 * blocks are left over, and is then used as a
			 * divisor -- confirm this cannot happen.
			 */
			daddr_t sz = (aai->aai_capacity -
				      (tbn * aai->aai_interleave)) /
				     aai->aai_width;
			comp = off / sz;
			cbn = ((tbn / aai->aai_width) * aai->aai_interleave) +
			    (off % sz);
			rcount = min(bcount, dbtob(sz));
		} else {
			comp = tbn % aai->aai_width;
			cbn = ((tbn / aai->aai_width) * aai->aai_interleave) +
			    off;
			/* Never cross into the next stripe with one piece. */
			rcount = min(bcount, dbtob(aai->aai_interleave - off));
		}

		/*
		 * See if a component is valid.
		 */
try_mirror:
		adi = &aai->aai_disks[comp];
		if ((adi->adi_status & ADI_S_ONLINE) == 0) {
			if (mirror && comp < aai->aai_width) {
				comp += aai->aai_width;
				goto try_mirror;
			}

			/*
			 * No component available.
			 */
			error = EIO;
			goto free_and_exit;
		}

		cbp = ld_ataraid_make_cbuf(sc, bp, comp, cbn, addr, rcount);
		if (cbp == NULL) {
			/*
			 * Both labels below are also reached by goto from
			 * outside this if body: resource_shortage from the
			 * mirror allocation further down, free_and_exit
			 * from the offline-component check above.
			 */
resource_shortage:
			error = EAGAIN;
free_and_exit:
			/* Free the already allocated component buffers. */
			while ((cbp = SIMPLEQ_FIRST(&sc->sc_cbufq)) != NULL) {
				SIMPLEQ_REMOVE_HEAD(&sc->sc_cbufq, cb_q);
				CBUF_PUT(cbp);
			}
			return error;
		}
		SIMPLEQ_INSERT_TAIL(&sc->sc_cbufq, cbp, cb_q);
		/* Mirrored write: also queue the same piece for the other half. */
		if (mirror && !read && comp < aai->aai_width) {
			comp += aai->aai_width;
			adi = &aai->aai_disks[comp];
			if (adi->adi_status & ADI_S_ONLINE) {
				other_cbp = ld_ataraid_make_cbuf(sc, bp,
				    comp, cbn, addr, rcount);
				if (other_cbp == NULL)
					goto resource_shortage;
				SIMPLEQ_INSERT_TAIL(&sc->sc_cbufq,
				    other_cbp, cb_q);
				/* Link the pair so iodone can tell them apart. */
				other_cbp->cb_other = cbp;
				cbp->cb_other = other_cbp;
			}
		}
		bn += btodb(rcount);
		addr += rcount;
	}

	/* Now fire off the requests. */
	softint_schedule(sc->sc_sih_cookie);

	return error;
}
    481   1.1   thorpej 
    482   1.1   thorpej /*
    483   1.1   thorpej  * Called at interrupt time.  Mark the component as done and if all
    484   1.1   thorpej  * components are done, take an "interrupt".
    485   1.1   thorpej  */
    486   1.1   thorpej static void
    487   1.1   thorpej ld_ataraid_iodone_raid0(struct buf *vbp)
    488   1.1   thorpej {
    489  1.12     enami 	struct cbuf *cbp = (struct cbuf *) vbp, *other_cbp;
    490   1.1   thorpej 	struct buf *bp = cbp->cb_obp;
    491   1.1   thorpej 	struct ld_ataraid_softc *sc = cbp->cb_sc;
    492  1.12     enami 	struct ataraid_array_info *aai = sc->sc_aai;
    493  1.12     enami 	struct ataraid_disk_info *adi;
    494   1.1   thorpej 	long count;
    495  1.12     enami 	int s, iodone;
    496   1.1   thorpej 
    497   1.1   thorpej 	s = splbio();
    498   1.1   thorpej 
    499  1.12     enami 	iodone = cbp->cb_flags & CBUF_IODONE;
    500  1.12     enami 	other_cbp = cbp->cb_other;
    501  1.12     enami 	if (other_cbp != NULL)
    502  1.12     enami 		/* You are alone */
    503  1.12     enami 		other_cbp->cb_other = NULL;
    504  1.12     enami 
    505  1.21        ad 	if (cbp->cb_buf.b_error != 0) {
    506  1.12     enami 		/*
    507  1.12     enami 		 * Mark this component broken.
    508  1.12     enami 		 */
    509  1.12     enami 		adi = &aai->aai_disks[cbp->cb_comp];
    510  1.12     enami 		adi->adi_status &= ~ADI_S_ONLINE;
    511  1.12     enami 
    512  1.12     enami 		printf("%s: error %d on component %d (%s)\n",
    513  1.29      tron 		    device_xname(sc->sc_ld.sc_dv), bp->b_error, cbp->cb_comp,
    514  1.26    cegger 		    device_xname(adi->adi_dev));
    515  1.12     enami 
    516  1.12     enami 		/*
    517  1.12     enami 		 * If we didn't see an error yet and we are reading
    518  1.12     enami 		 * RAID1 disk, try another component.
    519  1.12     enami 		 */
    520  1.21        ad 		if (bp->b_error == 0 &&
    521  1.12     enami 		    (cbp->cb_buf.b_flags & B_READ) != 0 &&
    522  1.12     enami 		    (aai->aai_level & AAI_L_RAID1) != 0 &&
    523  1.12     enami 		    cbp->cb_comp < aai->aai_width) {
    524  1.12     enami 			cbp->cb_comp += aai->aai_width;
    525  1.12     enami 			adi = &aai->aai_disks[cbp->cb_comp];
    526  1.12     enami 			if (adi->adi_status & ADI_S_ONLINE) {
    527  1.21        ad 				cbp->cb_buf.b_error = 0;
    528  1.12     enami 				VOP_STRATEGY(cbp->cb_buf.b_vp, &cbp->cb_buf);
    529  1.12     enami 				goto out;
    530  1.12     enami 			}
    531  1.12     enami 		}
    532  1.12     enami 
    533  1.12     enami 		if (iodone || other_cbp != NULL)
    534  1.12     enami 			/*
    535  1.12     enami 			 * If I/O on other component successfully done
    536  1.12     enami 			 * or the I/O is still in progress, no need
    537  1.12     enami 			 * to tell an error to upper layer.
    538  1.12     enami 			 */
    539  1.12     enami 			;
    540  1.12     enami 		else {
    541  1.12     enami 			bp->b_error = cbp->cb_buf.b_error ?
    542  1.12     enami 			    cbp->cb_buf.b_error : EIO;
    543  1.12     enami 		}
    544   1.1   thorpej 
    545   1.1   thorpej 		/* XXX Update component config blocks. */
    546   1.1   thorpej 
    547  1.12     enami 	} else {
    548  1.12     enami 		/*
    549  1.12     enami 		 * If other I/O is still in progress, tell it that
    550  1.12     enami 		 * our I/O is successfully done.
    551  1.12     enami 		 */
    552  1.12     enami 		if (other_cbp != NULL)
    553  1.12     enami 			other_cbp->cb_flags |= CBUF_IODONE;
    554   1.1   thorpej 	}
    555   1.1   thorpej 	count = cbp->cb_buf.b_bcount;
    556   1.1   thorpej 	CBUF_PUT(cbp);
    557   1.1   thorpej 
    558  1.12     enami 	if (other_cbp != NULL)
    559  1.12     enami 		goto out;
    560  1.12     enami 
    561   1.1   thorpej 	/* If all done, "interrupt". */
    562   1.1   thorpej 	bp->b_resid -= count;
    563   1.1   thorpej 	if (bp->b_resid < 0)
    564   1.1   thorpej 		panic("ld_ataraid_iodone_raid0: count");
    565   1.1   thorpej 	if (bp->b_resid == 0)
    566   1.1   thorpej 		lddone(&sc->sc_ld, bp);
    567  1.12     enami 
    568  1.12     enami out:
    569   1.1   thorpej 	splx(s);
    570   1.1   thorpej }
    571   1.1   thorpej 
/*
 * Dump entry point installed as ld->sc_dump.  Dumping is not
 * implemented: every call fails with EIO and no argument is examined.
 */
static int
ld_ataraid_dump(struct ld_softc *sc, void *data,
    int blkno, int blkcnt)
{
	return EIO;
}
    579  1.30      tron 
    580  1.30      tron #if NBIO > 0
    581  1.30      tron static int
    582  1.30      tron ld_ataraid_bioctl(device_t self, u_long cmd, void *addr)
    583  1.30      tron {
    584  1.30      tron 	struct ld_ataraid_softc *sc = device_private(self);
    585  1.30      tron 	int error = 0;
    586  1.30      tron 
    587  1.30      tron 	switch (cmd) {
    588  1.30      tron 	case BIOCINQ:
    589  1.30      tron 		error = ld_ataraid_bioinq(sc, (struct bioc_inq *)addr);
    590  1.30      tron 		break;
    591  1.30      tron 	case BIOCVOL:
    592  1.30      tron 		error = ld_ataraid_biovol(sc, (struct bioc_vol *)addr);
    593  1.30      tron 		break;
    594  1.30      tron 	case BIOCDISK:
    595  1.30      tron 		error = ld_ataraid_biodisk(sc, (struct bioc_disk *)addr);
    596  1.30      tron 		break;
    597  1.30      tron 	default:
    598  1.30      tron 		error = ENOTTY;
    599  1.30      tron 		break;
    600  1.30      tron 	}
    601  1.30      tron 
    602  1.30      tron 	return error;
    603  1.30      tron }
    604  1.30      tron 
    605  1.30      tron static int
    606  1.30      tron ld_ataraid_bioinq(struct ld_ataraid_softc *sc, struct bioc_inq *bi)
    607  1.30      tron {
    608  1.30      tron 	struct ataraid_array_info *aai = sc->sc_aai;
    609  1.30      tron 
    610  1.30      tron 	/* there's always one volume per ld device */
    611  1.30      tron 	bi->bi_novol = 1;
    612  1.30      tron 	bi->bi_nodisk = aai->aai_ndisks;
    613  1.30      tron 
    614  1.30      tron 	return 0;
    615  1.30      tron }
    616  1.30      tron 
    617  1.30      tron static int
    618  1.30      tron ld_ataraid_biovol(struct ld_ataraid_softc *sc, struct bioc_vol *bv)
    619  1.30      tron {
    620  1.30      tron 	struct ataraid_array_info *aai = sc->sc_aai;
    621  1.30      tron 	struct ld_softc *ld = &sc->sc_ld;
    622  1.37       bsh #define	to_kibytes(ld,s)	(ld->sc_secsize*(s)/1024)
    623  1.30      tron 
    624  1.30      tron 	/* Fill in data for _this_ volume */
    625  1.30      tron 	bv->bv_percent = -1;
    626  1.30      tron 	bv->bv_seconds = 0;
    627  1.30      tron 
    628  1.30      tron 	switch (aai->aai_status) {
    629  1.30      tron 	case AAI_S_READY:
    630  1.30      tron 		bv->bv_status = BIOC_SVONLINE;
    631  1.30      tron 		break;
    632  1.30      tron 	case AAI_S_DEGRADED:
    633  1.30      tron 		bv->bv_status = BIOC_SVDEGRADED;
    634  1.30      tron 		break;
    635  1.30      tron 	}
    636  1.30      tron 
    637  1.30      tron 	bv->bv_size = ld->sc_secsize * ld->sc_secperunit;
    638  1.30      tron 
    639  1.30      tron 	switch (aai->aai_level) {
    640  1.30      tron 	case AAI_L_SPAN:
    641  1.30      tron 	case AAI_L_RAID0:
    642  1.37       bsh 		bv->bv_stripe_size = to_kibytes(ld, aai->aai_interleave);
    643  1.30      tron 		bv->bv_level = 0;
    644  1.30      tron 		break;
    645  1.30      tron 	case AAI_L_RAID1:
    646  1.30      tron 		bv->bv_stripe_size = 0;
    647  1.30      tron 		bv->bv_level = 1;
    648  1.30      tron 		break;
    649  1.30      tron 	case AAI_L_RAID5:
    650  1.37       bsh 		bv->bv_stripe_size = to_kibytes(ld, aai->aai_interleave);
    651  1.30      tron 		bv->bv_level = 5;
    652  1.30      tron 		break;
    653  1.30      tron 	}
    654  1.30      tron 
    655  1.30      tron 	bv->bv_nodisk = aai->aai_ndisks;
    656  1.30      tron 	strlcpy(bv->bv_dev, device_xname(ld->sc_dv), sizeof(bv->bv_dev));
    657  1.31      tron 	if (aai->aai_name[0] != '\0')
    658  1.31      tron 		strlcpy(bv->bv_vendor, aai->aai_name, sizeof(bv->bv_vendor));
    659  1.30      tron 
    660  1.30      tron 	return 0;
    661  1.30      tron }
    662  1.30      tron 
    663  1.30      tron static int
    664  1.30      tron ld_ataraid_biodisk(struct ld_ataraid_softc *sc, struct bioc_disk *bd)
    665  1.30      tron {
    666  1.30      tron 	struct ataraid_array_info *aai = sc->sc_aai;
    667  1.30      tron 	struct ataraid_disk_info *adi;
    668  1.30      tron 	struct ld_softc *ld = &sc->sc_ld;
    669  1.30      tron 	struct atabus_softc *atabus;
    670  1.30      tron 	struct wd_softc *wd;
    671  1.30      tron 	char model[81], serial[41], rev[17];
    672  1.30      tron 
    673  1.30      tron 	/* sanity check */
    674  1.30      tron 	if (bd->bd_diskid > aai->aai_ndisks)
    675  1.30      tron 		return EINVAL;
    676  1.30      tron 
    677  1.30      tron 	adi = &aai->aai_disks[bd->bd_diskid];
    678  1.30      tron 	atabus = device_private(device_parent(adi->adi_dev));
    679  1.30      tron 	wd = device_private(adi->adi_dev);
    680  1.30      tron 
    681  1.30      tron 	/* fill in data for _this_ disk */
    682  1.30      tron 	switch (adi->adi_status) {
    683  1.30      tron 	case ADI_S_ONLINE | ADI_S_ASSIGNED:
    684  1.30      tron 		bd->bd_status = BIOC_SDONLINE;
    685  1.30      tron 		break;
    686  1.30      tron 	case ADI_S_SPARE:
    687  1.30      tron 		bd->bd_status = BIOC_SDHOTSPARE;
    688  1.30      tron 		break;
    689  1.30      tron 	default:
    690  1.30      tron 		bd->bd_status = BIOC_SDOFFLINE;
    691  1.30      tron 		break;
    692  1.30      tron 	}
    693  1.30      tron 
    694  1.30      tron 	bd->bd_channel = 0;
    695  1.30      tron 	bd->bd_target = atabus->sc_chan->ch_channel;
    696  1.30      tron 	bd->bd_lun = 0;
    697  1.30      tron 	bd->bd_size = (wd->sc_capacity * ld->sc_secsize) - aai->aai_reserved;
    698  1.30      tron 
    699  1.30      tron 	strlcpy(bd->bd_procdev, device_xname(adi->adi_dev),
    700  1.30      tron 	    sizeof(bd->bd_procdev));
    701  1.30      tron 
    702  1.30      tron 	scsipi_strvis(serial, sizeof(serial), wd->sc_params.atap_serial,
    703  1.30      tron 	    sizeof(wd->sc_params.atap_serial));
    704  1.30      tron 	scsipi_strvis(model, sizeof(model), wd->sc_params.atap_model,
    705  1.30      tron 	    sizeof(wd->sc_params.atap_model));
    706  1.30      tron 	scsipi_strvis(rev, sizeof(rev), wd->sc_params.atap_revision,
    707  1.30      tron 	    sizeof(wd->sc_params.atap_revision));
    708  1.30      tron 
    709  1.30      tron 	snprintf(bd->bd_vendor, sizeof(bd->bd_vendor), "%s %s", model, rev);
    710  1.30      tron 	strlcpy(bd->bd_serial, serial, sizeof(bd->bd_serial));
    711  1.30      tron 
    712  1.30      tron 	return 0;
    713  1.30      tron }
    714  1.30      tron #endif /* NBIO > 0 */
    715