Home | History | Annotate | Line # | Download | only in raidframe
rf_reconutil.c revision 1.32
      1  1.32       mrg /*	$NetBSD: rf_reconutil.c,v 1.32 2011/05/02 01:07:24 mrg Exp $	*/
      2   1.1     oster /*
      3   1.1     oster  * Copyright (c) 1995 Carnegie-Mellon University.
      4   1.1     oster  * All rights reserved.
      5   1.1     oster  *
      6   1.1     oster  * Author: Mark Holland
      7   1.1     oster  *
      8   1.1     oster  * Permission to use, copy, modify and distribute this software and
      9   1.1     oster  * its documentation is hereby granted, provided that both the copyright
     10   1.1     oster  * notice and this permission notice appear in all copies of the
     11   1.1     oster  * software, derivative works or modified versions, and any portions
     12   1.1     oster  * thereof, and that both notices appear in supporting documentation.
     13   1.1     oster  *
     14   1.1     oster  * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
     15   1.1     oster  * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
     16   1.1     oster  * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
     17   1.1     oster  *
     18   1.1     oster  * Carnegie Mellon requests users of this software to return to
     19   1.1     oster  *
      20   1.1     oster  *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
     21   1.1     oster  *  School of Computer Science
     22   1.1     oster  *  Carnegie Mellon University
     23   1.1     oster  *  Pittsburgh PA 15213-3890
     24   1.1     oster  *
     25   1.1     oster  * any improvements or extensions that they make and grant Carnegie the
     26   1.1     oster  * rights to redistribute these changes.
     27   1.1     oster  */
     28   1.1     oster 
     29   1.1     oster /********************************************
     30   1.1     oster  * rf_reconutil.c -- reconstruction utilities
     31   1.1     oster  ********************************************/
     32   1.5     lukem 
     33   1.5     lukem #include <sys/cdefs.h>
     34  1.32       mrg __KERNEL_RCSID(0, "$NetBSD: rf_reconutil.c,v 1.32 2011/05/02 01:07:24 mrg Exp $");
     35   1.1     oster 
     36   1.4     oster #include <dev/raidframe/raidframevar.h>
     37   1.4     oster 
     38   1.1     oster #include "rf_raid.h"
     39   1.1     oster #include "rf_desc.h"
     40   1.1     oster #include "rf_reconutil.h"
     41   1.1     oster #include "rf_reconbuffer.h"
     42   1.1     oster #include "rf_general.h"
     43   1.1     oster #include "rf_decluster.h"
     44   1.1     oster #include "rf_raid5_rotatedspare.h"
     45   1.1     oster #include "rf_interdecluster.h"
     46   1.1     oster #include "rf_chaindecluster.h"
     47   1.1     oster 
     48   1.1     oster /*******************************************************************
     49   1.1     oster  * allocates/frees the reconstruction control information structures
     50   1.1     oster  *******************************************************************/
     51  1.19     oster 
     52  1.19     oster /* fcol - failed column
     53  1.19     oster  * scol - identifies which spare we are using
     54  1.19     oster  */
     55  1.19     oster 
     56   1.3     oster RF_ReconCtrl_t *
     57  1.25     perry rf_MakeReconControl(RF_RaidReconDesc_t *reconDesc,
     58  1.19     oster 		    RF_RowCol_t fcol, RF_RowCol_t scol)
     59   1.1     oster {
     60   1.3     oster 	RF_Raid_t *raidPtr = reconDesc->raidPtr;
     61   1.3     oster 	RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
     62   1.3     oster 	RF_ReconUnitCount_t RUsPerPU = layoutPtr->SUsPerPU / layoutPtr->SUsPerRU;
     63   1.3     oster 	RF_ReconUnitCount_t numSpareRUs;
     64   1.3     oster 	RF_ReconCtrl_t *reconCtrlPtr;
     65   1.3     oster 	RF_ReconBuffer_t *rbuf;
     66  1.14  jdolecek 	const RF_LayoutSW_t *lp;
     67  1.12     oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
     68  1.12     oster 	int     retcode;
     69  1.12     oster #endif
     70   1.3     oster 	RF_RowCol_t i;
     71   1.3     oster 
     72   1.3     oster 	lp = raidPtr->Layout.map;
     73   1.3     oster 
     74   1.3     oster 	/* make and zero the global reconstruction structure and the per-disk
     75   1.3     oster 	 * structure */
     76  1.16     oster 	RF_Malloc(reconCtrlPtr, sizeof(RF_ReconCtrl_t), (RF_ReconCtrl_t *));
     77  1.11     oster 
     78  1.11     oster 	/* note: this zeros the perDiskInfo */
     79  1.16     oster 	RF_Malloc(reconCtrlPtr->perDiskInfo, raidPtr->numCol *
     80  1.11     oster 		  sizeof(RF_PerDiskReconCtrl_t), (RF_PerDiskReconCtrl_t *));
     81   1.3     oster 	reconCtrlPtr->reconDesc = reconDesc;
     82   1.3     oster 	reconCtrlPtr->fcol = fcol;
     83   1.3     oster 	reconCtrlPtr->spareCol = scol;
     84   1.3     oster 	reconCtrlPtr->lastPSID = layoutPtr->numStripe / layoutPtr->SUsPerPU;
     85   1.3     oster 	reconCtrlPtr->percentComplete = 0;
     86  1.24     oster 	reconCtrlPtr->error = 0;
     87  1.24     oster 	reconCtrlPtr->pending_writes = 0;
     88   1.3     oster 
     89   1.3     oster 	/* initialize each per-disk recon information structure */
     90   1.3     oster 	for (i = 0; i < raidPtr->numCol; i++) {
     91   1.3     oster 		reconCtrlPtr->perDiskInfo[i].reconCtrl = reconCtrlPtr;
     92   1.3     oster 		reconCtrlPtr->perDiskInfo[i].col = i;
     93  1.11     oster 		/* make it appear as if we just finished an RU */
     94  1.25     perry 		reconCtrlPtr->perDiskInfo[i].curPSID = -1;
     95   1.3     oster 		reconCtrlPtr->perDiskInfo[i].ru_count = RUsPerPU - 1;
     96   1.3     oster 	}
     97   1.3     oster 
     98   1.3     oster 	/* Get the number of spare units per disk and the sparemap in case
     99   1.3     oster 	 * spare is distributed  */
    100   1.3     oster 
    101   1.3     oster 	if (lp->GetNumSpareRUs) {
    102   1.3     oster 		numSpareRUs = lp->GetNumSpareRUs(raidPtr);
    103   1.3     oster 	} else {
    104   1.3     oster 		numSpareRUs = 0;
    105   1.3     oster 	}
    106   1.3     oster 
    107  1.12     oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
    108   1.3     oster 	/*
    109   1.3     oster          * Not all distributed sparing archs need dynamic mappings
    110   1.3     oster          */
    111   1.3     oster 	if (lp->InstallSpareTable) {
    112  1.27     oster 		retcode = rf_InstallSpareTable(raidPtr, 0, fcol);
    113   1.3     oster 		if (retcode) {
    114   1.3     oster 			RF_PANIC();	/* XXX fix this */
    115   1.3     oster 		}
    116   1.3     oster 	}
    117  1.12     oster #endif
    118   1.3     oster 	/* make the reconstruction map */
    119   1.3     oster 	reconCtrlPtr->reconMap = rf_MakeReconMap(raidPtr, (int) (layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit),
    120   1.3     oster 	    raidPtr->sectorsPerDisk, numSpareRUs);
    121   1.3     oster 
    122   1.3     oster 	/* make the per-disk reconstruction buffers */
    123   1.3     oster 	for (i = 0; i < raidPtr->numCol; i++) {
    124  1.15     oster 		reconCtrlPtr->perDiskInfo[i].rbuf = (i == fcol) ? NULL : rf_MakeReconBuffer(raidPtr, i, RF_RBUF_TYPE_EXCLUSIVE);
    125   1.3     oster 	}
    126   1.3     oster 
    127   1.3     oster 	/* initialize the event queue */
    128  1.32       mrg 	rf_init_mutex2(reconCtrlPtr->eq_mutex, IPL_VM);
    129  1.32       mrg 	rf_init_cond2(reconCtrlPtr->eq_cv, "rfevq");
    130  1.17     oster 
    131   1.3     oster 	reconCtrlPtr->eventQueue = NULL;
    132   1.3     oster 	reconCtrlPtr->eq_count = 0;
    133   1.3     oster 
    134   1.3     oster 	/* make the floating recon buffers and append them to the free list */
    135  1.29       mrg 	rf_mutex_init(&reconCtrlPtr->rb_mutex);
    136  1.17     oster 
    137   1.3     oster 	reconCtrlPtr->fullBufferList = NULL;
    138   1.3     oster 	reconCtrlPtr->floatingRbufs = NULL;
    139   1.3     oster 	reconCtrlPtr->committedRbufs = NULL;
    140   1.3     oster 	for (i = 0; i < raidPtr->numFloatingReconBufs; i++) {
    141  1.25     perry 		rbuf = rf_MakeReconBuffer(raidPtr, fcol,
    142  1.11     oster 					  RF_RBUF_TYPE_FLOATING);
    143   1.3     oster 		rbuf->next = reconCtrlPtr->floatingRbufs;
    144   1.3     oster 		reconCtrlPtr->floatingRbufs = rbuf;
    145   1.3     oster 	}
    146   1.3     oster 
    147   1.3     oster 	/* create the parity stripe status table */
    148   1.3     oster 	reconCtrlPtr->pssTable = rf_MakeParityStripeStatusTable(raidPtr);
    149   1.3     oster 
    150   1.3     oster 	/* set the initial min head sep counter val */
    151   1.3     oster 	reconCtrlPtr->minHeadSepCounter = 0;
    152   1.3     oster 
    153   1.3     oster 	return (reconCtrlPtr);
    154   1.1     oster }
    155   1.1     oster 
    156  1.25     perry void
    157  1.19     oster rf_FreeReconControl(RF_Raid_t *raidPtr)
    158   1.1     oster {
    159  1.15     oster 	RF_ReconCtrl_t *reconCtrlPtr = raidPtr->reconControl;
    160   1.3     oster 	RF_ReconBuffer_t *t;
    161   1.3     oster 	RF_ReconUnitNum_t i;
    162   1.3     oster 
    163   1.3     oster 	RF_ASSERT(reconCtrlPtr);
    164   1.3     oster 	for (i = 0; i < raidPtr->numCol; i++)
    165   1.3     oster 		if (reconCtrlPtr->perDiskInfo[i].rbuf)
    166   1.3     oster 			rf_FreeReconBuffer(reconCtrlPtr->perDiskInfo[i].rbuf);
    167  1.24     oster 
    168  1.24     oster 	t = reconCtrlPtr->floatingRbufs;
    169  1.24     oster 	while (t) {
    170   1.3     oster 		reconCtrlPtr->floatingRbufs = t->next;
    171   1.3     oster 		rf_FreeReconBuffer(t);
    172  1.24     oster 		t = reconCtrlPtr->floatingRbufs;
    173   1.3     oster 	}
    174  1.24     oster 
    175  1.32       mrg 	rf_destroy_mutex2(reconCtrlPtr->eq_mutex);
    176  1.32       mrg 	rf_destroy_cond2(reconCtrlPtr->eq_cv);
    177  1.32       mrg 
    178   1.3     oster 	rf_FreeReconMap(reconCtrlPtr->reconMap);
    179   1.3     oster 	rf_FreeParityStripeStatusTable(raidPtr, reconCtrlPtr->pssTable);
    180  1.25     perry 	RF_Free(reconCtrlPtr->perDiskInfo,
    181  1.11     oster 		raidPtr->numCol * sizeof(RF_PerDiskReconCtrl_t));
    182   1.3     oster 	RF_Free(reconCtrlPtr, sizeof(*reconCtrlPtr));
    183   1.1     oster }
    184   1.1     oster 
    185   1.1     oster 
    186   1.1     oster /******************************************************************************
    187   1.1     oster  * computes the default head separation limit
    188   1.1     oster  *****************************************************************************/
    189  1.25     perry RF_HeadSepLimit_t
    190  1.19     oster rf_GetDefaultHeadSepLimit(RF_Raid_t *raidPtr)
    191   1.1     oster {
    192   1.3     oster 	RF_HeadSepLimit_t hsl;
    193  1.14  jdolecek 	const RF_LayoutSW_t *lp;
    194   1.1     oster 
    195   1.3     oster 	lp = raidPtr->Layout.map;
    196   1.3     oster 	if (lp->GetDefaultHeadSepLimit == NULL)
    197   1.3     oster 		return (-1);
    198   1.3     oster 	hsl = lp->GetDefaultHeadSepLimit(raidPtr);
    199   1.3     oster 	return (hsl);
    200   1.1     oster }
    201   1.1     oster 
    202   1.1     oster 
    203   1.1     oster /******************************************************************************
    204   1.1     oster  * computes the default number of floating recon buffers
    205   1.1     oster  *****************************************************************************/
    206  1.25     perry int
    207  1.19     oster rf_GetDefaultNumFloatingReconBuffers(RF_Raid_t *raidPtr)
    208   1.1     oster {
    209  1.14  jdolecek 	const RF_LayoutSW_t *lp;
    210   1.3     oster 	int     nrb;
    211   1.1     oster 
    212   1.3     oster 	lp = raidPtr->Layout.map;
    213   1.3     oster 	if (lp->GetDefaultNumFloatingReconBuffers == NULL)
    214   1.3     oster 		return (3 * raidPtr->numCol);
    215   1.3     oster 	nrb = lp->GetDefaultNumFloatingReconBuffers(raidPtr);
    216   1.3     oster 	return (nrb);
    217   1.1     oster }
    218   1.1     oster 
    219   1.1     oster 
    220   1.1     oster /******************************************************************************
    221   1.1     oster  * creates and initializes a reconstruction buffer
    222   1.1     oster  *****************************************************************************/
    223   1.3     oster RF_ReconBuffer_t *
    224  1.19     oster rf_MakeReconBuffer(RF_Raid_t *raidPtr, RF_RowCol_t col, RF_RbufType_t type)
    225   1.1     oster {
    226   1.3     oster 	RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
    227   1.3     oster 	RF_ReconBuffer_t *t;
    228   1.3     oster 	u_int   recon_buffer_size = rf_RaidAddressToByte(raidPtr, layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit);
    229   1.3     oster 
    230  1.22     oster 	t = pool_get(&rf_pools.reconbuffer, PR_WAITOK);
    231  1.28  christos 	RF_Malloc(t->buffer, recon_buffer_size, (void *));
    232   1.3     oster 	t->raidPtr = raidPtr;
    233   1.3     oster 	t->col = col;
    234   1.3     oster 	t->priority = RF_IO_RECON_PRIORITY;
    235   1.3     oster 	t->type = type;
    236   1.3     oster 	t->pssPtr = NULL;
    237   1.3     oster 	t->next = NULL;
    238   1.3     oster 	return (t);
    239   1.1     oster }
    240   1.1     oster /******************************************************************************
    241   1.1     oster  * frees a reconstruction buffer
    242   1.1     oster  *****************************************************************************/
    243  1.25     perry void
    244  1.19     oster rf_FreeReconBuffer(RF_ReconBuffer_t *rbuf)
    245   1.1     oster {
    246   1.3     oster 	RF_Raid_t *raidPtr = rbuf->raidPtr;
    247   1.9     oster 	u_int   recon_buffer_size;
    248   1.9     oster 
    249   1.9     oster 	recon_buffer_size = rf_RaidAddressToByte(raidPtr, raidPtr->Layout.SUsPerRU * raidPtr->Layout.sectorsPerStripeUnit);
    250   1.3     oster 
    251   1.3     oster 	RF_Free(rbuf->buffer, recon_buffer_size);
    252  1.22     oster 	pool_put(&rf_pools.reconbuffer, rbuf);
    253   1.1     oster }
    254   1.1     oster 
    255  1.10     oster #if RF_DEBUG_RECON
    256  1.23     oster XXXX IF you use this, you really want to fix the locking in here.
    257   1.1     oster /******************************************************************************
    258   1.1     oster  * debug only:  sanity check the number of floating recon bufs in use
    259   1.1     oster  *****************************************************************************/
    260  1.25     perry void
    261  1.19     oster rf_CheckFloatingRbufCount(RF_Raid_t *raidPtr, int dolock)
    262   1.1     oster {
    263   1.3     oster 	RF_ReconParityStripeStatus_t *p;
    264   1.3     oster 	RF_PSStatusHeader_t *pssTable;
    265   1.3     oster 	RF_ReconBuffer_t *rbuf;
    266   1.3     oster 	int     i, j, sum = 0;
    267   1.3     oster 
    268   1.3     oster 	if (dolock)
    269  1.15     oster 		RF_LOCK_MUTEX(raidPtr->reconControl->rb_mutex);
    270  1.15     oster 	pssTable = raidPtr->reconControl->pssTable;
    271   1.3     oster 
    272   1.3     oster 	for (i = 0; i < raidPtr->pssTableSize; i++) {
    273   1.3     oster 		RF_LOCK_MUTEX(pssTable[i].mutex);
    274   1.3     oster 		for (p = pssTable[i].chain; p; p = p->next) {
    275   1.3     oster 			rbuf = (RF_ReconBuffer_t *) p->rbuf;
    276   1.3     oster 			if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
    277   1.3     oster 				sum++;
    278   1.3     oster 
    279   1.3     oster 			rbuf = (RF_ReconBuffer_t *) p->writeRbuf;
    280   1.3     oster 			if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
    281   1.3     oster 				sum++;
    282   1.3     oster 
    283   1.3     oster 			for (j = 0; j < p->xorBufCount; j++) {
    284   1.3     oster 				rbuf = (RF_ReconBuffer_t *) p->rbufsForXor[j];
    285   1.3     oster 				RF_ASSERT(rbuf);
    286   1.3     oster 				if (rbuf->type == RF_RBUF_TYPE_FLOATING)
    287   1.3     oster 					sum++;
    288   1.3     oster 			}
    289   1.3     oster 		}
    290   1.3     oster 		RF_UNLOCK_MUTEX(pssTable[i].mutex);
    291   1.3     oster 	}
    292   1.3     oster 
    293  1.25     perry 	for (rbuf = raidPtr->reconControl->floatingRbufs; rbuf;
    294  1.11     oster 	     rbuf = rbuf->next) {
    295   1.3     oster 		if (rbuf->type == RF_RBUF_TYPE_FLOATING)
    296   1.3     oster 			sum++;
    297   1.3     oster 	}
    298  1.25     perry 	for (rbuf = raidPtr->reconControl->committedRbufs; rbuf;
    299  1.11     oster 	     rbuf = rbuf->next) {
    300   1.3     oster 		if (rbuf->type == RF_RBUF_TYPE_FLOATING)
    301   1.3     oster 			sum++;
    302   1.3     oster 	}
    303  1.25     perry 	for (rbuf = raidPtr->reconControl->fullBufferList; rbuf;
    304  1.11     oster 	     rbuf = rbuf->next) {
    305   1.3     oster 		if (rbuf->type == RF_RBUF_TYPE_FLOATING)
    306   1.3     oster 			sum++;
    307   1.3     oster 	}
    308   1.3     oster 	RF_ASSERT(sum == raidPtr->numFloatingReconBufs);
    309   1.1     oster 
    310   1.3     oster 	if (dolock)
    311  1.15     oster 		RF_UNLOCK_MUTEX(raidPtr->reconControl->rb_mutex);
    312   1.1     oster }
    313   1.7     oster #endif
    314   1.7     oster 
    315