Home | History | Annotate | Line # | Download | only in raidframe
rf_reconutil.c revision 1.26.10.1
      1  1.26.10.1      elad /*	$NetBSD: rf_reconutil.c,v 1.26.10.1 2006/05/11 23:29:58 elad Exp $	*/
      2        1.1     oster /*
      3        1.1     oster  * Copyright (c) 1995 Carnegie-Mellon University.
      4        1.1     oster  * All rights reserved.
      5        1.1     oster  *
      6        1.1     oster  * Author: Mark Holland
      7        1.1     oster  *
      8        1.1     oster  * Permission to use, copy, modify and distribute this software and
      9        1.1     oster  * its documentation is hereby granted, provided that both the copyright
     10        1.1     oster  * notice and this permission notice appear in all copies of the
     11        1.1     oster  * software, derivative works or modified versions, and any portions
     12        1.1     oster  * thereof, and that both notices appear in supporting documentation.
     13        1.1     oster  *
     14        1.1     oster  * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
     15        1.1     oster  * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
     16        1.1     oster  * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
     17        1.1     oster  *
     18        1.1     oster  * Carnegie Mellon requests users of this software to return to
     19        1.1     oster  *
     20        1.1     oster  *  Software Distribution Coordinator  or  Software.Distribution (at) CS.CMU.EDU
     21        1.1     oster  *  School of Computer Science
     22        1.1     oster  *  Carnegie Mellon University
     23        1.1     oster  *  Pittsburgh PA 15213-3890
     24        1.1     oster  *
     25        1.1     oster  * any improvements or extensions that they make and grant Carnegie the
     26        1.1     oster  * rights to redistribute these changes.
     27        1.1     oster  */
     28        1.1     oster 
     29        1.1     oster /********************************************
     30        1.1     oster  * rf_reconutil.c -- reconstruction utilities
     31        1.1     oster  ********************************************/
     32        1.5     lukem 
     33        1.5     lukem #include <sys/cdefs.h>
     34  1.26.10.1      elad __KERNEL_RCSID(0, "$NetBSD: rf_reconutil.c,v 1.26.10.1 2006/05/11 23:29:58 elad Exp $");
     35        1.1     oster 
     36        1.4     oster #include <dev/raidframe/raidframevar.h>
     37        1.4     oster 
     38        1.1     oster #include "rf_raid.h"
     39        1.1     oster #include "rf_desc.h"
     40        1.1     oster #include "rf_reconutil.h"
     41        1.1     oster #include "rf_reconbuffer.h"
     42        1.1     oster #include "rf_general.h"
     43        1.1     oster #include "rf_decluster.h"
     44        1.1     oster #include "rf_raid5_rotatedspare.h"
     45        1.1     oster #include "rf_interdecluster.h"
     46        1.1     oster #include "rf_chaindecluster.h"
     47        1.1     oster 
     48        1.1     oster /*******************************************************************
     49        1.1     oster  * allocates/frees the reconstruction control information structures
     50        1.1     oster  *******************************************************************/
     51       1.19     oster 
     52       1.19     oster /* fcol - failed column
     53       1.19     oster  * scol - identifies which spare we are using
     54       1.19     oster  */
     55       1.19     oster 
     56        1.3     oster RF_ReconCtrl_t *
     57       1.25     perry rf_MakeReconControl(RF_RaidReconDesc_t *reconDesc,
     58       1.19     oster 		    RF_RowCol_t fcol, RF_RowCol_t scol)
     59        1.1     oster {
     60        1.3     oster 	RF_Raid_t *raidPtr = reconDesc->raidPtr;
     61        1.3     oster 	RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
     62        1.3     oster 	RF_ReconUnitCount_t RUsPerPU = layoutPtr->SUsPerPU / layoutPtr->SUsPerRU;
     63        1.3     oster 	RF_ReconUnitCount_t numSpareRUs;
     64        1.3     oster 	RF_ReconCtrl_t *reconCtrlPtr;
     65        1.3     oster 	RF_ReconBuffer_t *rbuf;
     66       1.14  jdolecek 	const RF_LayoutSW_t *lp;
     67       1.12     oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
     68       1.12     oster 	int     retcode;
     69       1.12     oster #endif
     70        1.3     oster 	RF_RowCol_t i;
     71        1.3     oster 
     72        1.3     oster 	lp = raidPtr->Layout.map;
     73        1.3     oster 
     74        1.3     oster 	/* make and zero the global reconstruction structure and the per-disk
     75        1.3     oster 	 * structure */
     76       1.16     oster 	RF_Malloc(reconCtrlPtr, sizeof(RF_ReconCtrl_t), (RF_ReconCtrl_t *));
     77       1.11     oster 
     78       1.11     oster 	/* note: this zeros the perDiskInfo */
     79       1.16     oster 	RF_Malloc(reconCtrlPtr->perDiskInfo, raidPtr->numCol *
     80       1.11     oster 		  sizeof(RF_PerDiskReconCtrl_t), (RF_PerDiskReconCtrl_t *));
     81        1.3     oster 	reconCtrlPtr->reconDesc = reconDesc;
     82        1.3     oster 	reconCtrlPtr->fcol = fcol;
     83        1.3     oster 	reconCtrlPtr->spareCol = scol;
     84        1.3     oster 	reconCtrlPtr->lastPSID = layoutPtr->numStripe / layoutPtr->SUsPerPU;
     85        1.3     oster 	reconCtrlPtr->percentComplete = 0;
     86       1.24     oster 	reconCtrlPtr->error = 0;
     87       1.24     oster 	reconCtrlPtr->pending_writes = 0;
     88        1.3     oster 
     89        1.3     oster 	/* initialize each per-disk recon information structure */
     90        1.3     oster 	for (i = 0; i < raidPtr->numCol; i++) {
     91        1.3     oster 		reconCtrlPtr->perDiskInfo[i].reconCtrl = reconCtrlPtr;
     92        1.3     oster 		reconCtrlPtr->perDiskInfo[i].col = i;
     93       1.11     oster 		/* make it appear as if we just finished an RU */
     94       1.25     perry 		reconCtrlPtr->perDiskInfo[i].curPSID = -1;
     95        1.3     oster 		reconCtrlPtr->perDiskInfo[i].ru_count = RUsPerPU - 1;
     96        1.3     oster 	}
     97        1.3     oster 
     98        1.3     oster 	/* Get the number of spare units per disk and the sparemap in case
     99        1.3     oster 	 * spare is distributed  */
    100        1.3     oster 
    101        1.3     oster 	if (lp->GetNumSpareRUs) {
    102        1.3     oster 		numSpareRUs = lp->GetNumSpareRUs(raidPtr);
    103        1.3     oster 	} else {
    104        1.3     oster 		numSpareRUs = 0;
    105        1.3     oster 	}
    106        1.3     oster 
    107       1.12     oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
    108        1.3     oster 	/*
    109        1.3     oster          * Not all distributed sparing archs need dynamic mappings
    110        1.3     oster          */
    111        1.3     oster 	if (lp->InstallSpareTable) {
    112  1.26.10.1      elad 		retcode = rf_InstallSpareTable(raidPtr, 0, fcol);
    113        1.3     oster 		if (retcode) {
    114        1.3     oster 			RF_PANIC();	/* XXX fix this */
    115        1.3     oster 		}
    116        1.3     oster 	}
    117       1.12     oster #endif
    118        1.3     oster 	/* make the reconstruction map */
    119        1.3     oster 	reconCtrlPtr->reconMap = rf_MakeReconMap(raidPtr, (int) (layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit),
    120        1.3     oster 	    raidPtr->sectorsPerDisk, numSpareRUs);
    121        1.3     oster 
    122        1.3     oster 	/* make the per-disk reconstruction buffers */
    123        1.3     oster 	for (i = 0; i < raidPtr->numCol; i++) {
    124       1.15     oster 		reconCtrlPtr->perDiskInfo[i].rbuf = (i == fcol) ? NULL : rf_MakeReconBuffer(raidPtr, i, RF_RBUF_TYPE_EXCLUSIVE);
    125        1.3     oster 	}
    126        1.3     oster 
    127        1.3     oster 	/* initialize the event queue */
    128       1.17     oster 	simple_lock_init(&reconCtrlPtr->eq_mutex);
    129       1.17     oster 
    130        1.3     oster 	reconCtrlPtr->eventQueue = NULL;
    131        1.3     oster 	reconCtrlPtr->eq_count = 0;
    132        1.3     oster 
    133        1.3     oster 	/* make the floating recon buffers and append them to the free list */
    134       1.17     oster 	simple_lock_init(&reconCtrlPtr->rb_mutex);
    135       1.17     oster 
    136        1.3     oster 	reconCtrlPtr->fullBufferList = NULL;
    137        1.3     oster 	reconCtrlPtr->floatingRbufs = NULL;
    138        1.3     oster 	reconCtrlPtr->committedRbufs = NULL;
    139        1.3     oster 	for (i = 0; i < raidPtr->numFloatingReconBufs; i++) {
    140       1.25     perry 		rbuf = rf_MakeReconBuffer(raidPtr, fcol,
    141       1.11     oster 					  RF_RBUF_TYPE_FLOATING);
    142        1.3     oster 		rbuf->next = reconCtrlPtr->floatingRbufs;
    143        1.3     oster 		reconCtrlPtr->floatingRbufs = rbuf;
    144        1.3     oster 	}
    145        1.3     oster 
    146        1.3     oster 	/* create the parity stripe status table */
    147        1.3     oster 	reconCtrlPtr->pssTable = rf_MakeParityStripeStatusTable(raidPtr);
    148        1.3     oster 
    149        1.3     oster 	/* set the initial min head sep counter val */
    150        1.3     oster 	reconCtrlPtr->minHeadSepCounter = 0;
    151        1.3     oster 
    152        1.3     oster 	return (reconCtrlPtr);
    153        1.1     oster }
    154        1.1     oster 
    155       1.25     perry void
    156       1.19     oster rf_FreeReconControl(RF_Raid_t *raidPtr)
    157        1.1     oster {
    158       1.15     oster 	RF_ReconCtrl_t *reconCtrlPtr = raidPtr->reconControl;
    159        1.3     oster 	RF_ReconBuffer_t *t;
    160        1.3     oster 	RF_ReconUnitNum_t i;
    161        1.3     oster 
    162        1.3     oster 	RF_ASSERT(reconCtrlPtr);
    163        1.3     oster 	for (i = 0; i < raidPtr->numCol; i++)
    164        1.3     oster 		if (reconCtrlPtr->perDiskInfo[i].rbuf)
    165        1.3     oster 			rf_FreeReconBuffer(reconCtrlPtr->perDiskInfo[i].rbuf);
    166       1.24     oster 
    167       1.24     oster 	t = reconCtrlPtr->floatingRbufs;
    168       1.24     oster 	while (t) {
    169        1.3     oster 		reconCtrlPtr->floatingRbufs = t->next;
    170        1.3     oster 		rf_FreeReconBuffer(t);
    171       1.24     oster 		t = reconCtrlPtr->floatingRbufs;
    172        1.3     oster 	}
    173       1.24     oster 
    174        1.3     oster 	rf_FreeReconMap(reconCtrlPtr->reconMap);
    175        1.3     oster 	rf_FreeParityStripeStatusTable(raidPtr, reconCtrlPtr->pssTable);
    176       1.25     perry 	RF_Free(reconCtrlPtr->perDiskInfo,
    177       1.11     oster 		raidPtr->numCol * sizeof(RF_PerDiskReconCtrl_t));
    178        1.3     oster 	RF_Free(reconCtrlPtr, sizeof(*reconCtrlPtr));
    179        1.1     oster }
    180        1.1     oster 
    181        1.1     oster 
    182        1.1     oster /******************************************************************************
    183        1.1     oster  * computes the default head separation limit
    184        1.1     oster  *****************************************************************************/
    185       1.25     perry RF_HeadSepLimit_t
    186       1.19     oster rf_GetDefaultHeadSepLimit(RF_Raid_t *raidPtr)
    187        1.1     oster {
    188        1.3     oster 	RF_HeadSepLimit_t hsl;
    189       1.14  jdolecek 	const RF_LayoutSW_t *lp;
    190        1.1     oster 
    191        1.3     oster 	lp = raidPtr->Layout.map;
    192        1.3     oster 	if (lp->GetDefaultHeadSepLimit == NULL)
    193        1.3     oster 		return (-1);
    194        1.3     oster 	hsl = lp->GetDefaultHeadSepLimit(raidPtr);
    195        1.3     oster 	return (hsl);
    196        1.1     oster }
    197        1.1     oster 
    198        1.1     oster 
    199        1.1     oster /******************************************************************************
    200        1.1     oster  * computes the default number of floating recon buffers
    201        1.1     oster  *****************************************************************************/
    202       1.25     perry int
    203       1.19     oster rf_GetDefaultNumFloatingReconBuffers(RF_Raid_t *raidPtr)
    204        1.1     oster {
    205       1.14  jdolecek 	const RF_LayoutSW_t *lp;
    206        1.3     oster 	int     nrb;
    207        1.1     oster 
    208        1.3     oster 	lp = raidPtr->Layout.map;
    209        1.3     oster 	if (lp->GetDefaultNumFloatingReconBuffers == NULL)
    210        1.3     oster 		return (3 * raidPtr->numCol);
    211        1.3     oster 	nrb = lp->GetDefaultNumFloatingReconBuffers(raidPtr);
    212        1.3     oster 	return (nrb);
    213        1.1     oster }
    214        1.1     oster 
    215        1.1     oster 
    216        1.1     oster /******************************************************************************
    217        1.1     oster  * creates and initializes a reconstruction buffer
    218        1.1     oster  *****************************************************************************/
    219        1.3     oster RF_ReconBuffer_t *
    220       1.19     oster rf_MakeReconBuffer(RF_Raid_t *raidPtr, RF_RowCol_t col, RF_RbufType_t type)
    221        1.1     oster {
    222        1.3     oster 	RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
    223        1.3     oster 	RF_ReconBuffer_t *t;
    224        1.3     oster 	u_int   recon_buffer_size = rf_RaidAddressToByte(raidPtr, layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit);
    225        1.3     oster 
    226       1.22     oster 	t = pool_get(&rf_pools.reconbuffer, PR_WAITOK);
    227        1.3     oster 	RF_Malloc(t->buffer, recon_buffer_size, (caddr_t));
    228        1.3     oster 	t->raidPtr = raidPtr;
    229        1.3     oster 	t->col = col;
    230        1.3     oster 	t->priority = RF_IO_RECON_PRIORITY;
    231        1.3     oster 	t->type = type;
    232        1.3     oster 	t->pssPtr = NULL;
    233        1.3     oster 	t->next = NULL;
    234        1.3     oster 	return (t);
    235        1.1     oster }
    236        1.1     oster /******************************************************************************
    237        1.1     oster  * frees a reconstruction buffer
    238        1.1     oster  *****************************************************************************/
    239       1.25     perry void
    240       1.19     oster rf_FreeReconBuffer(RF_ReconBuffer_t *rbuf)
    241        1.1     oster {
    242        1.3     oster 	RF_Raid_t *raidPtr = rbuf->raidPtr;
    243        1.9     oster 	u_int   recon_buffer_size;
    244        1.9     oster 
    245        1.9     oster 	recon_buffer_size = rf_RaidAddressToByte(raidPtr, raidPtr->Layout.SUsPerRU * raidPtr->Layout.sectorsPerStripeUnit);
    246        1.3     oster 
    247        1.3     oster 	RF_Free(rbuf->buffer, recon_buffer_size);
    248       1.22     oster 	pool_put(&rf_pools.reconbuffer, rbuf);
    249        1.1     oster }
    250        1.1     oster 
    251       1.10     oster #if RF_DEBUG_RECON
    252       1.23     oster XXXX IF you use this, you really want to fix the locking in here.
    253        1.1     oster /******************************************************************************
    254        1.1     oster  * debug only:  sanity check the number of floating recon bufs in use
    255        1.1     oster  *****************************************************************************/
    256       1.25     perry void
    257       1.19     oster rf_CheckFloatingRbufCount(RF_Raid_t *raidPtr, int dolock)
    258        1.1     oster {
    259        1.3     oster 	RF_ReconParityStripeStatus_t *p;
    260        1.3     oster 	RF_PSStatusHeader_t *pssTable;
    261        1.3     oster 	RF_ReconBuffer_t *rbuf;
    262        1.3     oster 	int     i, j, sum = 0;
    263        1.3     oster 
    264        1.3     oster 	if (dolock)
    265       1.15     oster 		RF_LOCK_MUTEX(raidPtr->reconControl->rb_mutex);
    266       1.15     oster 	pssTable = raidPtr->reconControl->pssTable;
    267        1.3     oster 
    268        1.3     oster 	for (i = 0; i < raidPtr->pssTableSize; i++) {
    269        1.3     oster 		RF_LOCK_MUTEX(pssTable[i].mutex);
    270        1.3     oster 		for (p = pssTable[i].chain; p; p = p->next) {
    271        1.3     oster 			rbuf = (RF_ReconBuffer_t *) p->rbuf;
    272        1.3     oster 			if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
    273        1.3     oster 				sum++;
    274        1.3     oster 
    275        1.3     oster 			rbuf = (RF_ReconBuffer_t *) p->writeRbuf;
    276        1.3     oster 			if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
    277        1.3     oster 				sum++;
    278        1.3     oster 
    279        1.3     oster 			for (j = 0; j < p->xorBufCount; j++) {
    280        1.3     oster 				rbuf = (RF_ReconBuffer_t *) p->rbufsForXor[j];
    281        1.3     oster 				RF_ASSERT(rbuf);
    282        1.3     oster 				if (rbuf->type == RF_RBUF_TYPE_FLOATING)
    283        1.3     oster 					sum++;
    284        1.3     oster 			}
    285        1.3     oster 		}
    286        1.3     oster 		RF_UNLOCK_MUTEX(pssTable[i].mutex);
    287        1.3     oster 	}
    288        1.3     oster 
    289       1.25     perry 	for (rbuf = raidPtr->reconControl->floatingRbufs; rbuf;
    290       1.11     oster 	     rbuf = rbuf->next) {
    291        1.3     oster 		if (rbuf->type == RF_RBUF_TYPE_FLOATING)
    292        1.3     oster 			sum++;
    293        1.3     oster 	}
    294       1.25     perry 	for (rbuf = raidPtr->reconControl->committedRbufs; rbuf;
    295       1.11     oster 	     rbuf = rbuf->next) {
    296        1.3     oster 		if (rbuf->type == RF_RBUF_TYPE_FLOATING)
    297        1.3     oster 			sum++;
    298        1.3     oster 	}
    299       1.25     perry 	for (rbuf = raidPtr->reconControl->fullBufferList; rbuf;
    300       1.11     oster 	     rbuf = rbuf->next) {
    301        1.3     oster 		if (rbuf->type == RF_RBUF_TYPE_FLOATING)
    302        1.3     oster 			sum++;
    303        1.3     oster 	}
    304        1.3     oster 	RF_ASSERT(sum == raidPtr->numFloatingReconBufs);
    305        1.1     oster 
    306        1.3     oster 	if (dolock)
    307       1.15     oster 		RF_UNLOCK_MUTEX(raidPtr->reconControl->rb_mutex);
    308        1.1     oster }
    309        1.7     oster #endif
    310        1.7     oster 
    311