Home | History | Annotate | Line # | Download | only in raidframe
rf_reconmap.c revision 1.3
      1  1.3  oster /*	$NetBSD: rf_reconmap.c,v 1.3 1999/01/26 04:40:03 oster Exp $	*/
      2  1.1  oster /*
      3  1.1  oster  * Copyright (c) 1995 Carnegie-Mellon University.
      4  1.1  oster  * All rights reserved.
      5  1.1  oster  *
      6  1.1  oster  * Author: Mark Holland
      7  1.1  oster  *
      8  1.1  oster  * Permission to use, copy, modify and distribute this software and
      9  1.1  oster  * its documentation is hereby granted, provided that both the copyright
     10  1.1  oster  * notice and this permission notice appear in all copies of the
     11  1.1  oster  * software, derivative works or modified versions, and any portions
     12  1.1  oster  * thereof, and that both notices appear in supporting documentation.
     13  1.1  oster  *
     14  1.1  oster  * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
     15  1.1  oster  * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
     16  1.1  oster  * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
     17  1.1  oster  *
     18  1.1  oster  * Carnegie Mellon requests users of this software to return to
     19  1.1  oster  *
     20  1.1  oster  *  Software Distribution Coordinator  or  Software.Distribution (at) CS.CMU.EDU
     21  1.1  oster  *  School of Computer Science
     22  1.1  oster  *  Carnegie Mellon University
     23  1.1  oster  *  Pittsburgh PA 15213-3890
     24  1.1  oster  *
     25  1.1  oster  * any improvements or extensions that they make and grant Carnegie the
     26  1.1  oster  * rights to redistribute these changes.
     27  1.1  oster  */
     28  1.1  oster 
     29  1.1  oster /*************************************************************************
     30  1.1  oster  * rf_reconmap.c
     31  1.1  oster  *
     32  1.1  oster  * code to maintain a map of what sectors have/have not been reconstructed
     33  1.1  oster  *
     34  1.1  oster  *************************************************************************/
     35  1.1  oster 
     36  1.1  oster #include "rf_raid.h"
     37  1.1  oster #include <sys/time.h>
     38  1.1  oster #include "rf_general.h"
     39  1.1  oster #include "rf_utils.h"
     40  1.1  oster #include "rf_sys.h"
     41  1.1  oster 
/*
 * Sentinel values stored at the head of a per-RU status list.  Neither is
 * a dereferenceable pointer, so callers must test for them before following
 * the list.
 *
 *   RU_ALL      the reconstruction unit is completely reconstructed
 *   RU_NOTHING  nothing in the reconstruction unit has been reconstructed;
 *               this must stay zero because rf_MakeReconMap() clears the
 *               status array with bzero()
 */
#define RU_ALL      ((RF_ReconMapListElem_t *) -1)
#define RU_NOTHING  ((RF_ReconMapListElem_t *) 0)

/* terminator for the 'next' chain of a status list */
#define RU_NIL      ((RF_ReconMapListElem_t *) 0)
     54  1.1  oster 
     55  1.1  oster 
     56  1.1  oster static void compact_stat_entry(RF_Raid_t *raidPtr, RF_ReconMap_t *mapPtr,
     57  1.1  oster 	int i);
     58  1.1  oster static void crunch_list(RF_ReconMap_t *mapPtr, RF_ReconMapListElem_t *listPtr);
     59  1.1  oster static RF_ReconMapListElem_t *MakeReconMapListElem(RF_SectorNum_t startSector,
     60  1.1  oster 	RF_SectorNum_t stopSector, RF_ReconMapListElem_t *next);
     61  1.1  oster static void FreeReconMapListElem(RF_ReconMap_t *mapPtr,
     62  1.1  oster 	RF_ReconMapListElem_t *p);
     63  1.1  oster static void update_size(RF_ReconMap_t *mapPtr, int size);
     64  1.1  oster static void PrintList(RF_ReconMapListElem_t *listPtr);
     65  1.1  oster 
     66  1.1  oster /*-----------------------------------------------------------------------------
     67  1.1  oster  *
     68  1.1  oster  * Creates and initializes new Reconstruction map
     69  1.1  oster  *
     70  1.1  oster  *-----------------------------------------------------------------------------*/
     71  1.1  oster 
     72  1.1  oster RF_ReconMap_t *rf_MakeReconMap(raidPtr, ru_sectors, disk_sectors, spareUnitsPerDisk)
     73  1.1  oster   RF_Raid_t            *raidPtr;
     74  1.1  oster   RF_SectorCount_t      ru_sectors;        /* size of reconstruction unit in sectors */
     75  1.1  oster   RF_SectorCount_t      disk_sectors;      /* size of disk in sectors */
     76  1.1  oster   RF_ReconUnitCount_t   spareUnitsPerDisk; /* zero unless distributed sparing */
     77  1.1  oster {
     78  1.1  oster   RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
     79  1.1  oster   RF_ReconUnitCount_t num_rus = layoutPtr->stripeUnitsPerDisk / layoutPtr->SUsPerRU;
     80  1.1  oster   RF_ReconMap_t *p;
     81  1.1  oster   int rc;
     82  1.1  oster 
     83  1.1  oster   RF_Malloc(p, sizeof(RF_ReconMap_t), (RF_ReconMap_t *));
     84  1.1  oster   p->sectorsPerReconUnit = ru_sectors;
     85  1.1  oster   p->sectorsInDisk = disk_sectors;
     86  1.1  oster 
     87  1.1  oster   p->totalRUs = num_rus;
     88  1.1  oster   p->spareRUs = spareUnitsPerDisk;
     89  1.1  oster   p->unitsLeft = num_rus - spareUnitsPerDisk;
     90  1.1  oster 
     91  1.1  oster   RF_Malloc(p->status, num_rus * sizeof(RF_ReconMapListElem_t *), (RF_ReconMapListElem_t **));
     92  1.1  oster   RF_ASSERT(p->status != (RF_ReconMapListElem_t **) NULL);
     93  1.1  oster 
     94  1.1  oster   (void) bzero((char *) p->status, num_rus * sizeof(RF_ReconMapListElem_t *));
     95  1.1  oster 
     96  1.1  oster   p->size = sizeof(RF_ReconMap_t) + num_rus * sizeof(RF_ReconMapListElem_t *);
     97  1.1  oster   p->maxSize = p->size;
     98  1.1  oster 
     99  1.1  oster   rc = rf_mutex_init(&p->mutex);
    100  1.1  oster   if (rc) {
    101  1.1  oster     RF_ERRORMSG3("Unable to init mutex file %s line %d rc=%d\n", __FILE__,
    102  1.1  oster       __LINE__, rc);
    103  1.1  oster     RF_Free(p->status, num_rus * sizeof(RF_ReconMapListElem_t *));
    104  1.1  oster     RF_Free(p, sizeof(RF_ReconMap_t));
    105  1.1  oster     return(NULL);
    106  1.1  oster   }
    107  1.1  oster   return(p);
    108  1.1  oster }
    109  1.1  oster 
    110  1.1  oster 
    111  1.1  oster /*-----------------------------------------------------------------------------
    112  1.1  oster  *
    113  1.1  oster  * marks a new set of sectors as reconstructed.  All the possible mergings get
    114  1.1  oster  * complicated.  To simplify matters, the approach I take is to just dump
    115  1.1  oster  * something into the list, and then clean it up (i.e. merge elements and
    116  1.1  oster  * eliminate redundant ones) in a second pass over the list (compact_stat_entry()).
    117  1.1  oster  * Not 100% efficient, since a structure can be allocated and then immediately
    118  1.1  oster  * freed, but it keeps this code from becoming (more of) a nightmare of
    119  1.1  oster  * special cases.  The only thing that compact_stat_entry() assumes is that the
    120  1.1  oster  * list is sorted by startSector, and so this is the only condition I maintain
    121  1.1  oster  * here.  (MCH)
    122  1.1  oster  *
    123  1.1  oster  *-----------------------------------------------------------------------------*/
    124  1.1  oster 
    125  1.1  oster void rf_ReconMapUpdate(raidPtr, mapPtr, startSector, stopSector)
    126  1.1  oster   RF_Raid_t       *raidPtr;
    127  1.1  oster   RF_ReconMap_t   *mapPtr;
    128  1.1  oster   RF_SectorNum_t   startSector;
    129  1.1  oster   RF_SectorNum_t   stopSector;
    130  1.1  oster {
    131  1.1  oster   RF_SectorCount_t sectorsPerReconUnit = mapPtr->sectorsPerReconUnit;
    132  1.1  oster   RF_SectorNum_t i, first_in_RU, last_in_RU;
    133  1.1  oster   RF_ReconMapListElem_t *p, *pt;
    134  1.1  oster 
    135  1.1  oster   RF_LOCK_MUTEX(mapPtr->mutex);
    136  1.1  oster   RF_ASSERT(startSector >=0 && stopSector < mapPtr->sectorsInDisk && stopSector > startSector);
    137  1.1  oster 
    138  1.1  oster   while (startSector <= stopSector) {
    139  1.1  oster     i = startSector/mapPtr->sectorsPerReconUnit;
    140  1.1  oster     first_in_RU = i*sectorsPerReconUnit;
    141  1.1  oster     last_in_RU  = first_in_RU + sectorsPerReconUnit -1 ;
    142  1.1  oster     p = mapPtr->status[i];
    143  1.1  oster     if (p!=RU_ALL) {
    144  1.1  oster       if (p==RU_NOTHING || p->startSector > startSector ) {	/* insert at front of list */
    145  1.1  oster 
    146  1.1  oster 	mapPtr->status[i] = MakeReconMapListElem(startSector, RF_MIN(stopSector,last_in_RU), (p==RU_NOTHING) ? NULL : p);
    147  1.1  oster 	update_size(mapPtr, sizeof(RF_ReconMapListElem_t));
    148  1.1  oster 
    149  1.1  oster       } else {						/* general case */
    150  1.1  oster 	do {						/* search for place to insert */
    151  1.1  oster 	  pt = p; p = p->next;
    152  1.1  oster 	} while (p && (p->startSector < startSector));
    153  1.1  oster 	pt->next = MakeReconMapListElem(startSector,RF_MIN(stopSector,last_in_RU),p);
    154  1.1  oster 	update_size(mapPtr, sizeof(RF_ReconMapListElem_t));
    155  1.1  oster       }
    156  1.1  oster       compact_stat_entry(raidPtr, mapPtr, i);
    157  1.1  oster     }
    158  1.1  oster     startSector = RF_MIN(stopSector, last_in_RU) +1;
    159  1.1  oster   }
    160  1.1  oster   RF_UNLOCK_MUTEX(mapPtr->mutex);
    161  1.1  oster }
    162  1.1  oster 
    163  1.1  oster 
    164  1.1  oster 
    165  1.1  oster /*-----------------------------------------------------------------------------
    166  1.1  oster  *
    167  1.1  oster  * performs whatever list compactions can be done, and frees any space
    168  1.1  oster  * that is no longer necessary.  Assumes only that the list is sorted
    169  1.1  oster  * by startSector.  crunch_list() compacts a single list as much as possible,
    170  1.1  oster  * and the second block of code deletes the entire list if possible.
    171  1.1  oster  * crunch_list() is also called from MakeReconMapAccessList().
    172  1.1  oster  *
    173  1.1  oster  * When a recon unit is detected to be fully reconstructed, we set the
    174  1.1  oster  * corresponding bit in the parity stripe map so that the head follow
    175  1.1  oster  * code will not select this parity stripe again.  This is redundant (but
    176  1.1  oster  * harmless) when compact_stat_entry is called from the reconstruction code,
    177  1.1  oster  * but necessary when called from the user-write code.
    178  1.1  oster  *
    179  1.1  oster  *-----------------------------------------------------------------------------*/
    180  1.1  oster 
    181  1.1  oster static void compact_stat_entry(raidPtr, mapPtr, i)
    182  1.1  oster   RF_Raid_t      *raidPtr;
    183  1.1  oster   RF_ReconMap_t  *mapPtr;
    184  1.1  oster   int             i;
    185  1.1  oster {
    186  1.1  oster   RF_SectorCount_t sectorsPerReconUnit = mapPtr->sectorsPerReconUnit;
    187  1.1  oster   RF_ReconMapListElem_t *p = mapPtr->status[i];
    188  1.1  oster 
    189  1.1  oster   crunch_list(mapPtr, p);
    190  1.1  oster 
    191  1.1  oster   if ((p->startSector == i*sectorsPerReconUnit) &&
    192  1.1  oster       (p->stopSector == i*sectorsPerReconUnit +sectorsPerReconUnit -1)) {
    193  1.1  oster     mapPtr->status[i] = RU_ALL;
    194  1.1  oster     mapPtr->unitsLeft--;
    195  1.1  oster     FreeReconMapListElem(mapPtr,p);
    196  1.1  oster   }
    197  1.1  oster }
    198  1.1  oster 
    199  1.1  oster static void crunch_list(mapPtr, listPtr)
    200  1.1  oster   RF_ReconMap_t          *mapPtr;
    201  1.1  oster   RF_ReconMapListElem_t  *listPtr;
    202  1.1  oster {
    203  1.1  oster   RF_ReconMapListElem_t *pt, *p = listPtr;
    204  1.1  oster 
    205  1.1  oster   if (!p) return;
    206  1.1  oster   pt = p;  p = p->next;
    207  1.1  oster   while (p) {
    208  1.1  oster     if (pt->stopSector >= p->startSector-1) {
    209  1.1  oster       pt->stopSector = RF_MAX(pt->stopSector, p->stopSector);
    210  1.1  oster       pt->next = p->next;
    211  1.1  oster       FreeReconMapListElem(mapPtr, p);
    212  1.1  oster       p = pt->next;
    213  1.1  oster     }
    214  1.1  oster     else {
    215  1.1  oster       pt = p;
    216  1.1  oster       p = p->next;
    217  1.1  oster     }
    218  1.1  oster   }
    219  1.1  oster }
    220  1.1  oster 
    221  1.1  oster /*-----------------------------------------------------------------------------
    222  1.1  oster  *
    223  1.1  oster  * Allocate and fill a new list element
    224  1.1  oster  *
    225  1.1  oster  *-----------------------------------------------------------------------------*/
    226  1.1  oster 
    227  1.1  oster static RF_ReconMapListElem_t *MakeReconMapListElem(
    228  1.1  oster   RF_SectorNum_t          startSector,
    229  1.1  oster   RF_SectorNum_t          stopSector,
    230  1.1  oster   RF_ReconMapListElem_t  *next)
    231  1.1  oster {
    232  1.1  oster   RF_ReconMapListElem_t *p;
    233  1.1  oster 
    234  1.1  oster   RF_Malloc(p, sizeof(RF_ReconMapListElem_t), (RF_ReconMapListElem_t *));
    235  1.1  oster   if (p == NULL)
    236  1.1  oster     return(NULL);
    237  1.1  oster   p->startSector = startSector;
    238  1.1  oster   p->stopSector = stopSector;
    239  1.1  oster   p->next = next;
    240  1.1  oster   return(p);
    241  1.1  oster }
    242  1.1  oster 
    243  1.1  oster /*-----------------------------------------------------------------------------
    244  1.1  oster  *
    245  1.1  oster  * Free a list element
    246  1.1  oster  *
    247  1.1  oster  *-----------------------------------------------------------------------------*/
    248  1.1  oster 
    249  1.1  oster static void FreeReconMapListElem(mapPtr,p)
    250  1.1  oster   RF_ReconMap_t          *mapPtr;
    251  1.1  oster   RF_ReconMapListElem_t  *p;
    252  1.1  oster {
    253  1.1  oster   int delta;
    254  1.1  oster 
    255  1.1  oster   if (mapPtr) {
    256  1.1  oster     delta = 0 - (int)sizeof(RF_ReconMapListElem_t);
    257  1.1  oster     update_size(mapPtr, delta);
    258  1.1  oster   }
    259  1.1  oster   RF_Free(p, sizeof(*p));
    260  1.1  oster }
    261  1.1  oster 
    262  1.1  oster /*-----------------------------------------------------------------------------
    263  1.1  oster  *
    264  1.1  oster  * Free an entire status structure.  Inefficient, but can be called at any time.
    265  1.1  oster  *
    266  1.1  oster  *-----------------------------------------------------------------------------*/
    267  1.1  oster void rf_FreeReconMap(mapPtr)
    268  1.1  oster   RF_ReconMap_t  *mapPtr;
    269  1.1  oster {
    270  1.1  oster   RF_ReconMapListElem_t *p, *q;
    271  1.1  oster   RF_ReconUnitCount_t numRUs;
    272  1.1  oster   RF_ReconUnitNum_t i;
    273  1.1  oster 
    274  1.1  oster   numRUs = mapPtr->sectorsInDisk / mapPtr->sectorsPerReconUnit;
    275  1.1  oster   if (mapPtr->sectorsInDisk % mapPtr->sectorsPerReconUnit)
    276  1.1  oster     numRUs++;
    277  1.1  oster 
    278  1.1  oster   for (i=0; i<numRUs; i++) {
    279  1.1  oster     p = mapPtr->status[i];
    280  1.1  oster     while (p != RU_NOTHING && p != RU_ALL) {
    281  1.1  oster       q = p; p = p->next;
    282  1.1  oster       RF_Free(q, sizeof(*q));
    283  1.1  oster     }
    284  1.1  oster   }
    285  1.1  oster   rf_mutex_destroy(&mapPtr->mutex);
    286  1.1  oster   RF_Free(mapPtr->status, mapPtr->totalRUs * sizeof(RF_ReconMapListElem_t *));
    287  1.1  oster   RF_Free(mapPtr, sizeof(RF_ReconMap_t));
    288  1.1  oster }
    289  1.1  oster 
    290  1.1  oster /*-----------------------------------------------------------------------------
    291  1.1  oster  *
    292  1.1  oster  * returns nonzero if the indicated RU has been reconstructed already
    293  1.1  oster  *
    294  1.1  oster  *---------------------------------------------------------------------------*/
    295  1.1  oster 
    296  1.1  oster int rf_CheckRUReconstructed(mapPtr, startSector)
    297  1.1  oster   RF_ReconMap_t   *mapPtr;
    298  1.1  oster   RF_SectorNum_t   startSector;
    299  1.1  oster {
    300  1.1  oster   RF_ReconMapListElem_t *l;		/* used for searching */
    301  1.1  oster   RF_ReconUnitNum_t i;
    302  1.1  oster 
    303  1.1  oster   i = startSector / mapPtr->sectorsPerReconUnit;
    304  1.1  oster   l = mapPtr->status[i];
    305  1.1  oster   return( (l == RU_ALL) ? 1 : 0 );
    306  1.1  oster }
    307  1.1  oster 
    308  1.1  oster RF_ReconUnitCount_t rf_UnitsLeftToReconstruct(mapPtr)
    309  1.1  oster   RF_ReconMap_t  *mapPtr;
    310  1.1  oster {
    311  1.1  oster   RF_ASSERT(mapPtr != NULL);
    312  1.1  oster   return( mapPtr->unitsLeft );
    313  1.1  oster }
    314  1.1  oster 
    315  1.1  oster /* updates the size fields of a status descriptor */
    316  1.1  oster static void update_size(mapPtr, size)
    317  1.1  oster   RF_ReconMap_t  *mapPtr;
    318  1.1  oster   int             size;
    319  1.1  oster {
    320  1.1  oster   mapPtr->size += size;
    321  1.1  oster   mapPtr->maxSize = RF_MAX(mapPtr->size, mapPtr->maxSize);
    322  1.1  oster }
    323  1.1  oster 
    324  1.1  oster static void PrintList(listPtr)
    325  1.1  oster   RF_ReconMapListElem_t  *listPtr;
    326  1.1  oster {
    327  1.1  oster   while (listPtr) {
    328  1.1  oster     printf("%d,%d -> ",(int)listPtr->startSector,(int)listPtr->stopSector);
    329  1.1  oster     listPtr = listPtr->next;
    330  1.1  oster   }
    331  1.1  oster   printf("\n");
    332  1.1  oster }
    333  1.1  oster 
    334  1.1  oster void rf_PrintReconMap(raidPtr, mapPtr, frow, fcol)
    335  1.1  oster   RF_Raid_t      *raidPtr;
    336  1.1  oster   RF_ReconMap_t  *mapPtr;
    337  1.1  oster   RF_RowCol_t     frow;
    338  1.1  oster   RF_RowCol_t     fcol;
    339  1.1  oster {
    340  1.1  oster   RF_ReconUnitCount_t numRUs;
    341  1.1  oster   RF_ReconMapListElem_t *p;
    342  1.1  oster   RF_ReconUnitNum_t i;
    343  1.1  oster 
    344  1.1  oster   numRUs = mapPtr->totalRUs;
    345  1.1  oster   if (mapPtr->sectorsInDisk % mapPtr->sectorsPerReconUnit)
    346  1.1  oster     numRUs++;
    347  1.1  oster 
    348  1.1  oster   for (i=0; i<numRUs; i++) {
    349  1.1  oster     p = mapPtr->status[i];
    350  1.1  oster     if (p==RU_ALL) /*printf("[%d] ALL\n",i)*/;
    351  1.1  oster     else if (p == RU_NOTHING) {
    352  1.1  oster       printf("%d: Unreconstructed\n",i);
    353  1.1  oster     } else {
    354  1.1  oster       printf("%d: ", i);
    355  1.1  oster       PrintList(p);
    356  1.1  oster     }
    357  1.1  oster   }
    358  1.1  oster }
    359  1.1  oster 
    360  1.1  oster void rf_PrintReconSchedule(mapPtr, starttime)
    361  1.1  oster   RF_ReconMap_t   *mapPtr;
    362  1.1  oster   struct timeval  *starttime;
    363  1.1  oster {
    364  1.1  oster   static int old_pctg = -1;
    365  1.1  oster   struct timeval tv, diff;
    366  1.1  oster   int new_pctg;
    367  1.1  oster 
    368  1.1  oster   new_pctg = 100 - (rf_UnitsLeftToReconstruct(mapPtr) * 100 / mapPtr->totalRUs);
    369  1.1  oster   if (new_pctg != old_pctg) {
    370  1.1  oster     RF_GETTIME(tv);
    371  1.1  oster     RF_TIMEVAL_DIFF(starttime, &tv, &diff);
    372  1.1  oster     printf("%d %d.%06d\n",(int)new_pctg, (int)diff.tv_sec, (int)diff.tv_usec);
    373  1.1  oster     old_pctg = new_pctg;
    374  1.1  oster   }
    375  1.1  oster }
    376