rf_layout.h revision 1.5 1 /* $NetBSD: rf_layout.h,v 1.5 2001/01/26 04:14:14 oster Exp $ */
2 /*
3 * Copyright (c) 1995 Carnegie-Mellon University.
4 * All rights reserved.
5 *
6 * Author: Mark Holland
7 *
8 * Permission to use, copy, modify and distribute this software and
9 * its documentation is hereby granted, provided that both the copyright
10 * notice and this permission notice appear in all copies of the
11 * software, derivative works or modified versions, and any portions
12 * thereof, and that both notices appear in supporting documentation.
13 *
14 * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
15 * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
16 * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
17 *
18 * Carnegie Mellon requests users of this software to return to
19 *
20 * Software Distribution Coordinator or Software.Distribution (at) CS.CMU.EDU
21 * School of Computer Science
22 * Carnegie Mellon University
23 * Pittsburgh PA 15213-3890
24 *
25 * any improvements or extensions that they make and grant Carnegie the
26 * rights to redistribute these changes.
27 */
28
29 /* rf_layout.h -- header file defining layout data structures
30 */
31
32 #ifndef _RF__RF_LAYOUT_H_
33 #define _RF__RF_LAYOUT_H_
34
35 #include "rf_types.h"
36 #include "rf_archs.h"
37 #include "rf_alloclist.h"
38
39 #ifndef _KERNEL
40 #include <stdio.h>
41 #endif
42
43 /*****************************************************************************************
44 *
45 * This structure identifies all layout-specific operations and parameters.
46 *
47 ****************************************************************************************/
48
49 typedef struct RF_LayoutSW_s {
50 RF_ParityConfig_t parityConfig;
51 const char *configName;
52
53 #ifndef _KERNEL
54 /* layout-specific parsing */
55 int (*MakeLayoutSpecific) (FILE * fp, RF_Config_t * cfgPtr, void *arg);
56 void *makeLayoutSpecificArg;
57 #endif /* !KERNEL */
58
59 #if RF_UTILITY == 0
60 /* initialization routine */
61 int (*Configure) (RF_ShutdownList_t ** shutdownListp, RF_Raid_t * raidPtr, RF_Config_t * cfgPtr);
62
63 /* routine to map RAID sector address -> physical (row, col, offset) */
64 void (*MapSector) (RF_Raid_t * raidPtr, RF_RaidAddr_t raidSector,
65 RF_RowCol_t * row, RF_RowCol_t * col, RF_SectorNum_t * diskSector, int remap);
66
67 /* routine to map RAID sector address -> physical (r,c,o) of parity
68 * unit */
69 void (*MapParity) (RF_Raid_t * raidPtr, RF_RaidAddr_t raidSector,
70 RF_RowCol_t * row, RF_RowCol_t * col, RF_SectorNum_t * diskSector, int remap);
71
72 /* routine to map RAID sector address -> physical (r,c,o) of Q unit */
73 void (*MapQ) (RF_Raid_t * raidPtr, RF_RaidAddr_t raidSector, RF_RowCol_t * row,
74 RF_RowCol_t * col, RF_SectorNum_t * diskSector, int remap);
75
76 /* routine to identify the disks comprising a stripe */
77 void (*IdentifyStripe) (RF_Raid_t * raidPtr, RF_RaidAddr_t addr,
78 RF_RowCol_t ** diskids, RF_RowCol_t * outRow);
79
80 /* routine to select a dag */
81 void (*SelectionFunc) (RF_Raid_t * raidPtr, RF_IoType_t type,
82 RF_AccessStripeMap_t * asmap,
83 RF_VoidFuncPtr *);
84 #if 0
85 void (**createFunc) (RF_Raid_t *,
86 RF_AccessStripeMap_t *,
87 RF_DagHeader_t *, void *,
88 RF_RaidAccessFlags_t,
89 RF_AllocListElem_t *);
90
91 #endif
92
93 /* map a stripe ID to a parity stripe ID. This is typically the
94 * identity mapping */
95 void (*MapSIDToPSID) (RF_RaidLayout_t * layoutPtr, RF_StripeNum_t stripeID,
96 RF_StripeNum_t * psID, RF_ReconUnitNum_t * which_ru);
97
98 /* get default head separation limit (may be NULL) */
99 RF_HeadSepLimit_t(*GetDefaultHeadSepLimit) (RF_Raid_t * raidPtr);
100
101 /* get default num recon buffers (may be NULL) */
102 int (*GetDefaultNumFloatingReconBuffers) (RF_Raid_t * raidPtr);
103
104 /* get number of spare recon units (may be NULL) */
105 RF_ReconUnitCount_t(*GetNumSpareRUs) (RF_Raid_t * raidPtr);
106
107 /* spare table installation (may be NULL) */
108 int (*InstallSpareTable) (RF_Raid_t * raidPtr, RF_RowCol_t frow, RF_RowCol_t fcol);
109
110 /* recon buffer submission function */
111 int (*SubmitReconBuffer) (RF_ReconBuffer_t * rbuf, int keep_it,
112 int use_committed);
113
114 /*
115 * verify that parity information for a stripe is correct
116 * see rf_parityscan.h for return vals
117 */
118 int (*VerifyParity) (RF_Raid_t * raidPtr, RF_RaidAddr_t raidAddr,
119 RF_PhysDiskAddr_t * parityPDA, int correct_it, RF_RaidAccessFlags_t flags);
120
121 /* number of faults tolerated by this mapping */
122 int faultsTolerated;
123
124 /* states to step through in an access. Must end with "LastState". The
125 * default is DefaultStates in rf_layout.c */
126 RF_AccessState_t *states;
127
128 RF_AccessStripeMapFlags_t flags;
129 #endif /* RF_UTILITY == 0 */
130 } RF_LayoutSW_t;
131 /* enables remapping to spare location under dist sparing */
132 #define RF_REMAP 1
133 #define RF_DONT_REMAP 0
134
135 /*
136 * Flags values for RF_AccessStripeMapFlags_t
137 */
138 #define RF_NO_STRIPE_LOCKS 0x0001 /* suppress stripe locks */
139 #define RF_DISTRIBUTE_SPARE 0x0002 /* distribute spare space in archs
140 * that support it */
141 #define RF_BD_DECLUSTERED 0x0004 /* declustering uses block designs */
142
143 /*************************************************************************
144 *
145 * this structure forms the layout component of the main Raid
146 * structure. It describes everything needed to define and perform
147 * the mapping of logical RAID addresses <-> physical disk addresses.
148 *
149 *************************************************************************/
150 struct RF_RaidLayout_s {
151 /* configuration parameters */
152 RF_SectorCount_t sectorsPerStripeUnit; /* number of sectors in one
153 * stripe unit */
154 RF_StripeCount_t SUsPerPU; /* stripe units per parity unit */
155 RF_StripeCount_t SUsPerRU; /* stripe units per reconstruction
156 * unit */
157
158 /* redundant-but-useful info computed from the above, used in all
159 * layouts */
160 RF_StripeCount_t numStripe; /* total number of stripes in the
161 * array */
162 RF_SectorCount_t dataSectorsPerStripe;
163 RF_StripeCount_t dataStripeUnitsPerDisk;
164 u_int bytesPerStripeUnit;
165 u_int dataBytesPerStripe;
166 RF_StripeCount_t numDataCol; /* number of SUs of data per stripe
167 * (name here is a la RAID4) */
168 RF_StripeCount_t numParityCol; /* number of SUs of parity per stripe.
169 * Always 1 for now */
170 RF_StripeCount_t numParityLogCol; /* number of SUs of parity log
171 * per stripe. Always 1 for
172 * now */
173 RF_StripeCount_t stripeUnitsPerDisk;
174
175 RF_LayoutSW_t *map; /* ptr to struct holding mapping fns and
176 * information */
177 void *layoutSpecificInfo; /* ptr to a structure holding
178 * layout-specific params */
179 };
180 /*****************************************************************************************
181 *
182 * The mapping code returns a pointer to a list of AccessStripeMap structures, which
183 * describes all the mapping information about an access. The list contains one
184 * AccessStripeMap structure per stripe touched by the access. Each element in the list
185 * contains a stripe identifier and a pointer to a list of PhysDiskAddr structuress. Each
186 * element in this latter list describes the physical location of a stripe unit accessed
187 * within the corresponding stripe.
188 *
189 ****************************************************************************************/
190
191 #define RF_PDA_TYPE_DATA 0
192 #define RF_PDA_TYPE_PARITY 1
193 #define RF_PDA_TYPE_Q 2
194
195 struct RF_PhysDiskAddr_s {
196 RF_RowCol_t row, col; /* disk identifier */
197 RF_SectorNum_t startSector; /* sector offset into the disk */
198 RF_SectorCount_t numSector; /* number of sectors accessed */
199 int type; /* used by higher levels: currently, data,
200 * parity, or q */
201 caddr_t bufPtr; /* pointer to buffer supplying/receiving data */
202 RF_RaidAddr_t raidAddress; /* raid address corresponding to this
203 * physical disk address */
204 RF_PhysDiskAddr_t *next;
205 };
206 #define RF_MAX_FAILED_PDA RF_MAXCOL
207
208 struct RF_AccessStripeMap_s {
209 RF_StripeNum_t stripeID;/* the stripe index */
210 RF_RaidAddr_t raidAddress; /* the starting raid address within
211 * this stripe */
212 RF_RaidAddr_t endRaidAddress; /* raid address one sector past the
213 * end of the access */
214 RF_SectorCount_t totalSectorsAccessed; /* total num sectors
215 * identified in physInfo list */
216 RF_StripeCount_t numStripeUnitsAccessed; /* total num elements in
217 * physInfo list */
218 int numDataFailed; /* number of failed data disks accessed */
219 int numParityFailed;/* number of failed parity disks accessed (0
220 * or 1) */
221 int numQFailed; /* number of failed Q units accessed (0 or 1) */
222 RF_AccessStripeMapFlags_t flags; /* various flags */
223 #if 0
224 RF_PhysDiskAddr_t *failedPDA; /* points to the PDA that has failed */
225 RF_PhysDiskAddr_t *failedPDAtwo; /* points to the second PDA
226 * that has failed, if any */
227 #else
228 int numFailedPDAs; /* number of failed phys addrs */
229 RF_PhysDiskAddr_t *failedPDAs[RF_MAX_FAILED_PDA]; /* array of failed phys
230 * addrs */
231 #endif
232 RF_PhysDiskAddr_t *physInfo; /* a list of PhysDiskAddr structs */
233 RF_PhysDiskAddr_t *parityInfo; /* list of physical addrs for the
234 * parity (P of P + Q ) */
235 RF_PhysDiskAddr_t *qInfo; /* list of physical addrs for the Q of
236 * P + Q */
237 RF_LockReqDesc_t lockReqDesc; /* used for stripe locking */
238 RF_RowCol_t origRow; /* the original row: we may redirect the acc
239 * to a different row */
240 RF_AccessStripeMap_t *next;
241 };
242 /* flag values */
243 #define RF_ASM_REDIR_LARGE_WRITE 0x00000001 /* allows large-write creation
244 * code to redirect failed
245 * accs */
246 #define RF_ASM_BAILOUT_DAG_USED 0x00000002 /* allows us to detect
247 * recursive calls to the
248 * bailout write dag */
249 #define RF_ASM_FLAGS_LOCK_TRIED 0x00000004 /* we've acquired the lock on
250 * the first parity range in
251 * this parity stripe */
252 #define RF_ASM_FLAGS_LOCK_TRIED2 0x00000008 /* we've acquired the lock on
253 * the 2nd parity range in
254 * this parity stripe */
255 #define RF_ASM_FLAGS_FORCE_TRIED 0x00000010 /* we've done the force-recon
256 * call on this parity stripe */
257 #define RF_ASM_FLAGS_RECON_BLOCKED 0x00000020 /* we blocked recon => we must
258 * unblock it later */
259
260 struct RF_AccessStripeMapHeader_s {
261 RF_StripeCount_t numStripes; /* total number of stripes touched by
262 * this acc */
263 RF_AccessStripeMap_t *stripeMap; /* pointer to the actual map.
264 * Also used for making lists */
265 RF_AccessStripeMapHeader_t *next;
266 };
267 /*****************************************************************************************
268 *
269 * various routines mapping addresses in the RAID address space. These work across
270 * all layouts. DON'T PUT ANY LAYOUT-SPECIFIC CODE HERE.
271 *
272 ****************************************************************************************/
273
274 /* return the identifier of the stripe containing the given address */
275 #define rf_RaidAddressToStripeID(_layoutPtr_, _addr_) \
276 ( ((_addr_) / (_layoutPtr_)->sectorsPerStripeUnit) / (_layoutPtr_)->numDataCol )
277
278 /* return the raid address of the start of the indicates stripe ID */
279 #define rf_StripeIDToRaidAddress(_layoutPtr_, _sid_) \
280 ( ((_sid_) * (_layoutPtr_)->sectorsPerStripeUnit) * (_layoutPtr_)->numDataCol )
281
282 /* return the identifier of the stripe containing the given stripe unit id */
283 #define rf_StripeUnitIDToStripeID(_layoutPtr_, _addr_) \
284 ( (_addr_) / (_layoutPtr_)->numDataCol )
285
286 /* return the identifier of the stripe unit containing the given address */
287 #define rf_RaidAddressToStripeUnitID(_layoutPtr_, _addr_) \
288 ( ((_addr_) / (_layoutPtr_)->sectorsPerStripeUnit) )
289
290 /* return the RAID address of next stripe boundary beyond the given address */
291 #define rf_RaidAddressOfNextStripeBoundary(_layoutPtr_, _addr_) \
292 ( (((_addr_)/(_layoutPtr_)->dataSectorsPerStripe)+1) * (_layoutPtr_)->dataSectorsPerStripe )
293
294 /* return the RAID address of the start of the stripe containing the given address */
295 #define rf_RaidAddressOfPrevStripeBoundary(_layoutPtr_, _addr_) \
296 ( (((_addr_)/(_layoutPtr_)->dataSectorsPerStripe)+0) * (_layoutPtr_)->dataSectorsPerStripe )
297
298 /* return the RAID address of next stripe unit boundary beyond the given address */
299 #define rf_RaidAddressOfNextStripeUnitBoundary(_layoutPtr_, _addr_) \
300 ( (((_addr_)/(_layoutPtr_)->sectorsPerStripeUnit)+1L)*(_layoutPtr_)->sectorsPerStripeUnit )
301
302 /* return the RAID address of the start of the stripe unit containing RAID address _addr_ */
303 #define rf_RaidAddressOfPrevStripeUnitBoundary(_layoutPtr_, _addr_) \
304 ( (((_addr_)/(_layoutPtr_)->sectorsPerStripeUnit)+0)*(_layoutPtr_)->sectorsPerStripeUnit )
305
306 /* returns the offset into the stripe. used by RaidAddressStripeAligned */
307 #define rf_RaidAddressStripeOffset(_layoutPtr_, _addr_) \
308 ( (_addr_) % ((_layoutPtr_)->dataSectorsPerStripe) )
309
310 /* returns the offset into the stripe unit. */
311 #define rf_StripeUnitOffset(_layoutPtr_, _addr_) \
312 ( (_addr_) % ((_layoutPtr_)->sectorsPerStripeUnit) )
313
314 /* returns nonzero if the given RAID address is stripe-aligned */
315 #define rf_RaidAddressStripeAligned( __layoutPtr__, __addr__ ) \
316 ( rf_RaidAddressStripeOffset(__layoutPtr__, __addr__) == 0 )
317
318 /* returns nonzero if the given address is stripe-unit aligned */
319 #define rf_StripeUnitAligned( __layoutPtr__, __addr__ ) \
320 ( rf_StripeUnitOffset(__layoutPtr__, __addr__) == 0 )
321
322 /* convert an address expressed in RAID blocks to/from an addr expressed in bytes */
323 #define rf_RaidAddressToByte(_raidPtr_, _addr_) \
324 ( (_addr_) << ( (_raidPtr_)->logBytesPerSector ) )
325
326 #define rf_ByteToRaidAddress(_raidPtr_, _addr_) \
327 ( (_addr_) >> ( (_raidPtr_)->logBytesPerSector ) )
328
329 /* convert a raid address to/from a parity stripe ID. Conversion to raid address is easy,
330 * since we're asking for the address of the first sector in the parity stripe. Conversion to a
331 * parity stripe ID is more complex, since stripes are not contiguously allocated in
332 * parity stripes.
333 */
334 #define rf_RaidAddressToParityStripeID(_layoutPtr_, _addr_, _ru_num_) \
335 rf_MapStripeIDToParityStripeID( (_layoutPtr_), rf_RaidAddressToStripeID( (_layoutPtr_), (_addr_) ), (_ru_num_) )
336
337 #define rf_ParityStripeIDToRaidAddress(_layoutPtr_, _psid_) \
338 ( (_psid_) * (_layoutPtr_)->SUsPerPU * (_layoutPtr_)->numDataCol * (_layoutPtr_)->sectorsPerStripeUnit )
339
340 RF_LayoutSW_t *rf_GetLayout(RF_ParityConfig_t parityConfig);
341 int
342 rf_ConfigureLayout(RF_ShutdownList_t ** listp, RF_Raid_t * raidPtr,
343 RF_Config_t * cfgPtr);
344 RF_StripeNum_t
345 rf_MapStripeIDToParityStripeID(RF_RaidLayout_t * layoutPtr,
346 RF_StripeNum_t stripeID, RF_ReconUnitNum_t * which_ru);
347
348 #endif /* !_RF__RF_LAYOUT_H_ */
349