rf_reconutil.c revision 1.17 1 1.17 oster /* $NetBSD: rf_reconutil.c,v 1.17 2003/12/29 04:39:29 oster Exp $ */
2 1.1 oster /*
3 1.1 oster * Copyright (c) 1995 Carnegie-Mellon University.
4 1.1 oster * All rights reserved.
5 1.1 oster *
6 1.1 oster * Author: Mark Holland
7 1.1 oster *
8 1.1 oster * Permission to use, copy, modify and distribute this software and
9 1.1 oster * its documentation is hereby granted, provided that both the copyright
10 1.1 oster * notice and this permission notice appear in all copies of the
11 1.1 oster * software, derivative works or modified versions, and any portions
12 1.1 oster * thereof, and that both notices appear in supporting documentation.
13 1.1 oster *
14 1.1 oster * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
15 1.1 oster * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
16 1.1 oster * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
17 1.1 oster *
18 1.1 oster * Carnegie Mellon requests users of this software to return to
19 1.1 oster *
20 1.1 oster * Software Distribution Coordinator or Software.Distribution (at) CS.CMU.EDU
21 1.1 oster * School of Computer Science
22 1.1 oster * Carnegie Mellon University
23 1.1 oster * Pittsburgh PA 15213-3890
24 1.1 oster *
25 1.1 oster * any improvements or extensions that they make and grant Carnegie the
26 1.1 oster * rights to redistribute these changes.
27 1.1 oster */
28 1.1 oster
29 1.1 oster /********************************************
30 1.1 oster * rf_reconutil.c -- reconstruction utilities
31 1.1 oster ********************************************/
32 1.5 lukem
33 1.5 lukem #include <sys/cdefs.h>
34 1.17 oster __KERNEL_RCSID(0, "$NetBSD: rf_reconutil.c,v 1.17 2003/12/29 04:39:29 oster Exp $");
35 1.1 oster
36 1.4 oster #include <dev/raidframe/raidframevar.h>
37 1.4 oster
38 1.1 oster #include "rf_raid.h"
39 1.1 oster #include "rf_desc.h"
40 1.1 oster #include "rf_reconutil.h"
41 1.1 oster #include "rf_reconbuffer.h"
42 1.1 oster #include "rf_general.h"
43 1.1 oster #include "rf_decluster.h"
44 1.1 oster #include "rf_raid5_rotatedspare.h"
45 1.1 oster #include "rf_interdecluster.h"
46 1.1 oster #include "rf_chaindecluster.h"
47 1.1 oster
48 1.1 oster /*******************************************************************
49 1.1 oster * allocates/frees the reconstruction control information structures
50 1.1 oster *******************************************************************/
51 1.3 oster RF_ReconCtrl_t *
52 1.15 oster rf_MakeReconControl(reconDesc, fcol, scol)
53 1.3 oster RF_RaidReconDesc_t *reconDesc;
54 1.15 oster RF_RowCol_t fcol; /* failed column */
55 1.15 oster RF_RowCol_t scol; /* identifies which spare we're using */
56 1.1 oster {
57 1.3 oster RF_Raid_t *raidPtr = reconDesc->raidPtr;
58 1.3 oster RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
59 1.3 oster RF_ReconUnitCount_t RUsPerPU = layoutPtr->SUsPerPU / layoutPtr->SUsPerRU;
60 1.3 oster RF_ReconUnitCount_t numSpareRUs;
61 1.3 oster RF_ReconCtrl_t *reconCtrlPtr;
62 1.3 oster RF_ReconBuffer_t *rbuf;
63 1.14 jdolecek const RF_LayoutSW_t *lp;
64 1.12 oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
65 1.12 oster int retcode;
66 1.12 oster #endif
67 1.3 oster RF_RowCol_t i;
68 1.3 oster
69 1.3 oster lp = raidPtr->Layout.map;
70 1.3 oster
71 1.3 oster /* make and zero the global reconstruction structure and the per-disk
72 1.3 oster * structure */
73 1.16 oster RF_Malloc(reconCtrlPtr, sizeof(RF_ReconCtrl_t), (RF_ReconCtrl_t *));
74 1.11 oster
75 1.11 oster /* note: this zeros the perDiskInfo */
76 1.16 oster RF_Malloc(reconCtrlPtr->perDiskInfo, raidPtr->numCol *
77 1.11 oster sizeof(RF_PerDiskReconCtrl_t), (RF_PerDiskReconCtrl_t *));
78 1.3 oster reconCtrlPtr->reconDesc = reconDesc;
79 1.3 oster reconCtrlPtr->fcol = fcol;
80 1.3 oster reconCtrlPtr->spareCol = scol;
81 1.3 oster reconCtrlPtr->lastPSID = layoutPtr->numStripe / layoutPtr->SUsPerPU;
82 1.3 oster reconCtrlPtr->percentComplete = 0;
83 1.3 oster
84 1.3 oster /* initialize each per-disk recon information structure */
85 1.3 oster for (i = 0; i < raidPtr->numCol; i++) {
86 1.3 oster reconCtrlPtr->perDiskInfo[i].reconCtrl = reconCtrlPtr;
87 1.3 oster reconCtrlPtr->perDiskInfo[i].col = i;
88 1.11 oster /* make it appear as if we just finished an RU */
89 1.11 oster reconCtrlPtr->perDiskInfo[i].curPSID = -1;
90 1.3 oster reconCtrlPtr->perDiskInfo[i].ru_count = RUsPerPU - 1;
91 1.3 oster }
92 1.3 oster
93 1.3 oster /* Get the number of spare units per disk and the sparemap in case
94 1.3 oster * spare is distributed */
95 1.3 oster
96 1.3 oster if (lp->GetNumSpareRUs) {
97 1.3 oster numSpareRUs = lp->GetNumSpareRUs(raidPtr);
98 1.3 oster } else {
99 1.3 oster numSpareRUs = 0;
100 1.3 oster }
101 1.3 oster
102 1.12 oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
103 1.3 oster /*
104 1.3 oster * Not all distributed sparing archs need dynamic mappings
105 1.3 oster */
106 1.3 oster if (lp->InstallSpareTable) {
107 1.15 oster retcode = rf_InstallSpareTable(raidPtr, fcol);
108 1.3 oster if (retcode) {
109 1.3 oster RF_PANIC(); /* XXX fix this */
110 1.3 oster }
111 1.3 oster }
112 1.12 oster #endif
113 1.3 oster /* make the reconstruction map */
114 1.3 oster reconCtrlPtr->reconMap = rf_MakeReconMap(raidPtr, (int) (layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit),
115 1.3 oster raidPtr->sectorsPerDisk, numSpareRUs);
116 1.3 oster
117 1.3 oster /* make the per-disk reconstruction buffers */
118 1.3 oster for (i = 0; i < raidPtr->numCol; i++) {
119 1.15 oster reconCtrlPtr->perDiskInfo[i].rbuf = (i == fcol) ? NULL : rf_MakeReconBuffer(raidPtr, i, RF_RBUF_TYPE_EXCLUSIVE);
120 1.3 oster }
121 1.3 oster
122 1.3 oster /* initialize the event queue */
123 1.17 oster simple_lock_init(&reconCtrlPtr->eq_mutex);
124 1.17 oster
125 1.17 oster reconCtrlPtr->eq_cond = 0;
126 1.3 oster reconCtrlPtr->eventQueue = NULL;
127 1.3 oster reconCtrlPtr->eq_count = 0;
128 1.3 oster
129 1.3 oster /* make the floating recon buffers and append them to the free list */
130 1.17 oster simple_lock_init(&reconCtrlPtr->rb_mutex);
131 1.17 oster
132 1.3 oster reconCtrlPtr->fullBufferList = NULL;
133 1.3 oster reconCtrlPtr->floatingRbufs = NULL;
134 1.3 oster reconCtrlPtr->committedRbufs = NULL;
135 1.3 oster for (i = 0; i < raidPtr->numFloatingReconBufs; i++) {
136 1.15 oster rbuf = rf_MakeReconBuffer(raidPtr, fcol,
137 1.11 oster RF_RBUF_TYPE_FLOATING);
138 1.3 oster rbuf->next = reconCtrlPtr->floatingRbufs;
139 1.3 oster reconCtrlPtr->floatingRbufs = rbuf;
140 1.3 oster }
141 1.3 oster
142 1.3 oster /* create the parity stripe status table */
143 1.3 oster reconCtrlPtr->pssTable = rf_MakeParityStripeStatusTable(raidPtr);
144 1.3 oster
145 1.3 oster /* set the initial min head sep counter val */
146 1.3 oster reconCtrlPtr->minHeadSepCounter = 0;
147 1.3 oster
148 1.3 oster return (reconCtrlPtr);
149 1.1 oster }
150 1.1 oster
151 1.3 oster void
152 1.15 oster rf_FreeReconControl(raidPtr)
153 1.3 oster RF_Raid_t *raidPtr;
154 1.1 oster {
155 1.15 oster RF_ReconCtrl_t *reconCtrlPtr = raidPtr->reconControl;
156 1.3 oster RF_ReconBuffer_t *t;
157 1.3 oster RF_ReconUnitNum_t i;
158 1.3 oster
159 1.3 oster RF_ASSERT(reconCtrlPtr);
160 1.3 oster for (i = 0; i < raidPtr->numCol; i++)
161 1.3 oster if (reconCtrlPtr->perDiskInfo[i].rbuf)
162 1.3 oster rf_FreeReconBuffer(reconCtrlPtr->perDiskInfo[i].rbuf);
163 1.3 oster for (i = 0; i < raidPtr->numFloatingReconBufs; i++) {
164 1.3 oster t = reconCtrlPtr->floatingRbufs;
165 1.3 oster RF_ASSERT(t);
166 1.3 oster reconCtrlPtr->floatingRbufs = t->next;
167 1.3 oster rf_FreeReconBuffer(t);
168 1.3 oster }
169 1.3 oster rf_mutex_destroy(&reconCtrlPtr->rb_mutex);
170 1.3 oster rf_mutex_destroy(&reconCtrlPtr->eq_mutex);
171 1.3 oster rf_FreeReconMap(reconCtrlPtr->reconMap);
172 1.3 oster rf_FreeParityStripeStatusTable(raidPtr, reconCtrlPtr->pssTable);
173 1.11 oster RF_Free(reconCtrlPtr->perDiskInfo,
174 1.11 oster raidPtr->numCol * sizeof(RF_PerDiskReconCtrl_t));
175 1.3 oster RF_Free(reconCtrlPtr, sizeof(*reconCtrlPtr));
176 1.1 oster }
177 1.1 oster
178 1.1 oster
179 1.1 oster /******************************************************************************
180 1.1 oster * computes the default head separation limit
181 1.1 oster *****************************************************************************/
182 1.3 oster RF_HeadSepLimit_t
183 1.3 oster rf_GetDefaultHeadSepLimit(raidPtr)
184 1.3 oster RF_Raid_t *raidPtr;
185 1.1 oster {
186 1.3 oster RF_HeadSepLimit_t hsl;
187 1.14 jdolecek const RF_LayoutSW_t *lp;
188 1.1 oster
189 1.3 oster lp = raidPtr->Layout.map;
190 1.3 oster if (lp->GetDefaultHeadSepLimit == NULL)
191 1.3 oster return (-1);
192 1.3 oster hsl = lp->GetDefaultHeadSepLimit(raidPtr);
193 1.3 oster return (hsl);
194 1.1 oster }
195 1.1 oster
196 1.1 oster
197 1.1 oster /******************************************************************************
198 1.1 oster * computes the default number of floating recon buffers
199 1.1 oster *****************************************************************************/
200 1.3 oster int
201 1.3 oster rf_GetDefaultNumFloatingReconBuffers(raidPtr)
202 1.3 oster RF_Raid_t *raidPtr;
203 1.1 oster {
204 1.14 jdolecek const RF_LayoutSW_t *lp;
205 1.3 oster int nrb;
206 1.1 oster
207 1.3 oster lp = raidPtr->Layout.map;
208 1.3 oster if (lp->GetDefaultNumFloatingReconBuffers == NULL)
209 1.3 oster return (3 * raidPtr->numCol);
210 1.3 oster nrb = lp->GetDefaultNumFloatingReconBuffers(raidPtr);
211 1.3 oster return (nrb);
212 1.1 oster }
213 1.1 oster
214 1.1 oster
215 1.1 oster /******************************************************************************
216 1.1 oster * creates and initializes a reconstruction buffer
217 1.1 oster *****************************************************************************/
218 1.3 oster RF_ReconBuffer_t *
219 1.3 oster rf_MakeReconBuffer(
220 1.3 oster RF_Raid_t * raidPtr,
221 1.3 oster RF_RowCol_t col,
222 1.3 oster RF_RbufType_t type)
223 1.1 oster {
224 1.3 oster RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
225 1.3 oster RF_ReconBuffer_t *t;
226 1.3 oster u_int recon_buffer_size = rf_RaidAddressToByte(raidPtr, layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit);
227 1.3 oster
228 1.3 oster RF_Malloc(t, sizeof(RF_ReconBuffer_t), (RF_ReconBuffer_t *));
229 1.3 oster RF_Malloc(t->buffer, recon_buffer_size, (caddr_t));
230 1.3 oster t->raidPtr = raidPtr;
231 1.3 oster t->col = col;
232 1.3 oster t->priority = RF_IO_RECON_PRIORITY;
233 1.3 oster t->type = type;
234 1.3 oster t->pssPtr = NULL;
235 1.3 oster t->next = NULL;
236 1.3 oster return (t);
237 1.1 oster }
238 1.1 oster /******************************************************************************
239 1.1 oster * frees a reconstruction buffer
240 1.1 oster *****************************************************************************/
241 1.3 oster void
242 1.3 oster rf_FreeReconBuffer(rbuf)
243 1.3 oster RF_ReconBuffer_t *rbuf;
244 1.1 oster {
245 1.3 oster RF_Raid_t *raidPtr = rbuf->raidPtr;
246 1.9 oster u_int recon_buffer_size;
247 1.9 oster
248 1.9 oster recon_buffer_size = rf_RaidAddressToByte(raidPtr, raidPtr->Layout.SUsPerRU * raidPtr->Layout.sectorsPerStripeUnit);
249 1.3 oster
250 1.3 oster RF_Free(rbuf->buffer, recon_buffer_size);
251 1.3 oster RF_Free(rbuf, sizeof(*rbuf));
252 1.1 oster }
253 1.1 oster
#if RF_DEBUG_RECON
/*
 * Count the buffers of type RF_RBUF_TYPE_FLOATING on a singly linked
 * (->next) list of recon buffers.  An empty (NULL) list counts as zero.
 */
static int
rf_CountFloatingRbufsInList(const RF_ReconBuffer_t *rbuf)
{
	int count = 0;

	for (; rbuf != NULL; rbuf = rbuf->next) {
		if (rbuf->type == RF_RBUF_TYPE_FLOATING)
			count++;
	}
	return (count);
}

/******************************************************************************
 * debug only: sanity check the number of floating recon bufs in use
 *
 *	raidPtr	array whose reconControl is inspected
 *	dolock	non-zero: take reconControl->rb_mutex around the check
 *
 * Counts every floating buffer reachable from the parity stripe status
 * table (rbuf, writeRbuf and the rbufsForXor array of each entry) and
 * from the floatingRbufs, committedRbufs and fullBufferList lists, then
 * asserts that the total equals raidPtr->numFloatingReconBufs.
 *****************************************************************************/
void
rf_CheckFloatingRbufCount(RF_Raid_t *raidPtr, int dolock)
{
	RF_ReconParityStripeStatus_t *p;
	RF_PSStatusHeader_t *pssTable;
	RF_ReconBuffer_t *rbuf;
	int i, j, sum = 0;

	if (dolock)
		RF_LOCK_MUTEX(raidPtr->reconControl->rb_mutex);
	pssTable = raidPtr->reconControl->pssTable;

	/* buffers currently attached to parity stripe status entries; each
	 * table slot is walked under that slot's own mutex */
	for (i = 0; i < raidPtr->pssTableSize; i++) {
		RF_LOCK_MUTEX(pssTable[i].mutex);
		for (p = pssTable[i].chain; p; p = p->next) {
			rbuf = (RF_ReconBuffer_t *) p->rbuf;
			if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
				sum++;

			rbuf = (RF_ReconBuffer_t *) p->writeRbuf;
			if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
				sum++;

			/* the first xorBufCount slots must all be filled */
			for (j = 0; j < p->xorBufCount; j++) {
				rbuf = (RF_ReconBuffer_t *) p->rbufsForXor[j];
				RF_ASSERT(rbuf);
				if (rbuf->type == RF_RBUF_TYPE_FLOATING)
					sum++;
			}
		}
		RF_UNLOCK_MUTEX(pssTable[i].mutex);
	}

	/* buffers sitting on the three lists of the control structure */
	sum += rf_CountFloatingRbufsInList(raidPtr->reconControl->floatingRbufs);
	sum += rf_CountFloatingRbufsInList(raidPtr->reconControl->committedRbufs);
	sum += rf_CountFloatingRbufsInList(raidPtr->reconControl->fullBufferList);

	RF_ASSERT(sum == raidPtr->numFloatingReconBufs);

	if (dolock)
		RF_UNLOCK_MUTEX(raidPtr->reconControl->rb_mutex);
}
#endif
314 1.7 oster
315