rf_reconutil.c revision 1.24 1 1.24 oster /* $NetBSD: rf_reconutil.c,v 1.24 2005/02/05 23:32:44 oster Exp $ */
2 1.1 oster /*
3 1.1 oster * Copyright (c) 1995 Carnegie-Mellon University.
4 1.1 oster * All rights reserved.
5 1.1 oster *
6 1.1 oster * Author: Mark Holland
7 1.1 oster *
8 1.1 oster * Permission to use, copy, modify and distribute this software and
9 1.1 oster * its documentation is hereby granted, provided that both the copyright
10 1.1 oster * notice and this permission notice appear in all copies of the
11 1.1 oster * software, derivative works or modified versions, and any portions
12 1.1 oster * thereof, and that both notices appear in supporting documentation.
13 1.1 oster *
14 1.1 oster * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
15 1.1 oster * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
16 1.1 oster * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
17 1.1 oster *
18 1.1 oster * Carnegie Mellon requests users of this software to return to
19 1.1 oster *
20 1.1 oster * Software Distribution Coordinator or Software.Distribution (at) CS.CMU.EDU
21 1.1 oster * School of Computer Science
22 1.1 oster * Carnegie Mellon University
23 1.1 oster * Pittsburgh PA 15213-3890
24 1.1 oster *
25 1.1 oster * any improvements or extensions that they make and grant Carnegie the
26 1.1 oster * rights to redistribute these changes.
27 1.1 oster */
28 1.1 oster
29 1.1 oster /********************************************
30 1.1 oster * rf_reconutil.c -- reconstruction utilities
31 1.1 oster ********************************************/
32 1.5 lukem
33 1.5 lukem #include <sys/cdefs.h>
34 1.24 oster __KERNEL_RCSID(0, "$NetBSD: rf_reconutil.c,v 1.24 2005/02/05 23:32:44 oster Exp $");
35 1.1 oster
36 1.4 oster #include <dev/raidframe/raidframevar.h>
37 1.4 oster
38 1.1 oster #include "rf_raid.h"
39 1.1 oster #include "rf_desc.h"
40 1.1 oster #include "rf_reconutil.h"
41 1.1 oster #include "rf_reconbuffer.h"
42 1.1 oster #include "rf_general.h"
43 1.1 oster #include "rf_decluster.h"
44 1.1 oster #include "rf_raid5_rotatedspare.h"
45 1.1 oster #include "rf_interdecluster.h"
46 1.1 oster #include "rf_chaindecluster.h"
47 1.1 oster
48 1.1 oster /*******************************************************************
49 1.1 oster * allocates/frees the reconstruction control information structures
50 1.1 oster *******************************************************************/
51 1.19 oster
52 1.19 oster /* fcol - failed column
53 1.19 oster * scol - identifies which spare we are using
54 1.19 oster */
55 1.19 oster
56 1.3 oster RF_ReconCtrl_t *
57 1.19 oster rf_MakeReconControl(RF_RaidReconDesc_t *reconDesc,
58 1.19 oster RF_RowCol_t fcol, RF_RowCol_t scol)
59 1.1 oster {
60 1.3 oster RF_Raid_t *raidPtr = reconDesc->raidPtr;
61 1.3 oster RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
62 1.3 oster RF_ReconUnitCount_t RUsPerPU = layoutPtr->SUsPerPU / layoutPtr->SUsPerRU;
63 1.3 oster RF_ReconUnitCount_t numSpareRUs;
64 1.3 oster RF_ReconCtrl_t *reconCtrlPtr;
65 1.3 oster RF_ReconBuffer_t *rbuf;
66 1.14 jdolecek const RF_LayoutSW_t *lp;
67 1.12 oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
68 1.12 oster int retcode;
69 1.12 oster #endif
70 1.3 oster RF_RowCol_t i;
71 1.3 oster
72 1.3 oster lp = raidPtr->Layout.map;
73 1.3 oster
74 1.3 oster /* make and zero the global reconstruction structure and the per-disk
75 1.3 oster * structure */
76 1.16 oster RF_Malloc(reconCtrlPtr, sizeof(RF_ReconCtrl_t), (RF_ReconCtrl_t *));
77 1.11 oster
78 1.11 oster /* note: this zeros the perDiskInfo */
79 1.16 oster RF_Malloc(reconCtrlPtr->perDiskInfo, raidPtr->numCol *
80 1.11 oster sizeof(RF_PerDiskReconCtrl_t), (RF_PerDiskReconCtrl_t *));
81 1.3 oster reconCtrlPtr->reconDesc = reconDesc;
82 1.3 oster reconCtrlPtr->fcol = fcol;
83 1.3 oster reconCtrlPtr->spareCol = scol;
84 1.3 oster reconCtrlPtr->lastPSID = layoutPtr->numStripe / layoutPtr->SUsPerPU;
85 1.3 oster reconCtrlPtr->percentComplete = 0;
86 1.24 oster reconCtrlPtr->error = 0;
87 1.24 oster reconCtrlPtr->pending_writes = 0;
88 1.3 oster
89 1.3 oster /* initialize each per-disk recon information structure */
90 1.3 oster for (i = 0; i < raidPtr->numCol; i++) {
91 1.3 oster reconCtrlPtr->perDiskInfo[i].reconCtrl = reconCtrlPtr;
92 1.3 oster reconCtrlPtr->perDiskInfo[i].col = i;
93 1.11 oster /* make it appear as if we just finished an RU */
94 1.11 oster reconCtrlPtr->perDiskInfo[i].curPSID = -1;
95 1.3 oster reconCtrlPtr->perDiskInfo[i].ru_count = RUsPerPU - 1;
96 1.3 oster }
97 1.3 oster
98 1.3 oster /* Get the number of spare units per disk and the sparemap in case
99 1.3 oster * spare is distributed */
100 1.3 oster
101 1.3 oster if (lp->GetNumSpareRUs) {
102 1.3 oster numSpareRUs = lp->GetNumSpareRUs(raidPtr);
103 1.3 oster } else {
104 1.3 oster numSpareRUs = 0;
105 1.3 oster }
106 1.3 oster
107 1.12 oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
108 1.3 oster /*
109 1.3 oster * Not all distributed sparing archs need dynamic mappings
110 1.3 oster */
111 1.3 oster if (lp->InstallSpareTable) {
112 1.15 oster retcode = rf_InstallSpareTable(raidPtr, fcol);
113 1.3 oster if (retcode) {
114 1.3 oster RF_PANIC(); /* XXX fix this */
115 1.3 oster }
116 1.3 oster }
117 1.12 oster #endif
118 1.3 oster /* make the reconstruction map */
119 1.3 oster reconCtrlPtr->reconMap = rf_MakeReconMap(raidPtr, (int) (layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit),
120 1.3 oster raidPtr->sectorsPerDisk, numSpareRUs);
121 1.3 oster
122 1.3 oster /* make the per-disk reconstruction buffers */
123 1.3 oster for (i = 0; i < raidPtr->numCol; i++) {
124 1.15 oster reconCtrlPtr->perDiskInfo[i].rbuf = (i == fcol) ? NULL : rf_MakeReconBuffer(raidPtr, i, RF_RBUF_TYPE_EXCLUSIVE);
125 1.3 oster }
126 1.3 oster
127 1.3 oster /* initialize the event queue */
128 1.17 oster simple_lock_init(&reconCtrlPtr->eq_mutex);
129 1.17 oster
130 1.3 oster reconCtrlPtr->eventQueue = NULL;
131 1.3 oster reconCtrlPtr->eq_count = 0;
132 1.3 oster
133 1.3 oster /* make the floating recon buffers and append them to the free list */
134 1.17 oster simple_lock_init(&reconCtrlPtr->rb_mutex);
135 1.17 oster
136 1.3 oster reconCtrlPtr->fullBufferList = NULL;
137 1.3 oster reconCtrlPtr->floatingRbufs = NULL;
138 1.3 oster reconCtrlPtr->committedRbufs = NULL;
139 1.3 oster for (i = 0; i < raidPtr->numFloatingReconBufs; i++) {
140 1.15 oster rbuf = rf_MakeReconBuffer(raidPtr, fcol,
141 1.11 oster RF_RBUF_TYPE_FLOATING);
142 1.3 oster rbuf->next = reconCtrlPtr->floatingRbufs;
143 1.3 oster reconCtrlPtr->floatingRbufs = rbuf;
144 1.3 oster }
145 1.3 oster
146 1.3 oster /* create the parity stripe status table */
147 1.3 oster reconCtrlPtr->pssTable = rf_MakeParityStripeStatusTable(raidPtr);
148 1.3 oster
149 1.3 oster /* set the initial min head sep counter val */
150 1.3 oster reconCtrlPtr->minHeadSepCounter = 0;
151 1.3 oster
152 1.3 oster return (reconCtrlPtr);
153 1.1 oster }
154 1.1 oster
155 1.3 oster void
156 1.19 oster rf_FreeReconControl(RF_Raid_t *raidPtr)
157 1.1 oster {
158 1.15 oster RF_ReconCtrl_t *reconCtrlPtr = raidPtr->reconControl;
159 1.3 oster RF_ReconBuffer_t *t;
160 1.3 oster RF_ReconUnitNum_t i;
161 1.3 oster
162 1.3 oster RF_ASSERT(reconCtrlPtr);
163 1.3 oster for (i = 0; i < raidPtr->numCol; i++)
164 1.3 oster if (reconCtrlPtr->perDiskInfo[i].rbuf)
165 1.3 oster rf_FreeReconBuffer(reconCtrlPtr->perDiskInfo[i].rbuf);
166 1.24 oster
167 1.24 oster t = reconCtrlPtr->floatingRbufs;
168 1.24 oster while (t) {
169 1.3 oster reconCtrlPtr->floatingRbufs = t->next;
170 1.3 oster rf_FreeReconBuffer(t);
171 1.24 oster t = reconCtrlPtr->floatingRbufs;
172 1.3 oster }
173 1.24 oster
174 1.3 oster rf_FreeReconMap(reconCtrlPtr->reconMap);
175 1.3 oster rf_FreeParityStripeStatusTable(raidPtr, reconCtrlPtr->pssTable);
176 1.11 oster RF_Free(reconCtrlPtr->perDiskInfo,
177 1.11 oster raidPtr->numCol * sizeof(RF_PerDiskReconCtrl_t));
178 1.3 oster RF_Free(reconCtrlPtr, sizeof(*reconCtrlPtr));
179 1.1 oster }
180 1.1 oster
181 1.1 oster
182 1.1 oster /******************************************************************************
183 1.1 oster * computes the default head separation limit
184 1.1 oster *****************************************************************************/
185 1.3 oster RF_HeadSepLimit_t
186 1.19 oster rf_GetDefaultHeadSepLimit(RF_Raid_t *raidPtr)
187 1.1 oster {
188 1.3 oster RF_HeadSepLimit_t hsl;
189 1.14 jdolecek const RF_LayoutSW_t *lp;
190 1.1 oster
191 1.3 oster lp = raidPtr->Layout.map;
192 1.3 oster if (lp->GetDefaultHeadSepLimit == NULL)
193 1.3 oster return (-1);
194 1.3 oster hsl = lp->GetDefaultHeadSepLimit(raidPtr);
195 1.3 oster return (hsl);
196 1.1 oster }
197 1.1 oster
198 1.1 oster
199 1.1 oster /******************************************************************************
200 1.1 oster * computes the default number of floating recon buffers
201 1.1 oster *****************************************************************************/
202 1.3 oster int
203 1.19 oster rf_GetDefaultNumFloatingReconBuffers(RF_Raid_t *raidPtr)
204 1.1 oster {
205 1.14 jdolecek const RF_LayoutSW_t *lp;
206 1.3 oster int nrb;
207 1.1 oster
208 1.3 oster lp = raidPtr->Layout.map;
209 1.3 oster if (lp->GetDefaultNumFloatingReconBuffers == NULL)
210 1.3 oster return (3 * raidPtr->numCol);
211 1.3 oster nrb = lp->GetDefaultNumFloatingReconBuffers(raidPtr);
212 1.3 oster return (nrb);
213 1.1 oster }
214 1.1 oster
215 1.1 oster
216 1.1 oster /******************************************************************************
217 1.1 oster * creates and initializes a reconstruction buffer
218 1.1 oster *****************************************************************************/
219 1.3 oster RF_ReconBuffer_t *
220 1.19 oster rf_MakeReconBuffer(RF_Raid_t *raidPtr, RF_RowCol_t col, RF_RbufType_t type)
221 1.1 oster {
222 1.3 oster RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
223 1.3 oster RF_ReconBuffer_t *t;
224 1.3 oster u_int recon_buffer_size = rf_RaidAddressToByte(raidPtr, layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit);
225 1.3 oster
226 1.22 oster t = pool_get(&rf_pools.reconbuffer, PR_WAITOK);
227 1.3 oster RF_Malloc(t->buffer, recon_buffer_size, (caddr_t));
228 1.3 oster t->raidPtr = raidPtr;
229 1.3 oster t->col = col;
230 1.3 oster t->priority = RF_IO_RECON_PRIORITY;
231 1.3 oster t->type = type;
232 1.3 oster t->pssPtr = NULL;
233 1.3 oster t->next = NULL;
234 1.3 oster return (t);
235 1.1 oster }
236 1.1 oster /******************************************************************************
237 1.1 oster * frees a reconstruction buffer
238 1.1 oster *****************************************************************************/
239 1.3 oster void
240 1.19 oster rf_FreeReconBuffer(RF_ReconBuffer_t *rbuf)
241 1.1 oster {
242 1.3 oster RF_Raid_t *raidPtr = rbuf->raidPtr;
243 1.9 oster u_int recon_buffer_size;
244 1.9 oster
245 1.9 oster recon_buffer_size = rf_RaidAddressToByte(raidPtr, raidPtr->Layout.SUsPerRU * raidPtr->Layout.sectorsPerStripeUnit);
246 1.3 oster
247 1.3 oster RF_Free(rbuf->buffer, recon_buffer_size);
248 1.22 oster pool_put(&rf_pools.reconbuffer, rbuf);
249 1.1 oster }
250 1.1 oster
251 1.10 oster #if RF_DEBUG_RECON
252 1.23 oster XXXX IF you use this, you really want to fix the locking in here.
253 1.1 oster /******************************************************************************
254 1.1 oster * debug only: sanity check the number of floating recon bufs in use
255 1.1 oster *****************************************************************************/
256 1.3 oster void
257 1.19 oster rf_CheckFloatingRbufCount(RF_Raid_t *raidPtr, int dolock)
258 1.1 oster {
259 1.3 oster RF_ReconParityStripeStatus_t *p;
260 1.3 oster RF_PSStatusHeader_t *pssTable;
261 1.3 oster RF_ReconBuffer_t *rbuf;
262 1.3 oster int i, j, sum = 0;
263 1.3 oster
264 1.3 oster if (dolock)
265 1.15 oster RF_LOCK_MUTEX(raidPtr->reconControl->rb_mutex);
266 1.15 oster pssTable = raidPtr->reconControl->pssTable;
267 1.3 oster
268 1.3 oster for (i = 0; i < raidPtr->pssTableSize; i++) {
269 1.3 oster RF_LOCK_MUTEX(pssTable[i].mutex);
270 1.3 oster for (p = pssTable[i].chain; p; p = p->next) {
271 1.3 oster rbuf = (RF_ReconBuffer_t *) p->rbuf;
272 1.3 oster if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
273 1.3 oster sum++;
274 1.3 oster
275 1.3 oster rbuf = (RF_ReconBuffer_t *) p->writeRbuf;
276 1.3 oster if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
277 1.3 oster sum++;
278 1.3 oster
279 1.3 oster for (j = 0; j < p->xorBufCount; j++) {
280 1.3 oster rbuf = (RF_ReconBuffer_t *) p->rbufsForXor[j];
281 1.3 oster RF_ASSERT(rbuf);
282 1.3 oster if (rbuf->type == RF_RBUF_TYPE_FLOATING)
283 1.3 oster sum++;
284 1.3 oster }
285 1.3 oster }
286 1.3 oster RF_UNLOCK_MUTEX(pssTable[i].mutex);
287 1.3 oster }
288 1.3 oster
289 1.15 oster for (rbuf = raidPtr->reconControl->floatingRbufs; rbuf;
290 1.11 oster rbuf = rbuf->next) {
291 1.3 oster if (rbuf->type == RF_RBUF_TYPE_FLOATING)
292 1.3 oster sum++;
293 1.3 oster }
294 1.15 oster for (rbuf = raidPtr->reconControl->committedRbufs; rbuf;
295 1.11 oster rbuf = rbuf->next) {
296 1.3 oster if (rbuf->type == RF_RBUF_TYPE_FLOATING)
297 1.3 oster sum++;
298 1.3 oster }
299 1.15 oster for (rbuf = raidPtr->reconControl->fullBufferList; rbuf;
300 1.11 oster rbuf = rbuf->next) {
301 1.3 oster if (rbuf->type == RF_RBUF_TYPE_FLOATING)
302 1.3 oster sum++;
303 1.3 oster }
304 1.3 oster RF_ASSERT(sum == raidPtr->numFloatingReconBufs);
305 1.1 oster
306 1.3 oster if (dolock)
307 1.15 oster RF_UNLOCK_MUTEX(raidPtr->reconControl->rb_mutex);
308 1.1 oster }
309 1.7 oster #endif
310 1.7 oster
311