rf_reconutil.c revision 1.32 1 1.32 mrg /* $NetBSD: rf_reconutil.c,v 1.32 2011/05/02 01:07:24 mrg Exp $ */
2 1.1 oster /*
3 1.1 oster * Copyright (c) 1995 Carnegie-Mellon University.
4 1.1 oster * All rights reserved.
5 1.1 oster *
6 1.1 oster * Author: Mark Holland
7 1.1 oster *
8 1.1 oster * Permission to use, copy, modify and distribute this software and
9 1.1 oster * its documentation is hereby granted, provided that both the copyright
10 1.1 oster * notice and this permission notice appear in all copies of the
11 1.1 oster * software, derivative works or modified versions, and any portions
12 1.1 oster * thereof, and that both notices appear in supporting documentation.
13 1.1 oster *
14 1.1 oster * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
15 1.1 oster * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
16 1.1 oster * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
17 1.1 oster *
18 1.1 oster * Carnegie Mellon requests users of this software to return to
19 1.1 oster *
20 1.1 oster * Software Distribution Coordinator or Software.Distribution (at) CS.CMU.EDU
21 1.1 oster * School of Computer Science
22 1.1 oster * Carnegie Mellon University
23 1.1 oster * Pittsburgh PA 15213-3890
24 1.1 oster *
25 1.1 oster * any improvements or extensions that they make and grant Carnegie the
26 1.1 oster * rights to redistribute these changes.
27 1.1 oster */
28 1.1 oster
29 1.1 oster /********************************************
30 1.1 oster * rf_reconutil.c -- reconstruction utilities
31 1.1 oster ********************************************/
32 1.5 lukem
33 1.5 lukem #include <sys/cdefs.h>
34 1.32 mrg __KERNEL_RCSID(0, "$NetBSD: rf_reconutil.c,v 1.32 2011/05/02 01:07:24 mrg Exp $");
35 1.1 oster
36 1.4 oster #include <dev/raidframe/raidframevar.h>
37 1.4 oster
38 1.1 oster #include "rf_raid.h"
39 1.1 oster #include "rf_desc.h"
40 1.1 oster #include "rf_reconutil.h"
41 1.1 oster #include "rf_reconbuffer.h"
42 1.1 oster #include "rf_general.h"
43 1.1 oster #include "rf_decluster.h"
44 1.1 oster #include "rf_raid5_rotatedspare.h"
45 1.1 oster #include "rf_interdecluster.h"
46 1.1 oster #include "rf_chaindecluster.h"
47 1.1 oster
48 1.1 oster /*******************************************************************
49 1.1 oster * allocates/frees the reconstruction control information structures
50 1.1 oster *******************************************************************/
51 1.19 oster
52 1.19 oster /* fcol - failed column
53 1.19 oster * scol - identifies which spare we are using
54 1.19 oster */
55 1.19 oster
56 1.3 oster RF_ReconCtrl_t *
57 1.25 perry rf_MakeReconControl(RF_RaidReconDesc_t *reconDesc,
58 1.19 oster RF_RowCol_t fcol, RF_RowCol_t scol)
59 1.1 oster {
60 1.3 oster RF_Raid_t *raidPtr = reconDesc->raidPtr;
61 1.3 oster RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
62 1.3 oster RF_ReconUnitCount_t RUsPerPU = layoutPtr->SUsPerPU / layoutPtr->SUsPerRU;
63 1.3 oster RF_ReconUnitCount_t numSpareRUs;
64 1.3 oster RF_ReconCtrl_t *reconCtrlPtr;
65 1.3 oster RF_ReconBuffer_t *rbuf;
66 1.14 jdolecek const RF_LayoutSW_t *lp;
67 1.12 oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
68 1.12 oster int retcode;
69 1.12 oster #endif
70 1.3 oster RF_RowCol_t i;
71 1.3 oster
72 1.3 oster lp = raidPtr->Layout.map;
73 1.3 oster
74 1.3 oster /* make and zero the global reconstruction structure and the per-disk
75 1.3 oster * structure */
76 1.16 oster RF_Malloc(reconCtrlPtr, sizeof(RF_ReconCtrl_t), (RF_ReconCtrl_t *));
77 1.11 oster
78 1.11 oster /* note: this zeros the perDiskInfo */
79 1.16 oster RF_Malloc(reconCtrlPtr->perDiskInfo, raidPtr->numCol *
80 1.11 oster sizeof(RF_PerDiskReconCtrl_t), (RF_PerDiskReconCtrl_t *));
81 1.3 oster reconCtrlPtr->reconDesc = reconDesc;
82 1.3 oster reconCtrlPtr->fcol = fcol;
83 1.3 oster reconCtrlPtr->spareCol = scol;
84 1.3 oster reconCtrlPtr->lastPSID = layoutPtr->numStripe / layoutPtr->SUsPerPU;
85 1.3 oster reconCtrlPtr->percentComplete = 0;
86 1.24 oster reconCtrlPtr->error = 0;
87 1.24 oster reconCtrlPtr->pending_writes = 0;
88 1.3 oster
89 1.3 oster /* initialize each per-disk recon information structure */
90 1.3 oster for (i = 0; i < raidPtr->numCol; i++) {
91 1.3 oster reconCtrlPtr->perDiskInfo[i].reconCtrl = reconCtrlPtr;
92 1.3 oster reconCtrlPtr->perDiskInfo[i].col = i;
93 1.11 oster /* make it appear as if we just finished an RU */
94 1.25 perry reconCtrlPtr->perDiskInfo[i].curPSID = -1;
95 1.3 oster reconCtrlPtr->perDiskInfo[i].ru_count = RUsPerPU - 1;
96 1.3 oster }
97 1.3 oster
98 1.3 oster /* Get the number of spare units per disk and the sparemap in case
99 1.3 oster * spare is distributed */
100 1.3 oster
101 1.3 oster if (lp->GetNumSpareRUs) {
102 1.3 oster numSpareRUs = lp->GetNumSpareRUs(raidPtr);
103 1.3 oster } else {
104 1.3 oster numSpareRUs = 0;
105 1.3 oster }
106 1.3 oster
107 1.12 oster #if (RF_INCLUDE_PARITY_DECLUSTERING_DS > 0)
108 1.3 oster /*
109 1.3 oster * Not all distributed sparing archs need dynamic mappings
110 1.3 oster */
111 1.3 oster if (lp->InstallSpareTable) {
112 1.27 oster retcode = rf_InstallSpareTable(raidPtr, 0, fcol);
113 1.3 oster if (retcode) {
114 1.3 oster RF_PANIC(); /* XXX fix this */
115 1.3 oster }
116 1.3 oster }
117 1.12 oster #endif
118 1.3 oster /* make the reconstruction map */
119 1.3 oster reconCtrlPtr->reconMap = rf_MakeReconMap(raidPtr, (int) (layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit),
120 1.3 oster raidPtr->sectorsPerDisk, numSpareRUs);
121 1.3 oster
122 1.3 oster /* make the per-disk reconstruction buffers */
123 1.3 oster for (i = 0; i < raidPtr->numCol; i++) {
124 1.15 oster reconCtrlPtr->perDiskInfo[i].rbuf = (i == fcol) ? NULL : rf_MakeReconBuffer(raidPtr, i, RF_RBUF_TYPE_EXCLUSIVE);
125 1.3 oster }
126 1.3 oster
127 1.3 oster /* initialize the event queue */
128 1.32 mrg rf_init_mutex2(reconCtrlPtr->eq_mutex, IPL_VM);
129 1.32 mrg rf_init_cond2(reconCtrlPtr->eq_cv, "rfevq");
130 1.17 oster
131 1.3 oster reconCtrlPtr->eventQueue = NULL;
132 1.3 oster reconCtrlPtr->eq_count = 0;
133 1.3 oster
134 1.3 oster /* make the floating recon buffers and append them to the free list */
135 1.29 mrg rf_mutex_init(&reconCtrlPtr->rb_mutex);
136 1.17 oster
137 1.3 oster reconCtrlPtr->fullBufferList = NULL;
138 1.3 oster reconCtrlPtr->floatingRbufs = NULL;
139 1.3 oster reconCtrlPtr->committedRbufs = NULL;
140 1.3 oster for (i = 0; i < raidPtr->numFloatingReconBufs; i++) {
141 1.25 perry rbuf = rf_MakeReconBuffer(raidPtr, fcol,
142 1.11 oster RF_RBUF_TYPE_FLOATING);
143 1.3 oster rbuf->next = reconCtrlPtr->floatingRbufs;
144 1.3 oster reconCtrlPtr->floatingRbufs = rbuf;
145 1.3 oster }
146 1.3 oster
147 1.3 oster /* create the parity stripe status table */
148 1.3 oster reconCtrlPtr->pssTable = rf_MakeParityStripeStatusTable(raidPtr);
149 1.3 oster
150 1.3 oster /* set the initial min head sep counter val */
151 1.3 oster reconCtrlPtr->minHeadSepCounter = 0;
152 1.3 oster
153 1.3 oster return (reconCtrlPtr);
154 1.1 oster }
155 1.1 oster
156 1.25 perry void
157 1.19 oster rf_FreeReconControl(RF_Raid_t *raidPtr)
158 1.1 oster {
159 1.15 oster RF_ReconCtrl_t *reconCtrlPtr = raidPtr->reconControl;
160 1.3 oster RF_ReconBuffer_t *t;
161 1.3 oster RF_ReconUnitNum_t i;
162 1.3 oster
163 1.3 oster RF_ASSERT(reconCtrlPtr);
164 1.3 oster for (i = 0; i < raidPtr->numCol; i++)
165 1.3 oster if (reconCtrlPtr->perDiskInfo[i].rbuf)
166 1.3 oster rf_FreeReconBuffer(reconCtrlPtr->perDiskInfo[i].rbuf);
167 1.24 oster
168 1.24 oster t = reconCtrlPtr->floatingRbufs;
169 1.24 oster while (t) {
170 1.3 oster reconCtrlPtr->floatingRbufs = t->next;
171 1.3 oster rf_FreeReconBuffer(t);
172 1.24 oster t = reconCtrlPtr->floatingRbufs;
173 1.3 oster }
174 1.24 oster
175 1.32 mrg rf_destroy_mutex2(reconCtrlPtr->eq_mutex);
176 1.32 mrg rf_destroy_cond2(reconCtrlPtr->eq_cv);
177 1.32 mrg
178 1.3 oster rf_FreeReconMap(reconCtrlPtr->reconMap);
179 1.3 oster rf_FreeParityStripeStatusTable(raidPtr, reconCtrlPtr->pssTable);
180 1.25 perry RF_Free(reconCtrlPtr->perDiskInfo,
181 1.11 oster raidPtr->numCol * sizeof(RF_PerDiskReconCtrl_t));
182 1.3 oster RF_Free(reconCtrlPtr, sizeof(*reconCtrlPtr));
183 1.1 oster }
184 1.1 oster
185 1.1 oster
186 1.1 oster /******************************************************************************
187 1.1 oster * computes the default head separation limit
188 1.1 oster *****************************************************************************/
189 1.25 perry RF_HeadSepLimit_t
190 1.19 oster rf_GetDefaultHeadSepLimit(RF_Raid_t *raidPtr)
191 1.1 oster {
192 1.3 oster RF_HeadSepLimit_t hsl;
193 1.14 jdolecek const RF_LayoutSW_t *lp;
194 1.1 oster
195 1.3 oster lp = raidPtr->Layout.map;
196 1.3 oster if (lp->GetDefaultHeadSepLimit == NULL)
197 1.3 oster return (-1);
198 1.3 oster hsl = lp->GetDefaultHeadSepLimit(raidPtr);
199 1.3 oster return (hsl);
200 1.1 oster }
201 1.1 oster
202 1.1 oster
203 1.1 oster /******************************************************************************
204 1.1 oster * computes the default number of floating recon buffers
205 1.1 oster *****************************************************************************/
206 1.25 perry int
207 1.19 oster rf_GetDefaultNumFloatingReconBuffers(RF_Raid_t *raidPtr)
208 1.1 oster {
209 1.14 jdolecek const RF_LayoutSW_t *lp;
210 1.3 oster int nrb;
211 1.1 oster
212 1.3 oster lp = raidPtr->Layout.map;
213 1.3 oster if (lp->GetDefaultNumFloatingReconBuffers == NULL)
214 1.3 oster return (3 * raidPtr->numCol);
215 1.3 oster nrb = lp->GetDefaultNumFloatingReconBuffers(raidPtr);
216 1.3 oster return (nrb);
217 1.1 oster }
218 1.1 oster
219 1.1 oster
220 1.1 oster /******************************************************************************
221 1.1 oster * creates and initializes a reconstruction buffer
222 1.1 oster *****************************************************************************/
223 1.3 oster RF_ReconBuffer_t *
224 1.19 oster rf_MakeReconBuffer(RF_Raid_t *raidPtr, RF_RowCol_t col, RF_RbufType_t type)
225 1.1 oster {
226 1.3 oster RF_RaidLayout_t *layoutPtr = &raidPtr->Layout;
227 1.3 oster RF_ReconBuffer_t *t;
228 1.3 oster u_int recon_buffer_size = rf_RaidAddressToByte(raidPtr, layoutPtr->SUsPerRU * layoutPtr->sectorsPerStripeUnit);
229 1.3 oster
230 1.22 oster t = pool_get(&rf_pools.reconbuffer, PR_WAITOK);
231 1.28 christos RF_Malloc(t->buffer, recon_buffer_size, (void *));
232 1.3 oster t->raidPtr = raidPtr;
233 1.3 oster t->col = col;
234 1.3 oster t->priority = RF_IO_RECON_PRIORITY;
235 1.3 oster t->type = type;
236 1.3 oster t->pssPtr = NULL;
237 1.3 oster t->next = NULL;
238 1.3 oster return (t);
239 1.1 oster }
240 1.1 oster /******************************************************************************
241 1.1 oster * frees a reconstruction buffer
242 1.1 oster *****************************************************************************/
243 1.25 perry void
244 1.19 oster rf_FreeReconBuffer(RF_ReconBuffer_t *rbuf)
245 1.1 oster {
246 1.3 oster RF_Raid_t *raidPtr = rbuf->raidPtr;
247 1.9 oster u_int recon_buffer_size;
248 1.9 oster
249 1.9 oster recon_buffer_size = rf_RaidAddressToByte(raidPtr, raidPtr->Layout.SUsPerRU * raidPtr->Layout.sectorsPerStripeUnit);
250 1.3 oster
251 1.3 oster RF_Free(rbuf->buffer, recon_buffer_size);
252 1.22 oster pool_put(&rf_pools.reconbuffer, rbuf);
253 1.1 oster }
254 1.1 oster
255 1.10 oster #if RF_DEBUG_RECON
256 1.23 oster XXXX IF you use this, you really want to fix the locking in here.
257 1.1 oster /******************************************************************************
258 1.1 oster * debug only: sanity check the number of floating recon bufs in use
259 1.1 oster *****************************************************************************/
260 1.25 perry void
261 1.19 oster rf_CheckFloatingRbufCount(RF_Raid_t *raidPtr, int dolock)
262 1.1 oster {
263 1.3 oster RF_ReconParityStripeStatus_t *p;
264 1.3 oster RF_PSStatusHeader_t *pssTable;
265 1.3 oster RF_ReconBuffer_t *rbuf;
266 1.3 oster int i, j, sum = 0;
267 1.3 oster
268 1.3 oster if (dolock)
269 1.15 oster RF_LOCK_MUTEX(raidPtr->reconControl->rb_mutex);
270 1.15 oster pssTable = raidPtr->reconControl->pssTable;
271 1.3 oster
272 1.3 oster for (i = 0; i < raidPtr->pssTableSize; i++) {
273 1.3 oster RF_LOCK_MUTEX(pssTable[i].mutex);
274 1.3 oster for (p = pssTable[i].chain; p; p = p->next) {
275 1.3 oster rbuf = (RF_ReconBuffer_t *) p->rbuf;
276 1.3 oster if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
277 1.3 oster sum++;
278 1.3 oster
279 1.3 oster rbuf = (RF_ReconBuffer_t *) p->writeRbuf;
280 1.3 oster if (rbuf && rbuf->type == RF_RBUF_TYPE_FLOATING)
281 1.3 oster sum++;
282 1.3 oster
283 1.3 oster for (j = 0; j < p->xorBufCount; j++) {
284 1.3 oster rbuf = (RF_ReconBuffer_t *) p->rbufsForXor[j];
285 1.3 oster RF_ASSERT(rbuf);
286 1.3 oster if (rbuf->type == RF_RBUF_TYPE_FLOATING)
287 1.3 oster sum++;
288 1.3 oster }
289 1.3 oster }
290 1.3 oster RF_UNLOCK_MUTEX(pssTable[i].mutex);
291 1.3 oster }
292 1.3 oster
293 1.25 perry for (rbuf = raidPtr->reconControl->floatingRbufs; rbuf;
294 1.11 oster rbuf = rbuf->next) {
295 1.3 oster if (rbuf->type == RF_RBUF_TYPE_FLOATING)
296 1.3 oster sum++;
297 1.3 oster }
298 1.25 perry for (rbuf = raidPtr->reconControl->committedRbufs; rbuf;
299 1.11 oster rbuf = rbuf->next) {
300 1.3 oster if (rbuf->type == RF_RBUF_TYPE_FLOATING)
301 1.3 oster sum++;
302 1.3 oster }
303 1.25 perry for (rbuf = raidPtr->reconControl->fullBufferList; rbuf;
304 1.11 oster rbuf = rbuf->next) {
305 1.3 oster if (rbuf->type == RF_RBUF_TYPE_FLOATING)
306 1.3 oster sum++;
307 1.3 oster }
308 1.3 oster RF_ASSERT(sum == raidPtr->numFloatingReconBufs);
309 1.1 oster
310 1.3 oster if (dolock)
311 1.15 oster RF_UNLOCK_MUTEX(raidPtr->reconControl->rb_mutex);
312 1.1 oster }
313 1.7 oster #endif
314 1.7 oster
315