subr_lockdebug.c revision 1.1.2.3 1 /* $NetBSD: subr_lockdebug.c,v 1.1.2.3 2006/11/17 16:34:37 ad Exp $ */
2
3 /*-
4 * Copyright (c) 2006 The NetBSD Foundation, Inc.
5 * All rights reserved.
6 *
7 * This code is derived from software contributed to The NetBSD Foundation
8 * by Andrew Doran.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 * 3. All advertising materials mentioning features or use of this software
19 * must display the following acknowledgement:
20 * This product includes software developed by the NetBSD
21 * Foundation, Inc. and its contributors.
22 * 4. Neither the name of The NetBSD Foundation nor the names of its
23 * contributors may be used to endorse or promote products derived
24 * from this software without specific prior written permission.
25 *
26 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
27 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
28 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
29 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
30 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
31 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
32 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
33 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
34 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
35 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
36 * POSSIBILITY OF SUCH DAMAGE.
37 */
38
39 /*
40 * Basic lock debugging code shared among lock primitives.
41 */
42
43 #include "opt_multiprocessor.h"
44
45 #include <sys/cdefs.h>
46 __KERNEL_RCSID(0, "$NetBSD: subr_lockdebug.c,v 1.1.2.3 2006/11/17 16:34:37 ad Exp $");
47
48 #include <sys/param.h>
49 #include <sys/proc.h>
50 #include <sys/systm.h>
51 #include <sys/malloc.h>
52 #include <sys/lock.h>
53 #include <sys/lockdebug.h>
54
55 #include <machine/cpu.h>
56
57 #ifdef LOCKDEBUG
58
/*
 * Sizing constants, per-record flag bits, and the "no record" ID used by
 * the lock debugging tables below.
 */
59 #define LD_BATCH_SHIFT 9 /* log2 of the number of records in one batch */
60 #define LD_BATCH (1 << LD_BATCH_SHIFT) /* records per batch */
61 #define LD_BATCH_MASK (LD_BATCH - 1) /* extracts a record's index within its batch from an ID */
62 #define LD_MAX_LOCKS 1048576 /* IDs are always below this; ld_table has LD_MAX_LOCKS / LD_BATCH slots */
63 #define LD_SLOP 16 /* lockdebug_more() refills while ld_nfree is below this */
64
65 #define LD_LOCKED 0x01 /* ld_flags: set while the lock is held exclusively */
66 #define LD_SLEEPER 0x02 /* ld_flags: set when the lock's lockops has lo_sleeplock set */
67
68 #define LD_NOID LD_MAX_LOCKS /* ID for a lock with no record; lockdebug_lookup() returns NULL for it */
69
/*
 * A spin lock used internally by the lock debugging code, bundled with
 * the interrupt priority level saved when it was taken.
 */
70 typedef struct lockdebuglk {
71 __cpu_simple_lock_t lk_lock; /* taken and released by lockdebug_lock()/lockdebug_unlock() */
72 int lk_oldspl; /* spllock() return value, restored with splx() on unlock */
73 } volatile lockdebuglk_t;
74
/*
 * Debugging record for one tracked lock.  Records live in batches
 * referenced from ld_table and are found by ID in lockdebug_lookup().
 */
75 typedef struct lockdebug {
76 _TAILQ_ENTRY(struct lockdebug, volatile) ld_chain; /* linkage on ld_free, ld_sleepers or ld_spinners */
77 volatile void *ld_lock; /* address of the tracked lock; NULL while the record is free */
78 lockops_t *ld_lockops; /* lock type operations (lo_name, lo_dump, lo_sleeplock) */
79 struct lwp *ld_lwp; /* curlwp at the last exclusive acquire; NULL after release */
80 uintptr_t ld_locked; /* 'where' value passed to the last exclusive acquire */
81 uintptr_t ld_unlocked; /* 'where' value passed to the last exclusive release */
82 u_int ld_id; /* this record's ID */
83 u_short ld_cpu; /* cpu_number() at the last exclusive acquire */
84 u_short ld_shares; /* count of shared holds currently recorded */
85 u_char ld_flags; /* LD_LOCKED | LD_SLEEPER */
86 } volatile lockdebug_t;
87
/* List head type for queues of lockdebug records. */
88 typedef _TAILQ_HEAD(lockdebuglist, struct lockdebug, volatile) lockdebuglist_t;
89
/*
 * Internal spin locks.  lockdebug_lookup() hands back ld_sleeper_lk for
 * records flagged LD_SLEEPER and ld_spinner_lk for all others; ld_free_lk
 * is held around manipulation of ld_free and ld_nfree.
 */
90 lockdebuglk_t ld_sleeper_lk;
91 lockdebuglk_t ld_spinner_lk;
92 lockdebuglk_t ld_free_lk;
93
94 lockdebuglist_t ld_sleepers; /* sleep locks currently held exclusively */
95 lockdebuglist_t ld_spinners; /* spin locks currently held exclusively */
96 lockdebuglist_t ld_free; /* records available to lockdebug_alloc() */
97 int ld_nfree; /* running count of records on ld_free */
98 int ld_freeptr; /* ld_table slot that lockdebug_more() fills next */
99 int ld_recurse; /* NOTE(review): not referenced anywhere in the visible code */
100 lockdebug_t *ld_table[LD_MAX_LOCKS / LD_BATCH]; /* batch base pointers, indexed by id >> LD_BATCH_SHIFT */
101 char ld_panicbuf[1024]; /* scratch buffer in which lockdebug_abort1() formats its report */
102
103 lockdebug_t ld_prime[LD_BATCH]; /* statically allocated first batch, installed by lockdebug_init() */
104
105 MALLOC_DEFINE(M_LOCKDEBUG, "lockdebug", "lockdebug structures");
106
/* Functions defined later in this file. */
107 void lockdebug_abort1(lockdebug_t *, lockdebuglk_t *lk, const char *,
108 const char *);
109 void lockdebug_more(void);
110
111 static inline void
112 lockdebug_lock(lockdebuglk_t *lk)
113 {
114 int s;
115
116 s = spllock();
117 __cpu_simple_lock(&lk->lk_lock);
118 lk->lk_oldspl = s;
119 }
120
121 static inline void
122 lockdebug_unlock(lockdebuglk_t *lk)
123 {
124 int s;
125
126 s = lk->lk_oldspl;
127 __cpu_simple_unlock(&lk->lk_lock);
128 splx(s);
129 }
130
131 /*
132 * lockdebug_lookup:
133 *
134 * Find a lockdebug structure by ID and return it locked.
135 */
136 static inline lockdebug_t *
137 lockdebug_lookup(u_int id, lockdebuglk_t **lk)
138 {
139 lockdebug_t *ld;
140
141 if (id == LD_NOID)
142 return NULL;
143
144 ld = ld_table[id >> LD_BATCH_SHIFT] + (id & LD_BATCH_MASK);
145
146 if (id == 0 || id >= LD_MAX_LOCKS || ld == NULL || ld->ld_lock == NULL)
147 panic("lockdebug_lookup: uninitialized lock (id=%d)", id);
148
149 if (ld->ld_id != id)
150 panic("lockdebug_lookup: corrupt table");
151
152 if ((ld->ld_flags & LD_SLEEPER) != 0)
153 *lk = &ld_sleeper_lk;
154 else
155 *lk = &ld_spinner_lk;
156
157 lockdebug_lock(*lk);
158 return ld;
159 }
160
161 /*
162 * lockdebug_init:
163 *
164 * Initialize the lockdebug system. Allocate an initial pool of
165 * lockdebug structures before the VM system is up and running.
166 */
167 void
168 lockdebug_init(void)
169 {
170 lockdebug_t *ld;
171 int i;
172
173 __cpu_simple_lock_init(&ld_sleeper_lk.lk_lock);
174 __cpu_simple_lock_init(&ld_spinner_lk.lk_lock);
175 __cpu_simple_lock_init(&ld_free_lk.lk_lock);
176
177 TAILQ_INIT(&ld_free);
178 TAILQ_INIT(&ld_sleepers);
179 TAILQ_INIT(&ld_spinners);
180
181 ld = ld_prime;
182 ld_table[0] = ld;
183 for (i = 1, ld++; i < LD_BATCH; i++, ld++) {
184 ld->ld_id = i;
185 TAILQ_INSERT_TAIL(&ld_free, ld, ld_chain);
186 }
187 ld_freeptr = 1;
188 ld_nfree = LD_BATCH;
189 }
190
191 /*
192 * lockdebug_alloc:
193 *
194 * A lock is being initialized, so allocate an associated debug
195 * structure.
196 */
197 u_int
198 lockdebug_alloc(volatile void *lock, lockops_t *lo)
199 {
200 struct cpu_info *ci;
201 lockdebug_t *ld;
202
203 if (panicstr != NULL)
204 return 0;
205
206 ci = curcpu();
207
208 /*
209 * Pinch a new debug structure. We may recurse because we call
210 * malloc(), which may need to initialize new locks somewhere
211 * down the path. If not recursing, we try to maintain at keep
212 * LD_SLOP structures free, which should hopefully be enough to
213 * satisfy malloc(). If we can't provide a structure, not to
214 * worry: we'll just mark the lock as not having an ID.
215 */
216 lockdebug_lock(&ld_free_lk);
217 ci->ci_lkdebug_recurse++;
218
219 if (TAILQ_EMPTY(&ld_free)) {
220 if (ci->ci_lkdebug_recurse > 1) {
221 ci->ci_lkdebug_recurse--;
222 lockdebug_unlock(&ld_free_lk);
223 return (LD_NOID);
224 }
225 lockdebug_more();
226 } else if (ci->ci_lkdebug_recurse == 1 && ld_nfree < LD_SLOP)
227 lockdebug_more();
228
229 ld = TAILQ_FIRST(&ld_free);
230 TAILQ_REMOVE(&ld_free, ld, ld_chain);
231 ld_nfree--;
232
233 ci->ci_lkdebug_recurse--;
234 lockdebug_unlock(&ld_free_lk);
235
236 if (ld->ld_lock != NULL)
237 panic("lockdebug_alloc: corrupt table");
238
239 if (lo->lo_sleeplock)
240 lockdebug_lock(&ld_sleeper_lk);
241 else
242 lockdebug_lock(&ld_spinner_lk);
243
244 /* Initialise the structure. */
245 ld->ld_lock = lock;
246 ld->ld_lockops = lo;
247 ld->ld_locked = 0;
248 ld->ld_unlocked = 0;
249 ld->ld_lwp = NULL;
250
251 if (lo->lo_sleeplock) {
252 ld->ld_flags = LD_SLEEPER;
253 lockdebug_unlock(&ld_sleeper_lk);
254 } else {
255 ld->ld_flags = 0;
256 lockdebug_unlock(&ld_spinner_lk);
257 }
258
259 return ld->ld_id;
260 }
261
262 /*
263 * lockdebug_free:
264 *
265 * A lock is being destroyed, so release debugging resources.
266 */
267 void
268 lockdebug_free(volatile void *lock, u_int id)
269 {
270 lockdebug_t *ld;
271 lockdebuglk_t *lk;
272
273 if (panicstr != NULL)
274 return;
275
276 if ((ld = lockdebug_lookup(id, &lk)) == NULL)
277 return;
278
279 if (ld->ld_lock != lock) {
280 panic("lockdebug_free: destroying uninitialized lock %p"
281 "(ld_id=%d ld_lock=%p)", lock, id, ld->ld_lock);
282 lockdebug_abort1(ld, lk, __FUNCTION__, "lock record follows");
283 }
284 if ((ld->ld_flags & LD_LOCKED) != 0)
285 lockdebug_abort1(ld, lk, __FUNCTION__, "is locked");
286
287 ld->ld_lock = NULL;
288
289 lockdebug_unlock(lk);
290
291 lockdebug_lock(&ld_free_lk);
292 TAILQ_INSERT_TAIL(&ld_free, ld, ld_chain);
293 ld_nfree++;
294 lockdebug_unlock(&ld_free_lk);
295 }
296
297 /*
298 * lockdebug_more:
299 *
300 * Allocate a batch of debug structures and add to the free list. Must
301 * be called with ld_free_lk held.
302 */
303 void
304 lockdebug_more(void)
305 {
306 lockdebug_t *ld;
307 void *block;
308 int i, base;
309
310 while (ld_nfree < LD_SLOP) {
311 lockdebug_unlock(&ld_free_lk);
312 block = malloc(LD_BATCH * sizeof(lockdebug_t), M_LOCKDEBUG,
313 M_NOWAIT | M_ZERO); /* XXX M_NOWAIT */
314 lockdebug_lock(&ld_free_lk);
315
316 base = ld_freeptr;
317 if (ld_table[base] != NULL) {
318 /* Somebody beat us to it. */
319 lockdebug_unlock(&ld_free_lk);
320 free(block, M_LOCKDEBUG);
321 lockdebug_lock(&ld_free_lk);
322 continue;
323 }
324 ld_table[base] = block;
325 ld_freeptr++;
326 ld_nfree += LD_BATCH;
327 ld = block;
328 base <<= LD_BATCH_SHIFT;
329
330 for (i = 0; i < LD_BATCH; i++, ld++) {
331 ld->ld_id = i + base;
332 ld->ld_lock = NULL;
333 TAILQ_INSERT_TAIL(&ld_free, ld, ld_chain);
334 }
335
336 mb_write();
337 ld_table[base] = ld;
338 }
339 }
340
341 /*
342 * lockdebug_locked:
343 *
344 * Process a lock acquire operation.
345 */
346 void
347 lockdebug_locked(u_int id, uintptr_t where, int shared)
348 {
349 struct lwp *l = curlwp;
350 lockdebuglk_t *lk;
351 lockdebug_t *ld;
352
353 if (panicstr != NULL)
354 return;
355
356 if ((ld = lockdebug_lookup(id, &lk)) == NULL)
357 return;
358
359 if ((ld->ld_flags & LD_LOCKED) != 0)
360 lockdebug_abort1(ld, lk, __FUNCTION__, "already locked");
361
362 if (shared) {
363 if (l == NULL)
364 lockdebug_abort1(ld, lk, __FUNCTION__, "releasing "
365 "shared lock from interrupt context");
366
367 l->l_shlocks++;
368 ld->ld_shares++;
369 } else {
370 ld->ld_flags |= LD_LOCKED;
371 ld->ld_locked = where;
372 ld->ld_cpu = (u_short)cpu_number();
373 ld->ld_lwp = l;
374
375 if ((ld->ld_flags & LD_SLEEPER) != 0) {
376 l->l_exlocks++;
377 TAILQ_INSERT_TAIL(&ld_sleepers, ld, ld_chain);
378 } else {
379 curcpu()->ci_spin_locks2++;
380 TAILQ_INSERT_TAIL(&ld_spinners, ld, ld_chain);
381 }
382 }
383
384 lockdebug_unlock(lk);
385 }
386
387 /*
388 * lockdebug_unlocked:
389 *
390 * Process a lock release operation.
391 */
392 void
393 lockdebug_unlocked(u_int id, uintptr_t where, int shared)
394 {
395 struct lwp *l = curlwp;
396 lockdebuglk_t *lk;
397 lockdebug_t *ld;
398
399 if (panicstr != NULL)
400 return;
401
402 if ((ld = lockdebug_lookup(id, &lk)) == NULL)
403 return;
404
405 if (shared) {
406 if (l == NULL)
407 lockdebug_abort1(ld, lk, __FUNCTION__, "acquiring "
408 "shared lock from interrupt context");
409 if (l->l_shlocks == 0)
410 lockdebug_abort1(ld, lk, __FUNCTION__, "no shared "
411 "locks held by LWP");
412 if (ld->ld_shares == 0)
413 lockdebug_abort1(ld, lk, __FUNCTION__, "no shared "
414 "holds on this lock");
415 l->l_shlocks--;
416 ld->ld_shares--;
417 } else {
418 if ((ld->ld_flags & LD_LOCKED) == 0)
419 lockdebug_abort1(ld, lk, __FUNCTION__, "not locked");
420
421 if ((ld->ld_flags & LD_SLEEPER) != 0) {
422 if (ld->ld_lwp != curlwp)
423 lockdebug_abort1(ld, lk, __FUNCTION__,
424 "not held by current LWP");
425 ld->ld_flags &= ~LD_LOCKED;
426 ld->ld_unlocked = where;
427 ld->ld_lwp = NULL;
428 curlwp->l_exlocks--;
429 TAILQ_REMOVE(&ld_sleepers, ld, ld_chain);
430 } else {
431 if (ld->ld_cpu != (u_short)cpu_number())
432 lockdebug_abort1(ld, lk, __FUNCTION__,
433 "not held by current CPU");
434 ld->ld_flags &= ~LD_LOCKED;
435 ld->ld_unlocked = where;
436 ld->ld_lwp = NULL;
437 curcpu()->ci_spin_locks2--;
438 TAILQ_REMOVE(&ld_spinners, ld, ld_chain);
439 }
440 }
441
442 lockdebug_unlock(lk);
443 }
444
445 /*
446 * lockdebug_barrier:
447 *
448 * Panic if we hold more than one specified spin lock, and optionally,
449 * if we hold sleep locks.
450 */
451 void
452 lockdebug_barrier(volatile void *spinlock, int slplocks)
453 {
454 struct lwp *l = curlwp;
455 lockdebug_t *ld;
456 u_short cpuno;
457
458 if (panicstr != NULL)
459 return;
460
461 if (curcpu()->ci_spin_locks2 != 0) {
462 cpuno = (u_short)cpu_number();
463
464 lockdebug_lock(&ld_spinner_lk);
465 TAILQ_FOREACH(ld, &ld_spinners, ld_chain) {
466 if (ld->ld_lock == spinlock) {
467 if (ld->ld_cpu != cpuno)
468 lockdebug_abort1(ld, &ld_spinner_lk,
469 __FUNCTION__,
470 "not held by current CPU");
471 continue;
472 }
473 if (ld->ld_cpu == cpuno)
474 lockdebug_abort1(ld, &ld_spinner_lk,
475 __FUNCTION__, "spin lock held");
476 }
477 lockdebug_unlock(&ld_spinner_lk);
478 }
479
480 if (!slplocks) {
481 if (l->l_exlocks != 0) {
482 lockdebug_lock(&ld_sleeper_lk);
483 TAILQ_FOREACH(ld, &ld_sleepers, ld_chain) {
484 if (ld->ld_lwp == l)
485 lockdebug_abort1(ld, &ld_sleeper_lk,
486 __FUNCTION__, "sleep lock held");
487 }
488 lockdebug_unlock(&ld_sleeper_lk);
489 }
490 if (l->l_shlocks != 0)
491 panic("lockdebug_barrier: holding %d shared locks",
492 l->l_shlocks);
493 }
494 }
495
496 void
497 lockdebug_abort1(lockdebug_t *ld, lockdebuglk_t *lk, const char *func,
498 const char *msg)
499 {
500 char *buf;
501 int p;
502
503 /*
504 * The kernel is about to fall flat on its face, so assume that 1k
505 * will be enough to hold the dump and abuse the return value from
506 * snprintf.
507 */
508 buf = ld_panicbuf;
509
510 p = snprintf(buf, sizeof(buf), "%s error: %s: %s\n\n",
511 ld->ld_lockops->lo_name, func, msg);
512
513 p += snprintf(buf + p, sizeof(buf) - p,
514 "lock address : %#018lx type : %18s\n"
515 "shared holds : %18d exclusive: %12slocked\n"
516 "last locked : %#018lx unlocked : %#018lx\n"
517 "current cpu : %18d last held: %18d\n"
518 "current lwp : %#018lx last held: %#018lx\n",
519 (long)ld->ld_lock,
520 ((ld->ld_flags & LD_SLEEPER) == 0 ? "spin" : "sleep"),
521 ld->ld_shares, ((ld->ld_flags & LD_LOCKED) == 0 ? "un" : " "),
522 (long)ld->ld_locked, (long)ld->ld_unlocked,
523 (int)cpu_number(), (int)ld->ld_cpu,
524 (long)curlwp, (long)ld->ld_lwp);
525
526 if (ld->ld_lockops->lo_dump != NULL)
527 (void)(*ld->ld_lockops->lo_dump)(ld->ld_lock, buf + p,
528 sizeof(buf) - p);
529
530 lockdebug_unlock(lk);
531 printf("%s", buf);
532 panic("LOCKDEBUG");
533 }
534
535 #endif /* LOCKDEBUG */
536
537 /*
538 * lockdebug_abort:
539 *
540 * An error has been trapped - dump lock info and call panic().
541 */
542 void
543 lockdebug_abort(int id, volatile void *lock, lockops_t *ops,
544 const char *func, const char *msg)
545 {
546 char buf[192];
547 #ifdef LOCKDEBUG
548 lockdebug_t *ld;
549 lockdebuglk_t *lk;
550
551 if ((ld = lockdebug_lookup(id, &lk)) != NULL) {
552 lockdebug_abort1(ld, lk, func, msg);
553 /* NOTREACHED */
554 }
555 #endif /* LOCKDEBUG */
556
557 /*
558 * The kernel is about to fall flat on its face, so assume that 192
559 * bytes will be enough to hold the dump.
560 */
561 printf("%s error: %s: %s\n\n"
562 "lock address : %#018lx\n"
563 "current cpu : %18d\n"
564 "current lwp : %#018lx\n",
565 ops->lo_name, func, msg, (long)lock, (int)cpu_number(),
566 (long)curlwp);
567
568 (void)(*ops->lo_dump)(lock, buf, sizeof(buf));
569
570 printf("%s", buf);
571
572 panic("lock error");
573 }
574