Home | History | Annotate | Line # | Download | only in kern
kern_condvar.c revision 1.32.6.1
      1  1.32.6.1    rmind /*	$NetBSD: kern_condvar.c,v 1.32.6.1 2014/05/18 17:46:07 rmind Exp $	*/
      2       1.2       ad 
      3       1.2       ad /*-
      4      1.15       ad  * Copyright (c) 2006, 2007, 2008 The NetBSD Foundation, Inc.
      5       1.2       ad  * All rights reserved.
      6       1.2       ad  *
      7       1.2       ad  * This code is derived from software contributed to The NetBSD Foundation
      8       1.2       ad  * by Andrew Doran.
      9       1.2       ad  *
     10       1.2       ad  * Redistribution and use in source and binary forms, with or without
     11       1.2       ad  * modification, are permitted provided that the following conditions
     12       1.2       ad  * are met:
     13       1.2       ad  * 1. Redistributions of source code must retain the above copyright
     14       1.2       ad  *    notice, this list of conditions and the following disclaimer.
     15       1.2       ad  * 2. Redistributions in binary form must reproduce the above copyright
     16       1.2       ad  *    notice, this list of conditions and the following disclaimer in the
     17       1.2       ad  *    documentation and/or other materials provided with the distribution.
     18       1.2       ad  *
     19       1.2       ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20       1.2       ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21       1.2       ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22       1.2       ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23       1.2       ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24       1.2       ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25       1.2       ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26       1.2       ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27       1.2       ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28       1.2       ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29       1.2       ad  * POSSIBILITY OF SUCH DAMAGE.
     30       1.2       ad  */
     31       1.2       ad 
     32       1.2       ad /*
     33      1.24       ad  * Kernel condition variable implementation.
     34       1.2       ad  */
     35       1.2       ad 
     36       1.2       ad #include <sys/cdefs.h>
     37  1.32.6.1    rmind __KERNEL_RCSID(0, "$NetBSD: kern_condvar.c,v 1.32.6.1 2014/05/18 17:46:07 rmind Exp $");
     38       1.2       ad 
     39       1.2       ad #include <sys/param.h>
     40       1.2       ad #include <sys/proc.h>
     41       1.2       ad #include <sys/sched.h>
     42       1.2       ad #include <sys/systm.h>
     43       1.2       ad #include <sys/condvar.h>
     44       1.2       ad #include <sys/sleepq.h>
     45      1.20       ad #include <sys/lockdebug.h>
     46      1.24       ad #include <sys/cpu.h>
     47      1.20       ad 
     48      1.26  thorpej /*
     49      1.26  thorpej  * Accessors for the private contents of the kcondvar_t data type.
     50      1.26  thorpej  *
     51      1.26  thorpej  *	cv_opaque[0]	sleepq...
     52      1.26  thorpej  *	cv_opaque[1]	...pointers
     53      1.26  thorpej  *	cv_opaque[2]	description for ps(1)
     54      1.26  thorpej  *
     55      1.26  thorpej  * cv_opaque[0..1] is protected by the interlock passed to cv_wait() (enqueue
     56      1.26  thorpej  * only), and the sleep queue lock acquired with sleeptab_lookup() (enqueue
     57      1.26  thorpej  * and dequeue).
     58      1.26  thorpej  *
     59      1.26  thorpej  * cv_opaque[2] (the wmesg) is static and does not change throughout the life
     60      1.26  thorpej  * of the CV.
     61      1.26  thorpej  */
     62      1.26  thorpej #define	CV_SLEEPQ(cv)		((sleepq_t *)(cv)->cv_opaque)
     63      1.26  thorpej #define	CV_WMESG(cv)		((const char *)(cv)->cv_opaque[2])
     64      1.26  thorpej #define	CV_SET_WMESG(cv, v) 	(cv)->cv_opaque[2] = __UNCONST(v)
     65      1.26  thorpej 
     66      1.26  thorpej #define	CV_DEBUG_P(cv)	(CV_WMESG(cv) != nodebug)
     67      1.20       ad #define	CV_RA		((uintptr_t)__builtin_return_address(0))
     68       1.2       ad 
     69      1.27    rmind static void	cv_unsleep(lwp_t *, bool);
     70      1.20       ad static void	cv_wakeup_one(kcondvar_t *);
     71      1.20       ad static void	cv_wakeup_all(kcondvar_t *);
     72       1.2       ad 
     73      1.10       ad static syncobj_t cv_syncobj = {
     74       1.2       ad 	SOBJ_SLEEPQ_SORTED,
     75       1.2       ad 	cv_unsleep,
     76      1.14       ad 	sleepq_changepri,
     77       1.4     yamt 	sleepq_lendpri,
     78       1.4     yamt 	syncobj_noowner,
     79       1.2       ad };
     80       1.2       ad 
     81      1.20       ad lockops_t cv_lockops = {
     82      1.20       ad 	"Condition variable",
     83      1.20       ad 	LOCKOPS_CV,
     84      1.20       ad 	NULL
     85      1.20       ad };
     86      1.20       ad 
     87      1.10       ad static const char deadcv[] = "deadcv";
     88  1.32.6.1    rmind #ifdef LOCKDEBUG
     89      1.20       ad static const char nodebug[] = "nodebug";
     90  1.32.6.1    rmind #endif
     91      1.10       ad 
     92       1.2       ad /*
     93       1.2       ad  * cv_init:
     94       1.2       ad  *
     95       1.2       ad  *	Initialize a condition variable for use.
     96       1.2       ad  */
     97       1.2       ad void
     98       1.2       ad cv_init(kcondvar_t *cv, const char *wmesg)
     99       1.2       ad {
    100      1.21       ad #ifdef LOCKDEBUG
    101      1.20       ad 	bool dodebug;
    102       1.2       ad 
    103      1.20       ad 	dodebug = LOCKDEBUG_ALLOC(cv, &cv_lockops,
    104      1.20       ad 	    (uintptr_t)__builtin_return_address(0));
    105      1.21       ad 	if (!dodebug) {
    106      1.20       ad 		/* XXX This will break vfs_lockf. */
    107      1.21       ad 		wmesg = nodebug;
    108      1.20       ad 	}
    109      1.21       ad #endif
    110      1.21       ad 	KASSERT(wmesg != NULL);
    111      1.26  thorpej 	CV_SET_WMESG(cv, wmesg);
    112      1.20       ad 	sleepq_init(CV_SLEEPQ(cv));
    113       1.2       ad }
    114       1.2       ad 
    115       1.2       ad /*
    116       1.2       ad  * cv_destroy:
    117       1.2       ad  *
    118       1.2       ad  *	Tear down a condition variable.
    119       1.2       ad  */
    120       1.2       ad void
    121       1.2       ad cv_destroy(kcondvar_t *cv)
    122       1.2       ad {
    123       1.2       ad 
    124      1.20       ad 	LOCKDEBUG_FREE(CV_DEBUG_P(cv), cv);
    125       1.2       ad #ifdef DIAGNOSTIC
    126      1.15       ad 	KASSERT(cv_is_valid(cv));
    127      1.26  thorpej 	CV_SET_WMESG(cv, deadcv);
    128       1.2       ad #endif
    129       1.2       ad }
    130       1.2       ad 
    131       1.2       ad /*
    132       1.2       ad  * cv_enter:
    133       1.2       ad  *
    134       1.2       ad  *	Look up and lock the sleep queue corresponding to the given
    135       1.2       ad  *	condition variable, and increment the number of waiters.
    136       1.2       ad  */
    137      1.20       ad static inline void
    138       1.6       ad cv_enter(kcondvar_t *cv, kmutex_t *mtx, lwp_t *l)
    139       1.2       ad {
    140       1.2       ad 	sleepq_t *sq;
    141      1.18       ad 	kmutex_t *mp;
    142       1.2       ad 
    143      1.15       ad 	KASSERT(cv_is_valid(cv));
    144      1.24       ad 	KASSERT(!cpu_intr_p());
    145      1.14       ad 	KASSERT((l->l_pflag & LP_INTR) == 0 || panicstr != NULL);
    146       1.2       ad 
    147      1.20       ad 	LOCKDEBUG_LOCKED(CV_DEBUG_P(cv), cv, mtx, CV_RA, 0);
    148      1.20       ad 
    149      1.14       ad 	l->l_kpriority = true;
    150      1.24       ad 	mp = sleepq_hashlock(cv);
    151      1.20       ad 	sq = CV_SLEEPQ(cv);
    152      1.18       ad 	sleepq_enter(sq, l, mp);
    153      1.26  thorpej 	sleepq_enqueue(sq, cv, CV_WMESG(cv), &cv_syncobj);
    154       1.2       ad 	mutex_exit(mtx);
    155      1.24       ad 	KASSERT(cv_has_waiters(cv));
    156       1.2       ad }
    157       1.2       ad 
    158       1.2       ad /*
    159       1.6       ad  * cv_exit:
    160       1.6       ad  *
    161       1.6       ad  *	After resuming execution, check to see if we have been restarted
    162       1.6       ad  *	as a result of cv_signal().  If we have, but cannot take the
    163       1.6       ad  *	wakeup (because of eg a pending Unix signal or timeout) then try
    164       1.6       ad  *	to ensure that another LWP sees it.  This is necessary because
    165       1.6       ad  *	there may be multiple waiters, and at least one should take the
    166       1.6       ad  *	wakeup if possible.
    167       1.6       ad  */
    168       1.6       ad static inline int
    169       1.6       ad cv_exit(kcondvar_t *cv, kmutex_t *mtx, lwp_t *l, const int error)
    170       1.6       ad {
    171       1.6       ad 
    172       1.6       ad 	mutex_enter(mtx);
    173      1.20       ad 	if (__predict_false(error != 0))
    174       1.6       ad 		cv_signal(cv);
    175       1.6       ad 
    176      1.20       ad 	LOCKDEBUG_UNLOCKED(CV_DEBUG_P(cv), cv, CV_RA, 0);
    177      1.15       ad 	KASSERT(cv_is_valid(cv));
    178      1.10       ad 
    179       1.6       ad 	return error;
    180       1.6       ad }
    181       1.6       ad 
    182       1.6       ad /*
    183       1.2       ad  * cv_unsleep:
    184       1.2       ad  *
    185       1.2       ad  *	Remove an LWP from the condition variable and sleep queue.  This
    186       1.2       ad  *	is called when the LWP has not been awoken normally but instead
    187       1.2       ad  *	interrupted: for example, when a signal is received.  Must be
    188       1.2       ad  *	called with the LWP locked, and must return it unlocked.
    189       1.2       ad  */
    190      1.27    rmind static void
    191      1.16       ad cv_unsleep(lwp_t *l, bool cleanup)
    192       1.2       ad {
    193  1.32.6.1    rmind 	kcondvar_t *cv __diagused;
    194       1.2       ad 
    195      1.15       ad 	cv = (kcondvar_t *)(uintptr_t)l->l_wchan;
    196      1.15       ad 
    197      1.20       ad 	KASSERT(l->l_wchan == (wchan_t)cv);
    198      1.20       ad 	KASSERT(l->l_sleepq == CV_SLEEPQ(cv));
    199      1.15       ad 	KASSERT(cv_is_valid(cv));
    200      1.24       ad 	KASSERT(cv_has_waiters(cv));
    201       1.2       ad 
    202      1.27    rmind 	sleepq_unsleep(l, cleanup);
    203       1.2       ad }
    204       1.2       ad 
    205       1.2       ad /*
    206       1.2       ad  * cv_wait:
    207       1.2       ad  *
    208       1.2       ad  *	Wait non-interruptably on a condition variable until awoken.
    209       1.2       ad  */
    210       1.2       ad void
    211       1.2       ad cv_wait(kcondvar_t *cv, kmutex_t *mtx)
    212       1.2       ad {
    213       1.6       ad 	lwp_t *l = curlwp;
    214       1.2       ad 
    215       1.8     yamt 	KASSERT(mutex_owned(mtx));
    216       1.2       ad 
    217      1.20       ad 	cv_enter(cv, mtx, l);
    218       1.8     yamt 	(void)sleepq_block(0, false);
    219       1.6       ad 	(void)cv_exit(cv, mtx, l, 0);
    220       1.2       ad }
    221       1.2       ad 
    222       1.2       ad /*
    223       1.2       ad  * cv_wait_sig:
    224       1.2       ad  *
    225       1.2       ad  *	Wait on a condition variable until a awoken or a signal is received.
    226       1.2       ad  *	Will also return early if the process is exiting.  Returns zero if
    227      1.29      jym  *	awoken normally, ERESTART if a signal was received and the system
    228       1.2       ad  *	call is restartable, or EINTR otherwise.
    229       1.2       ad  */
    230       1.2       ad int
    231       1.2       ad cv_wait_sig(kcondvar_t *cv, kmutex_t *mtx)
    232       1.2       ad {
    233       1.6       ad 	lwp_t *l = curlwp;
    234       1.2       ad 	int error;
    235       1.2       ad 
    236       1.8     yamt 	KASSERT(mutex_owned(mtx));
    237       1.2       ad 
    238      1.20       ad 	cv_enter(cv, mtx, l);
    239       1.8     yamt 	error = sleepq_block(0, true);
    240       1.6       ad 	return cv_exit(cv, mtx, l, error);
    241       1.2       ad }
    242       1.2       ad 
    243       1.2       ad /*
    244       1.2       ad  * cv_timedwait:
    245       1.2       ad  *
    246       1.2       ad  *	Wait on a condition variable until awoken or the specified timeout
    247       1.2       ad  *	expires.  Returns zero if awoken normally or EWOULDBLOCK if the
    248       1.2       ad  *	timeout expired.
    249      1.31      apb  *
    250      1.31      apb  *	timo is a timeout in ticks.  timo = 0 specifies an infinite timeout.
    251       1.2       ad  */
    252       1.2       ad int
    253       1.2       ad cv_timedwait(kcondvar_t *cv, kmutex_t *mtx, int timo)
    254       1.2       ad {
    255       1.6       ad 	lwp_t *l = curlwp;
    256       1.2       ad 	int error;
    257       1.2       ad 
    258       1.8     yamt 	KASSERT(mutex_owned(mtx));
    259       1.2       ad 
    260      1.20       ad 	cv_enter(cv, mtx, l);
    261       1.8     yamt 	error = sleepq_block(timo, false);
    262       1.6       ad 	return cv_exit(cv, mtx, l, error);
    263       1.2       ad }
    264       1.2       ad 
    265       1.2       ad /*
    266       1.2       ad  * cv_timedwait_sig:
    267       1.2       ad  *
    268       1.2       ad  *	Wait on a condition variable until a timeout expires, awoken or a
    269       1.2       ad  *	signal is received.  Will also return early if the process is
    270      1.29      jym  *	exiting.  Returns zero if awoken normally, EWOULDBLOCK if the
    271       1.2       ad  *	timeout expires, ERESTART if a signal was received and the system
    272       1.2       ad  *	call is restartable, or EINTR otherwise.
    273      1.32      apb  *
    274      1.32      apb  *	timo is a timeout in ticks.  timo = 0 specifies an infinite timeout.
    275       1.2       ad  */
    276       1.2       ad int
    277       1.2       ad cv_timedwait_sig(kcondvar_t *cv, kmutex_t *mtx, int timo)
    278       1.2       ad {
    279       1.6       ad 	lwp_t *l = curlwp;
    280       1.2       ad 	int error;
    281       1.2       ad 
    282       1.8     yamt 	KASSERT(mutex_owned(mtx));
    283       1.2       ad 
    284      1.20       ad 	cv_enter(cv, mtx, l);
    285       1.8     yamt 	error = sleepq_block(timo, true);
    286       1.6       ad 	return cv_exit(cv, mtx, l, error);
    287       1.2       ad }
    288       1.2       ad 
    289       1.2       ad /*
    290       1.2       ad  * cv_signal:
    291       1.2       ad  *
    292       1.2       ad  *	Wake the highest priority LWP waiting on a condition variable.
    293       1.2       ad  *	Must be called with the interlocking mutex held.
    294       1.2       ad  */
    295       1.2       ad void
    296       1.2       ad cv_signal(kcondvar_t *cv)
    297       1.2       ad {
    298      1.20       ad 
    299      1.22       ad 	/* LOCKDEBUG_WAKEUP(CV_DEBUG_P(cv), cv, CV_RA); */
    300      1.20       ad 	KASSERT(cv_is_valid(cv));
    301      1.20       ad 
    302      1.24       ad 	if (__predict_false(!TAILQ_EMPTY(CV_SLEEPQ(cv))))
    303      1.24       ad 		cv_wakeup_one(cv);
    304      1.20       ad }
    305      1.20       ad 
    306      1.20       ad static void __noinline
    307      1.20       ad cv_wakeup_one(kcondvar_t *cv)
    308      1.20       ad {
    309       1.2       ad 	sleepq_t *sq;
    310      1.18       ad 	kmutex_t *mp;
    311      1.20       ad 	lwp_t *l;
    312       1.2       ad 
    313      1.15       ad 	KASSERT(cv_is_valid(cv));
    314      1.15       ad 
    315      1.24       ad 	mp = sleepq_hashlock(cv);
    316      1.20       ad 	sq = CV_SLEEPQ(cv);
    317      1.20       ad 	l = TAILQ_FIRST(sq);
    318      1.20       ad 	if (l == NULL) {
    319      1.20       ad 		mutex_spin_exit(mp);
    320       1.2       ad 		return;
    321      1.20       ad 	}
    322      1.20       ad 	KASSERT(l->l_sleepq == sq);
    323      1.20       ad 	KASSERT(l->l_mutex == mp);
    324      1.20       ad 	KASSERT(l->l_wchan == cv);
    325      1.27    rmind 	sleepq_remove(sq, l);
    326      1.20       ad 	mutex_spin_exit(mp);
    327       1.2       ad 
    328      1.15       ad 	KASSERT(cv_is_valid(cv));
    329       1.2       ad }
    330       1.2       ad 
    331       1.2       ad /*
    332       1.2       ad  * cv_broadcast:
    333       1.2       ad  *
    334       1.2       ad  *	Wake all LWPs waiting on a condition variable.  Must be called
    335       1.2       ad  *	with the interlocking mutex held.
    336       1.2       ad  */
    337       1.2       ad void
    338       1.2       ad cv_broadcast(kcondvar_t *cv)
    339       1.2       ad {
    340      1.20       ad 
    341      1.22       ad 	/* LOCKDEBUG_WAKEUP(CV_DEBUG_P(cv), cv, CV_RA); */
    342      1.20       ad 	KASSERT(cv_is_valid(cv));
    343      1.20       ad 
    344      1.24       ad 	if (__predict_false(!TAILQ_EMPTY(CV_SLEEPQ(cv))))
    345      1.24       ad 		cv_wakeup_all(cv);
    346      1.20       ad }
    347      1.20       ad 
    348      1.20       ad static void __noinline
    349      1.20       ad cv_wakeup_all(kcondvar_t *cv)
    350      1.20       ad {
    351       1.2       ad 	sleepq_t *sq;
    352      1.18       ad 	kmutex_t *mp;
    353      1.20       ad 	lwp_t *l, *next;
    354       1.2       ad 
    355      1.15       ad 	KASSERT(cv_is_valid(cv));
    356      1.15       ad 
    357      1.24       ad 	mp = sleepq_hashlock(cv);
    358      1.20       ad 	sq = CV_SLEEPQ(cv);
    359      1.20       ad 	for (l = TAILQ_FIRST(sq); l != NULL; l = next) {
    360      1.20       ad 		KASSERT(l->l_sleepq == sq);
    361      1.20       ad 		KASSERT(l->l_mutex == mp);
    362      1.20       ad 		KASSERT(l->l_wchan == cv);
    363      1.20       ad 		next = TAILQ_NEXT(l, l_sleepchain);
    364      1.27    rmind 		sleepq_remove(sq, l);
    365      1.20       ad 	}
    366      1.20       ad 	mutex_spin_exit(mp);
    367       1.2       ad 
    368      1.15       ad 	KASSERT(cv_is_valid(cv));
    369       1.2       ad }
    370       1.2       ad 
    371       1.2       ad /*
    372       1.2       ad  * cv_has_waiters:
    373       1.2       ad  *
    374       1.2       ad  *	For diagnostic assertions: return non-zero if a condition
    375       1.2       ad  *	variable has waiters.
    376       1.2       ad  */
    377       1.7       ad bool
    378       1.2       ad cv_has_waiters(kcondvar_t *cv)
    379       1.2       ad {
    380      1.23    chris 
    381      1.25       ad 	return !TAILQ_EMPTY(CV_SLEEPQ(cv));
    382       1.2       ad }
    383      1.15       ad 
    384      1.15       ad /*
    385      1.15       ad  * cv_is_valid:
    386      1.15       ad  *
    387      1.15       ad  *	For diagnostic assertions: return non-zero if a condition
    388      1.15       ad  *	variable appears to be valid.  No locks need be held.
    389      1.15       ad  */
    390      1.15       ad bool
    391      1.15       ad cv_is_valid(kcondvar_t *cv)
    392      1.15       ad {
    393      1.15       ad 
    394      1.26  thorpej 	return CV_WMESG(cv) != deadcv && CV_WMESG(cv) != NULL;
    395      1.15       ad }
    396