Home | History | Annotate | Line # | Download | only in kern
kern_condvar.c revision 1.30.12.2
      1       1.30  uebayasi /*	$NetBSD: kern_condvar.c,v 1.30.12.2 2014/08/20 00:04:28 tls Exp $	*/
      2        1.2        ad 
      3        1.2        ad /*-
      4       1.15        ad  * Copyright (c) 2006, 2007, 2008 The NetBSD Foundation, Inc.
      5        1.2        ad  * All rights reserved.
      6        1.2        ad  *
      7        1.2        ad  * This code is derived from software contributed to The NetBSD Foundation
      8        1.2        ad  * by Andrew Doran.
      9        1.2        ad  *
     10        1.2        ad  * Redistribution and use in source and binary forms, with or without
     11        1.2        ad  * modification, are permitted provided that the following conditions
     12        1.2        ad  * are met:
     13        1.2        ad  * 1. Redistributions of source code must retain the above copyright
     14        1.2        ad  *    notice, this list of conditions and the following disclaimer.
     15        1.2        ad  * 2. Redistributions in binary form must reproduce the above copyright
     16        1.2        ad  *    notice, this list of conditions and the following disclaimer in the
     17        1.2        ad  *    documentation and/or other materials provided with the distribution.
     18        1.2        ad  *
     19        1.2        ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20        1.2        ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21        1.2        ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22        1.2        ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23        1.2        ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24        1.2        ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25        1.2        ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26        1.2        ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27        1.2        ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28        1.2        ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29        1.2        ad  * POSSIBILITY OF SUCH DAMAGE.
     30        1.2        ad  */
     31        1.2        ad 
     32        1.2        ad /*
     33       1.24        ad  * Kernel condition variable implementation.
     34        1.2        ad  */
     35        1.2        ad 
     36        1.2        ad #include <sys/cdefs.h>
     37       1.30  uebayasi __KERNEL_RCSID(0, "$NetBSD: kern_condvar.c,v 1.30.12.2 2014/08/20 00:04:28 tls Exp $");
     38        1.2        ad 
     39        1.2        ad #include <sys/param.h>
     40        1.2        ad #include <sys/proc.h>
     41        1.2        ad #include <sys/sched.h>
     42        1.2        ad #include <sys/systm.h>
     43        1.2        ad #include <sys/condvar.h>
     44        1.2        ad #include <sys/sleepq.h>
     45       1.20        ad #include <sys/lockdebug.h>
     46       1.24        ad #include <sys/cpu.h>
     47       1.20        ad 
     48       1.26   thorpej /*
     49       1.26   thorpej  * Accessors for the private contents of the kcondvar_t data type.
     50       1.26   thorpej  *
     51       1.26   thorpej  *	cv_opaque[0]	sleepq...
     52       1.26   thorpej  *	cv_opaque[1]	...pointers
     53       1.26   thorpej  *	cv_opaque[2]	description for ps(1)
     54       1.26   thorpej  *
     55       1.26   thorpej  * cv_opaque[0..1] is protected by the interlock passed to cv_wait() (enqueue
     56       1.26   thorpej  * only), and the sleep queue lock acquired with sleeptab_lookup() (enqueue
     57       1.26   thorpej  * and dequeue).
     58       1.26   thorpej  *
     59       1.26   thorpej  * cv_opaque[2] (the wmesg) is static and does not change throughout the life
     60       1.26   thorpej  * of the CV.
     61       1.26   thorpej  */
     62       1.26   thorpej #define	CV_SLEEPQ(cv)		((sleepq_t *)(cv)->cv_opaque)
     63       1.26   thorpej #define	CV_WMESG(cv)		((const char *)(cv)->cv_opaque[2])
     64       1.26   thorpej #define	CV_SET_WMESG(cv, v) 	(cv)->cv_opaque[2] = __UNCONST(v)
     65       1.26   thorpej 
     66       1.26   thorpej #define	CV_DEBUG_P(cv)	(CV_WMESG(cv) != nodebug)
     67       1.20        ad #define	CV_RA		((uintptr_t)__builtin_return_address(0))
     68        1.2        ad 
     69       1.27     rmind static void	cv_unsleep(lwp_t *, bool);
     70       1.20        ad static void	cv_wakeup_one(kcondvar_t *);
     71       1.20        ad static void	cv_wakeup_all(kcondvar_t *);
     72        1.2        ad 
     73       1.10        ad static syncobj_t cv_syncobj = {
     74        1.2        ad 	SOBJ_SLEEPQ_SORTED,
     75        1.2        ad 	cv_unsleep,
     76       1.14        ad 	sleepq_changepri,
     77        1.4      yamt 	sleepq_lendpri,
     78        1.4      yamt 	syncobj_noowner,
     79        1.2        ad };
     80        1.2        ad 
     81       1.20        ad lockops_t cv_lockops = {
     82       1.20        ad 	"Condition variable",
     83       1.20        ad 	LOCKOPS_CV,
     84       1.20        ad 	NULL
     85       1.20        ad };
     86       1.20        ad 
     87       1.10        ad static const char deadcv[] = "deadcv";
     88  1.30.12.2       tls #ifdef LOCKDEBUG
     89       1.20        ad static const char nodebug[] = "nodebug";
     90  1.30.12.2       tls #endif
     91       1.10        ad 
     92        1.2        ad /*
     93        1.2        ad  * cv_init:
     94        1.2        ad  *
     95        1.2        ad  *	Initialize a condition variable for use.
     96        1.2        ad  */
     97        1.2        ad void
     98        1.2        ad cv_init(kcondvar_t *cv, const char *wmesg)
     99        1.2        ad {
    100       1.21        ad #ifdef LOCKDEBUG
    101       1.20        ad 	bool dodebug;
    102        1.2        ad 
    103       1.20        ad 	dodebug = LOCKDEBUG_ALLOC(cv, &cv_lockops,
    104       1.20        ad 	    (uintptr_t)__builtin_return_address(0));
    105       1.21        ad 	if (!dodebug) {
    106       1.20        ad 		/* XXX This will break vfs_lockf. */
    107       1.21        ad 		wmesg = nodebug;
    108       1.20        ad 	}
    109       1.21        ad #endif
    110       1.21        ad 	KASSERT(wmesg != NULL);
    111       1.26   thorpej 	CV_SET_WMESG(cv, wmesg);
    112       1.20        ad 	sleepq_init(CV_SLEEPQ(cv));
    113        1.2        ad }
    114        1.2        ad 
    115        1.2        ad /*
    116        1.2        ad  * cv_destroy:
    117        1.2        ad  *
    118        1.2        ad  *	Tear down a condition variable.
    119        1.2        ad  */
    120        1.2        ad void
    121        1.2        ad cv_destroy(kcondvar_t *cv)
    122        1.2        ad {
    123        1.2        ad 
    124       1.20        ad 	LOCKDEBUG_FREE(CV_DEBUG_P(cv), cv);
    125        1.2        ad #ifdef DIAGNOSTIC
    126       1.15        ad 	KASSERT(cv_is_valid(cv));
    127       1.26   thorpej 	CV_SET_WMESG(cv, deadcv);
    128        1.2        ad #endif
    129        1.2        ad }
    130        1.2        ad 
    131        1.2        ad /*
    132        1.2        ad  * cv_enter:
    133        1.2        ad  *
    134        1.2        ad  *	Look up and lock the sleep queue corresponding to the given
    135        1.2        ad  *	condition variable, and increment the number of waiters.
    136        1.2        ad  */
    137       1.20        ad static inline void
    138        1.6        ad cv_enter(kcondvar_t *cv, kmutex_t *mtx, lwp_t *l)
    139        1.2        ad {
    140        1.2        ad 	sleepq_t *sq;
    141       1.18        ad 	kmutex_t *mp;
    142        1.2        ad 
    143       1.15        ad 	KASSERT(cv_is_valid(cv));
    144       1.24        ad 	KASSERT(!cpu_intr_p());
    145       1.14        ad 	KASSERT((l->l_pflag & LP_INTR) == 0 || panicstr != NULL);
    146        1.2        ad 
    147       1.20        ad 	LOCKDEBUG_LOCKED(CV_DEBUG_P(cv), cv, mtx, CV_RA, 0);
    148       1.20        ad 
    149       1.14        ad 	l->l_kpriority = true;
    150       1.24        ad 	mp = sleepq_hashlock(cv);
    151       1.20        ad 	sq = CV_SLEEPQ(cv);
    152       1.18        ad 	sleepq_enter(sq, l, mp);
    153       1.26   thorpej 	sleepq_enqueue(sq, cv, CV_WMESG(cv), &cv_syncobj);
    154        1.2        ad 	mutex_exit(mtx);
    155       1.24        ad 	KASSERT(cv_has_waiters(cv));
    156        1.2        ad }
    157        1.2        ad 
    158        1.2        ad /*
    159        1.6        ad  * cv_exit:
    160        1.6        ad  *
    161        1.6        ad  *	After resuming execution, check to see if we have been restarted
    162        1.6        ad  *	as a result of cv_signal().  If we have, but cannot take the
    163        1.6        ad  *	wakeup (because of eg a pending Unix signal or timeout) then try
    164        1.6        ad  *	to ensure that another LWP sees it.  This is necessary because
    165        1.6        ad  *	there may be multiple waiters, and at least one should take the
    166        1.6        ad  *	wakeup if possible.
    167        1.6        ad  */
    168        1.6        ad static inline int
    169        1.6        ad cv_exit(kcondvar_t *cv, kmutex_t *mtx, lwp_t *l, const int error)
    170        1.6        ad {
    171        1.6        ad 
    172        1.6        ad 	mutex_enter(mtx);
    173       1.20        ad 	if (__predict_false(error != 0))
    174        1.6        ad 		cv_signal(cv);
    175        1.6        ad 
    176       1.20        ad 	LOCKDEBUG_UNLOCKED(CV_DEBUG_P(cv), cv, CV_RA, 0);
    177       1.15        ad 	KASSERT(cv_is_valid(cv));
    178       1.10        ad 
    179        1.6        ad 	return error;
    180        1.6        ad }
    181        1.6        ad 
    182        1.6        ad /*
    183        1.2        ad  * cv_unsleep:
    184        1.2        ad  *
    185        1.2        ad  *	Remove an LWP from the condition variable and sleep queue.  This
    186        1.2        ad  *	is called when the LWP has not been awoken normally but instead
    187        1.2        ad  *	interrupted: for example, when a signal is received.  Must be
    188        1.2        ad  *	called with the LWP locked, and must return it unlocked.
    189        1.2        ad  */
    190       1.27     rmind static void
    191       1.16        ad cv_unsleep(lwp_t *l, bool cleanup)
    192        1.2        ad {
    193  1.30.12.2       tls 	kcondvar_t *cv __diagused;
    194        1.2        ad 
    195       1.15        ad 	cv = (kcondvar_t *)(uintptr_t)l->l_wchan;
    196       1.15        ad 
    197       1.20        ad 	KASSERT(l->l_wchan == (wchan_t)cv);
    198       1.20        ad 	KASSERT(l->l_sleepq == CV_SLEEPQ(cv));
    199       1.15        ad 	KASSERT(cv_is_valid(cv));
    200       1.24        ad 	KASSERT(cv_has_waiters(cv));
    201        1.2        ad 
    202       1.27     rmind 	sleepq_unsleep(l, cleanup);
    203        1.2        ad }
    204        1.2        ad 
    205        1.2        ad /*
    206        1.2        ad  * cv_wait:
    207        1.2        ad  *
    208        1.2        ad  *	Wait non-interruptably on a condition variable until awoken.
    209        1.2        ad  */
    210        1.2        ad void
    211        1.2        ad cv_wait(kcondvar_t *cv, kmutex_t *mtx)
    212        1.2        ad {
    213        1.6        ad 	lwp_t *l = curlwp;
    214        1.2        ad 
    215        1.8      yamt 	KASSERT(mutex_owned(mtx));
    216        1.2        ad 
    217       1.20        ad 	cv_enter(cv, mtx, l);
    218        1.8      yamt 	(void)sleepq_block(0, false);
    219        1.6        ad 	(void)cv_exit(cv, mtx, l, 0);
    220        1.2        ad }
    221        1.2        ad 
    222        1.2        ad /*
    223        1.2        ad  * cv_wait_sig:
    224        1.2        ad  *
    225        1.2        ad  *	Wait on a condition variable until a awoken or a signal is received.
    226        1.2        ad  *	Will also return early if the process is exiting.  Returns zero if
    227       1.29       jym  *	awoken normally, ERESTART if a signal was received and the system
    228        1.2        ad  *	call is restartable, or EINTR otherwise.
    229        1.2        ad  */
    230        1.2        ad int
    231        1.2        ad cv_wait_sig(kcondvar_t *cv, kmutex_t *mtx)
    232        1.2        ad {
    233        1.6        ad 	lwp_t *l = curlwp;
    234        1.2        ad 	int error;
    235        1.2        ad 
    236        1.8      yamt 	KASSERT(mutex_owned(mtx));
    237        1.2        ad 
    238       1.20        ad 	cv_enter(cv, mtx, l);
    239        1.8      yamt 	error = sleepq_block(0, true);
    240        1.6        ad 	return cv_exit(cv, mtx, l, error);
    241        1.2        ad }
    242        1.2        ad 
    243        1.2        ad /*
    244        1.2        ad  * cv_timedwait:
    245        1.2        ad  *
    246        1.2        ad  *	Wait on a condition variable until awoken or the specified timeout
    247        1.2        ad  *	expires.  Returns zero if awoken normally or EWOULDBLOCK if the
    248        1.2        ad  *	timeout expired.
    249  1.30.12.1       tls  *
    250  1.30.12.1       tls  *	timo is a timeout in ticks.  timo = 0 specifies an infinite timeout.
    251        1.2        ad  */
    252        1.2        ad int
    253        1.2        ad cv_timedwait(kcondvar_t *cv, kmutex_t *mtx, int timo)
    254        1.2        ad {
    255        1.6        ad 	lwp_t *l = curlwp;
    256        1.2        ad 	int error;
    257        1.2        ad 
    258        1.8      yamt 	KASSERT(mutex_owned(mtx));
    259        1.2        ad 
    260       1.20        ad 	cv_enter(cv, mtx, l);
    261        1.8      yamt 	error = sleepq_block(timo, false);
    262        1.6        ad 	return cv_exit(cv, mtx, l, error);
    263        1.2        ad }
    264        1.2        ad 
    265        1.2        ad /*
    266        1.2        ad  * cv_timedwait_sig:
    267        1.2        ad  *
    268        1.2        ad  *	Wait on a condition variable until a timeout expires, awoken or a
    269        1.2        ad  *	signal is received.  Will also return early if the process is
    270       1.29       jym  *	exiting.  Returns zero if awoken normally, EWOULDBLOCK if the
    271        1.2        ad  *	timeout expires, ERESTART if a signal was received and the system
    272        1.2        ad  *	call is restartable, or EINTR otherwise.
    273  1.30.12.1       tls  *
    274  1.30.12.1       tls  *	timo is a timeout in ticks.  timo = 0 specifies an infinite timeout.
    275        1.2        ad  */
    276        1.2        ad int
    277        1.2        ad cv_timedwait_sig(kcondvar_t *cv, kmutex_t *mtx, int timo)
    278        1.2        ad {
    279        1.6        ad 	lwp_t *l = curlwp;
    280        1.2        ad 	int error;
    281        1.2        ad 
    282        1.8      yamt 	KASSERT(mutex_owned(mtx));
    283        1.2        ad 
    284       1.20        ad 	cv_enter(cv, mtx, l);
    285        1.8      yamt 	error = sleepq_block(timo, true);
    286        1.6        ad 	return cv_exit(cv, mtx, l, error);
    287        1.2        ad }
    288        1.2        ad 
    289        1.2        ad /*
    290        1.2        ad  * cv_signal:
    291        1.2        ad  *
    292        1.2        ad  *	Wake the highest priority LWP waiting on a condition variable.
    293        1.2        ad  *	Must be called with the interlocking mutex held.
    294        1.2        ad  */
    295        1.2        ad void
    296        1.2        ad cv_signal(kcondvar_t *cv)
    297        1.2        ad {
    298       1.20        ad 
    299       1.22        ad 	/* LOCKDEBUG_WAKEUP(CV_DEBUG_P(cv), cv, CV_RA); */
    300       1.20        ad 	KASSERT(cv_is_valid(cv));
    301       1.20        ad 
    302       1.24        ad 	if (__predict_false(!TAILQ_EMPTY(CV_SLEEPQ(cv))))
    303       1.24        ad 		cv_wakeup_one(cv);
    304       1.20        ad }
    305       1.20        ad 
    306       1.20        ad static void __noinline
    307       1.20        ad cv_wakeup_one(kcondvar_t *cv)
    308       1.20        ad {
    309        1.2        ad 	sleepq_t *sq;
    310       1.18        ad 	kmutex_t *mp;
    311       1.20        ad 	lwp_t *l;
    312        1.2        ad 
    313       1.15        ad 	KASSERT(cv_is_valid(cv));
    314       1.15        ad 
    315       1.24        ad 	mp = sleepq_hashlock(cv);
    316       1.20        ad 	sq = CV_SLEEPQ(cv);
    317       1.20        ad 	l = TAILQ_FIRST(sq);
    318       1.20        ad 	if (l == NULL) {
    319       1.20        ad 		mutex_spin_exit(mp);
    320        1.2        ad 		return;
    321       1.20        ad 	}
    322       1.20        ad 	KASSERT(l->l_sleepq == sq);
    323       1.20        ad 	KASSERT(l->l_mutex == mp);
    324       1.20        ad 	KASSERT(l->l_wchan == cv);
    325       1.27     rmind 	sleepq_remove(sq, l);
    326       1.20        ad 	mutex_spin_exit(mp);
    327        1.2        ad 
    328       1.15        ad 	KASSERT(cv_is_valid(cv));
    329        1.2        ad }
    330        1.2        ad 
    331        1.2        ad /*
    332        1.2        ad  * cv_broadcast:
    333        1.2        ad  *
    334        1.2        ad  *	Wake all LWPs waiting on a condition variable.  Must be called
    335        1.2        ad  *	with the interlocking mutex held.
    336        1.2        ad  */
    337        1.2        ad void
    338        1.2        ad cv_broadcast(kcondvar_t *cv)
    339        1.2        ad {
    340       1.20        ad 
    341       1.22        ad 	/* LOCKDEBUG_WAKEUP(CV_DEBUG_P(cv), cv, CV_RA); */
    342       1.20        ad 	KASSERT(cv_is_valid(cv));
    343       1.20        ad 
    344       1.24        ad 	if (__predict_false(!TAILQ_EMPTY(CV_SLEEPQ(cv))))
    345       1.24        ad 		cv_wakeup_all(cv);
    346       1.20        ad }
    347       1.20        ad 
    348       1.20        ad static void __noinline
    349       1.20        ad cv_wakeup_all(kcondvar_t *cv)
    350       1.20        ad {
    351        1.2        ad 	sleepq_t *sq;
    352       1.18        ad 	kmutex_t *mp;
    353       1.20        ad 	lwp_t *l, *next;
    354        1.2        ad 
    355       1.15        ad 	KASSERT(cv_is_valid(cv));
    356       1.15        ad 
    357       1.24        ad 	mp = sleepq_hashlock(cv);
    358       1.20        ad 	sq = CV_SLEEPQ(cv);
    359       1.20        ad 	for (l = TAILQ_FIRST(sq); l != NULL; l = next) {
    360       1.20        ad 		KASSERT(l->l_sleepq == sq);
    361       1.20        ad 		KASSERT(l->l_mutex == mp);
    362       1.20        ad 		KASSERT(l->l_wchan == cv);
    363       1.20        ad 		next = TAILQ_NEXT(l, l_sleepchain);
    364       1.27     rmind 		sleepq_remove(sq, l);
    365       1.20        ad 	}
    366       1.20        ad 	mutex_spin_exit(mp);
    367        1.2        ad 
    368       1.15        ad 	KASSERT(cv_is_valid(cv));
    369        1.2        ad }
    370        1.2        ad 
    371        1.2        ad /*
    372        1.2        ad  * cv_has_waiters:
    373        1.2        ad  *
    374        1.2        ad  *	For diagnostic assertions: return non-zero if a condition
    375        1.2        ad  *	variable has waiters.
    376        1.2        ad  */
    377        1.7        ad bool
    378        1.2        ad cv_has_waiters(kcondvar_t *cv)
    379        1.2        ad {
    380       1.23     chris 
    381       1.25        ad 	return !TAILQ_EMPTY(CV_SLEEPQ(cv));
    382        1.2        ad }
    383       1.15        ad 
    384       1.15        ad /*
    385       1.15        ad  * cv_is_valid:
    386       1.15        ad  *
    387       1.15        ad  *	For diagnostic assertions: return non-zero if a condition
    388       1.15        ad  *	variable appears to be valid.  No locks need be held.
    389       1.15        ad  */
    390       1.15        ad bool
    391       1.15        ad cv_is_valid(kcondvar_t *cv)
    392       1.15        ad {
    393       1.15        ad 
    394       1.26   thorpej 	return CV_WMESG(cv) != deadcv && CV_WMESG(cv) != NULL;
    395       1.15        ad }
    396