kern_condvar.c revision 1.50 1 1.50 thorpej /* $NetBSD: kern_condvar.c,v 1.50 2020/05/03 17:36:33 thorpej Exp $ */
2 1.2 ad
3 1.2 ad /*-
4 1.43 ad * Copyright (c) 2006, 2007, 2008, 2019, 2020 The NetBSD Foundation, Inc.
5 1.2 ad * All rights reserved.
6 1.2 ad *
7 1.2 ad * This code is derived from software contributed to The NetBSD Foundation
8 1.2 ad * by Andrew Doran.
9 1.2 ad *
10 1.2 ad * Redistribution and use in source and binary forms, with or without
11 1.2 ad * modification, are permitted provided that the following conditions
12 1.2 ad * are met:
13 1.2 ad * 1. Redistributions of source code must retain the above copyright
14 1.2 ad * notice, this list of conditions and the following disclaimer.
15 1.2 ad * 2. Redistributions in binary form must reproduce the above copyright
16 1.2 ad * notice, this list of conditions and the following disclaimer in the
17 1.2 ad * documentation and/or other materials provided with the distribution.
18 1.2 ad *
19 1.2 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.2 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.2 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.2 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.2 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.2 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.2 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.2 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.2 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.2 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.2 ad * POSSIBILITY OF SUCH DAMAGE.
30 1.2 ad */
31 1.2 ad
32 1.2 ad /*
33 1.24 ad * Kernel condition variable implementation.
34 1.2 ad */
35 1.2 ad
36 1.2 ad #include <sys/cdefs.h>
37 1.50 thorpej __KERNEL_RCSID(0, "$NetBSD: kern_condvar.c,v 1.50 2020/05/03 17:36:33 thorpej Exp $");
38 1.2 ad
39 1.2 ad #include <sys/param.h>
40 1.2 ad #include <sys/systm.h>
41 1.35 uebayasi #include <sys/lwp.h>
42 1.2 ad #include <sys/condvar.h>
43 1.2 ad #include <sys/sleepq.h>
44 1.20 ad #include <sys/lockdebug.h>
45 1.24 ad #include <sys/cpu.h>
46 1.37 riastrad #include <sys/kernel.h>
47 1.20 ad
48 1.26 thorpej /*
49 1.26 thorpej * Accessors for the private contents of the kcondvar_t data type.
50 1.26 thorpej *
51 1.44 ad * cv_opaque[0] sleepq_t
52 1.44 ad * cv_opaque[1] description for ps(1)
53 1.26 thorpej *
54 1.44 ad * cv_opaque[0] is protected by the interlock passed to cv_wait() (enqueue
55 1.43 ad * only), and the sleep queue lock acquired with sleepq_hashlock() (enqueue
56 1.26 thorpej * and dequeue).
57 1.26 thorpej *
58 1.44 ad * cv_opaque[1] (the wmesg) is static and does not change throughout the life
59 1.26 thorpej * of the CV.
60 1.26 thorpej */
/* The sleep queue head lives at the start of the opaque storage. */
#define	CV_SLEEPQ(cv)		((sleepq_t *)(cv)->cv_opaque)
/* The wait message pointer is kept in cv_opaque[1]. */
#define	CV_WMESG(cv)		((const char *)(cv)->cv_opaque[1])
/* Fully parenthesised so the expansion is safe inside larger expressions. */
#define	CV_SET_WMESG(cv, v)	((cv)->cv_opaque[1] = __UNCONST(v))

/*
 * NOTE(review): "nodebug" is not defined in the visible part of this
 * file and neither CV_DEBUG_P nor CV_RA has a user here -- confirm
 * whether they can be retired.
 */
#define	CV_DEBUG_P(cv)		(CV_WMESG(cv) != nodebug)
#define	CV_RA			((uintptr_t)__builtin_return_address(0))
67 1.2 ad
68 1.36 chs static void cv_unsleep(lwp_t *, bool);
69 1.36 chs static inline void cv_wakeup_one(kcondvar_t *);
70 1.36 chs static inline void cv_wakeup_all(kcondvar_t *);
71 1.2 ad
72 1.43 ad syncobj_t cv_syncobj = {
73 1.41 ozaki .sobj_flag = SOBJ_SLEEPQ_SORTED,
74 1.41 ozaki .sobj_unsleep = cv_unsleep,
75 1.41 ozaki .sobj_changepri = sleepq_changepri,
76 1.41 ozaki .sobj_lendpri = sleepq_lendpri,
77 1.41 ozaki .sobj_owner = syncobj_noowner,
78 1.2 ad };
79 1.2 ad
80 1.10 ad static const char deadcv[] = "deadcv";
81 1.10 ad
82 1.2 ad /*
83 1.2 ad * cv_init:
84 1.2 ad *
85 1.2 ad * Initialize a condition variable for use.
86 1.2 ad */
87 1.2 ad void
88 1.2 ad cv_init(kcondvar_t *cv, const char *wmesg)
89 1.2 ad {
90 1.2 ad
91 1.21 ad KASSERT(wmesg != NULL);
92 1.26 thorpej CV_SET_WMESG(cv, wmesg);
93 1.20 ad sleepq_init(CV_SLEEPQ(cv));
94 1.2 ad }
95 1.2 ad
96 1.2 ad /*
97 1.2 ad * cv_destroy:
98 1.2 ad *
99 1.2 ad * Tear down a condition variable.
100 1.2 ad */
101 1.2 ad void
102 1.2 ad cv_destroy(kcondvar_t *cv)
103 1.2 ad {
104 1.2 ad
105 1.2 ad #ifdef DIAGNOSTIC
106 1.15 ad KASSERT(cv_is_valid(cv));
107 1.45 ad KASSERT(!cv_has_waiters(cv));
108 1.26 thorpej CV_SET_WMESG(cv, deadcv);
109 1.2 ad #endif
110 1.2 ad }
111 1.2 ad
112 1.2 ad /*
113 1.2 ad * cv_enter:
114 1.2 ad *
115 1.2 ad * Look up and lock the sleep queue corresponding to the given
116 1.2 ad * condition variable, and increment the number of waiters.
117 1.2 ad */
118 1.20 ad static inline void
119 1.47 ad cv_enter(kcondvar_t *cv, kmutex_t *mtx, lwp_t *l, bool catch_p)
120 1.2 ad {
121 1.2 ad sleepq_t *sq;
122 1.18 ad kmutex_t *mp;
123 1.2 ad
124 1.15 ad KASSERT(cv_is_valid(cv));
125 1.24 ad KASSERT(!cpu_intr_p());
126 1.14 ad KASSERT((l->l_pflag & LP_INTR) == 0 || panicstr != NULL);
127 1.2 ad
128 1.14 ad l->l_kpriority = true;
129 1.24 ad mp = sleepq_hashlock(cv);
130 1.20 ad sq = CV_SLEEPQ(cv);
131 1.18 ad sleepq_enter(sq, l, mp);
132 1.47 ad sleepq_enqueue(sq, cv, CV_WMESG(cv), &cv_syncobj, catch_p);
133 1.2 ad mutex_exit(mtx);
134 1.24 ad KASSERT(cv_has_waiters(cv));
135 1.2 ad }
136 1.2 ad
137 1.2 ad /*
138 1.2 ad * cv_unsleep:
139 1.2 ad *
140 1.2 ad * Remove an LWP from the condition variable and sleep queue. This
141 1.2 ad * is called when the LWP has not been awoken normally but instead
142 1.2 ad * interrupted: for example, when a signal is received. Must be
143 1.42 ad * called with the LWP locked. Will unlock if "unlock" is true.
144 1.2 ad */
145 1.27 rmind static void
146 1.42 ad cv_unsleep(lwp_t *l, bool unlock)
147 1.2 ad {
148 1.34 martin kcondvar_t *cv __diagused;
149 1.2 ad
150 1.15 ad cv = (kcondvar_t *)(uintptr_t)l->l_wchan;
151 1.15 ad
152 1.20 ad KASSERT(l->l_wchan == (wchan_t)cv);
153 1.20 ad KASSERT(l->l_sleepq == CV_SLEEPQ(cv));
154 1.15 ad KASSERT(cv_is_valid(cv));
155 1.24 ad KASSERT(cv_has_waiters(cv));
156 1.2 ad
157 1.42 ad sleepq_unsleep(l, unlock);
158 1.2 ad }
159 1.2 ad
160 1.2 ad /*
161 1.2 ad * cv_wait:
162 1.2 ad *
163 1.2 ad * Wait non-interruptably on a condition variable until awoken.
164 1.2 ad */
165 1.2 ad void
166 1.2 ad cv_wait(kcondvar_t *cv, kmutex_t *mtx)
167 1.2 ad {
168 1.6 ad lwp_t *l = curlwp;
169 1.2 ad
170 1.8 yamt KASSERT(mutex_owned(mtx));
171 1.2 ad
172 1.47 ad cv_enter(cv, mtx, l, false);
173 1.8 yamt (void)sleepq_block(0, false);
174 1.36 chs mutex_enter(mtx);
175 1.2 ad }
176 1.2 ad
177 1.2 ad /*
178 1.2 ad * cv_wait_sig:
179 1.2 ad *
180 1.2 ad * Wait on a condition variable until a awoken or a signal is received.
181 1.2 ad * Will also return early if the process is exiting. Returns zero if
182 1.29 jym * awoken normally, ERESTART if a signal was received and the system
183 1.2 ad * call is restartable, or EINTR otherwise.
184 1.2 ad */
185 1.2 ad int
186 1.2 ad cv_wait_sig(kcondvar_t *cv, kmutex_t *mtx)
187 1.2 ad {
188 1.6 ad lwp_t *l = curlwp;
189 1.2 ad int error;
190 1.2 ad
191 1.8 yamt KASSERT(mutex_owned(mtx));
192 1.2 ad
193 1.47 ad cv_enter(cv, mtx, l, true);
194 1.8 yamt error = sleepq_block(0, true);
195 1.45 ad mutex_enter(mtx);
196 1.45 ad return error;
197 1.2 ad }
198 1.2 ad
199 1.2 ad /*
200 1.2 ad * cv_timedwait:
201 1.2 ad *
202 1.2 ad * Wait on a condition variable until awoken or the specified timeout
203 1.2 ad * expires. Returns zero if awoken normally or EWOULDBLOCK if the
204 1.2 ad * timeout expired.
205 1.31 apb *
206 1.31 apb * timo is a timeout in ticks. timo = 0 specifies an infinite timeout.
207 1.2 ad */
208 1.2 ad int
209 1.2 ad cv_timedwait(kcondvar_t *cv, kmutex_t *mtx, int timo)
210 1.2 ad {
211 1.6 ad lwp_t *l = curlwp;
212 1.2 ad int error;
213 1.2 ad
214 1.8 yamt KASSERT(mutex_owned(mtx));
215 1.2 ad
216 1.47 ad cv_enter(cv, mtx, l, false);
217 1.8 yamt error = sleepq_block(timo, false);
218 1.45 ad mutex_enter(mtx);
219 1.45 ad return error;
220 1.2 ad }
221 1.2 ad
222 1.2 ad /*
223 1.2 ad * cv_timedwait_sig:
224 1.2 ad *
225 1.2 ad * Wait on a condition variable until a timeout expires, awoken or a
226 1.2 ad * signal is received. Will also return early if the process is
227 1.29 jym * exiting. Returns zero if awoken normally, EWOULDBLOCK if the
228 1.2 ad * timeout expires, ERESTART if a signal was received and the system
229 1.2 ad * call is restartable, or EINTR otherwise.
230 1.32 apb *
231 1.32 apb * timo is a timeout in ticks. timo = 0 specifies an infinite timeout.
232 1.2 ad */
233 1.2 ad int
234 1.2 ad cv_timedwait_sig(kcondvar_t *cv, kmutex_t *mtx, int timo)
235 1.2 ad {
236 1.6 ad lwp_t *l = curlwp;
237 1.2 ad int error;
238 1.2 ad
239 1.8 yamt KASSERT(mutex_owned(mtx));
240 1.2 ad
241 1.47 ad cv_enter(cv, mtx, l, true);
242 1.8 yamt error = sleepq_block(timo, true);
243 1.45 ad mutex_enter(mtx);
244 1.45 ad return error;
245 1.2 ad }
246 1.2 ad
247 1.49 riastrad /*
248 1.49 riastrad * cv_timedwaitclock:
249 1.49 riastrad *
250 1.49 riastrad * Wait on a condition variable until awoken normally, or the
251 1.49 riastrad * specified timeout expires according to the provided clock.
252 1.49 riastrad * Returns zero if awoken normally or EWOULDBLOCK if the timeout
253 1.49 riastrad * expired. For relative timeouts ((flags & TIMER_ABSTIME) == 0),
254 1.49 riastrad * updates timeout with the time left.
255 1.49 riastrad *
256 1.49 riastrad * timeout == NULL specifies an infinite timeout. epsilon is a
257 1.49 riastrad * requested maximum error in timeout (excluding spurious
258 1.49 riastrad * wakeups).
259 1.49 riastrad */
260 1.49 riastrad int
261 1.49 riastrad cv_timedwaitclock(kcondvar_t *cv, kmutex_t *mtx, struct timespec *timeout,
262 1.49 riastrad clockid_t clockid, int flags, const struct bintime *epsilon)
263 1.49 riastrad {
264 1.49 riastrad struct timedwaitclock T = {
265 1.49 riastrad .timeout = timeout,
266 1.49 riastrad .clockid = clockid,
267 1.49 riastrad .flags = flags,
268 1.49 riastrad .epsilon = epsilon,
269 1.49 riastrad };
270 1.49 riastrad int timo;
271 1.49 riastrad int error;
272 1.49 riastrad
273 1.49 riastrad if (timeout == NULL) {
274 1.49 riastrad cv_wait(cv, mtx);
275 1.49 riastrad return 0;
276 1.49 riastrad }
277 1.49 riastrad
278 1.50 thorpej error = timedwaitclock_begin(&T, &timo);
279 1.49 riastrad if (error)
280 1.49 riastrad return error;
281 1.49 riastrad error = cv_timedwait(cv, mtx, timo);
282 1.50 thorpej timedwaitclock_end(&T);
283 1.49 riastrad return error;
284 1.49 riastrad }
285 1.49 riastrad
286 1.49 riastrad /*
287 1.49 riastrad * cv_timedwaitclock_sig:
288 1.49 riastrad *
289 1.49 riastrad * Wait on a condition variable until awoken normally, interrupted
290 1.49 riastrad * by a signal, or the specified timeout expires according to the
291 1.49 riastrad * provided clock. Returns zero if awoken normally,
292 1.49 riastrad * EINTR/ERESTART if interrupted by a signal, or EWOULDBLOCK if
293 1.49 riastrad * the timeout expired. For relative timeouts ((flags &
294 1.49 riastrad * TIMER_ABSTIME) == 0), updates timeout with the time left.
295 1.49 riastrad *
296 1.49 riastrad * timeout == NULL specifies an infinite timeout. epsilon is a
297 1.49 riastrad * requested maximum error in timeout (excluding spurious
298 1.49 riastrad * wakeups).
299 1.49 riastrad */
300 1.49 riastrad int
301 1.49 riastrad cv_timedwaitclock_sig(kcondvar_t *cv, kmutex_t *mtx, struct timespec *timeout,
302 1.49 riastrad clockid_t clockid, int flags, const struct bintime *epsilon)
303 1.49 riastrad {
304 1.49 riastrad struct timedwaitclock T = {
305 1.49 riastrad .timeout = timeout,
306 1.49 riastrad .clockid = clockid,
307 1.49 riastrad .flags = flags,
308 1.49 riastrad .epsilon = epsilon,
309 1.49 riastrad };
310 1.49 riastrad int timo;
311 1.49 riastrad int error;
312 1.49 riastrad
313 1.49 riastrad if (timeout == NULL)
314 1.49 riastrad return cv_wait_sig(cv, mtx);
315 1.49 riastrad
316 1.50 thorpej error = timedwaitclock_begin(&T, &timo);
317 1.49 riastrad if (error)
318 1.49 riastrad return error;
319 1.49 riastrad error = cv_timedwait_sig(cv, mtx, timo);
320 1.50 thorpej timedwaitclock_end(&T);
321 1.49 riastrad return error;
322 1.49 riastrad }
323 1.49 riastrad
324 1.2 ad /*
325 1.37 riastrad * Given a number of seconds, sec, and 2^64ths of a second, frac, we
326 1.37 riastrad * want a number of ticks for a timeout:
327 1.37 riastrad *
328 1.37 riastrad * timo = hz*(sec + frac/2^64)
329 1.37 riastrad * = hz*sec + hz*frac/2^64
330 1.37 riastrad * = hz*sec + hz*(frachi*2^32 + fraclo)/2^64
331 1.37 riastrad * = hz*sec + hz*frachi/2^32 + hz*fraclo/2^64,
332 1.37 riastrad *
333 1.37 riastrad * where frachi is the high 32 bits of frac and fraclo is the
334 1.37 riastrad * low 32 bits.
335 1.37 riastrad *
336 1.37 riastrad * We assume hz < INT_MAX/2 < UINT32_MAX, so
337 1.37 riastrad *
338 1.37 riastrad * hz*fraclo/2^64 < fraclo*2^32/2^64 <= 1,
339 1.37 riastrad *
340 1.37 riastrad * since fraclo < 2^32.
341 1.37 riastrad *
342 1.37 riastrad * We clamp the result at INT_MAX/2 for a timeout in ticks, since we
343 1.37 riastrad * can't represent timeouts higher than INT_MAX in cv_timedwait, and
344 1.37 riastrad * spurious wakeup is OK. Moreover, we don't want to wrap around,
345 1.37 riastrad * because we compute end - start in ticks in order to compute the
346 1.37 riastrad * remaining timeout, and that difference cannot wrap around, so we use
347 1.37 riastrad * a timeout less than INT_MAX. Using INT_MAX/2 provides plenty of
348 1.37 riastrad * margin for paranoia and will exceed most waits in practice by far.
349 1.37 riastrad */
350 1.37 riastrad static unsigned
351 1.37 riastrad bintime2timo(const struct bintime *bt)
352 1.37 riastrad {
353 1.37 riastrad
354 1.37 riastrad KASSERT(hz < INT_MAX/2);
355 1.37 riastrad CTASSERT(INT_MAX/2 < UINT32_MAX);
356 1.37 riastrad if (bt->sec > ((INT_MAX/2)/hz))
357 1.37 riastrad return INT_MAX/2;
358 1.37 riastrad if ((hz*(bt->frac >> 32) >> 32) > (INT_MAX/2 - hz*bt->sec))
359 1.37 riastrad return INT_MAX/2;
360 1.37 riastrad
361 1.37 riastrad return hz*bt->sec + (hz*(bt->frac >> 32) >> 32);
362 1.37 riastrad }
363 1.37 riastrad
364 1.37 riastrad /*
365 1.37 riastrad * timo is in units of ticks. We want units of seconds and 2^64ths of
366 1.37 riastrad * a second. We know hz = 1 sec/tick, and 2^64 = 1 sec/(2^64th of a
367 1.37 riastrad * second), from which we can conclude 2^64 / hz = 1 (2^64th of a
368 1.37 riastrad * second)/tick. So for the fractional part, we compute
369 1.37 riastrad *
370 1.37 riastrad * frac = rem * 2^64 / hz
371 1.37 riastrad * = ((rem * 2^32) / hz) * 2^32
372 1.37 riastrad *
373 1.37 riastrad * Using truncating integer division instead of real division will
374 1.37 riastrad * leave us with only about 32 bits of precision, which means about
375 1.37 riastrad * 1/4-nanosecond resolution, which is good enough for our purposes.
376 1.37 riastrad */
377 1.37 riastrad static struct bintime
378 1.37 riastrad timo2bintime(unsigned timo)
379 1.37 riastrad {
380 1.37 riastrad
381 1.37 riastrad return (struct bintime) {
382 1.37 riastrad .sec = timo / hz,
383 1.37 riastrad .frac = (((uint64_t)(timo % hz) << 32)/hz << 32),
384 1.37 riastrad };
385 1.37 riastrad }
386 1.37 riastrad
387 1.37 riastrad /*
388 1.37 riastrad * cv_timedwaitbt:
389 1.37 riastrad *
390 1.37 riastrad * Wait on a condition variable until awoken or the specified
391 1.37 riastrad * timeout expires. Returns zero if awoken normally or
392 1.37 riastrad * EWOULDBLOCK if the timeout expires.
393 1.37 riastrad *
394 1.37 riastrad * On entry, bt is a timeout in bintime. cv_timedwaitbt subtracts
395 1.37 riastrad * the time slept, so on exit, bt is the time remaining after
396 1.38 riastrad * sleeping, possibly negative if the complete time has elapsed.
397 1.38 riastrad * No infinite timeout; use cv_wait_sig instead.
398 1.37 riastrad *
399 1.37 riastrad * epsilon is a requested maximum error in timeout (excluding
400 1.37 riastrad * spurious wakeups). Currently not used, will be used in the
401 1.37 riastrad * future to choose between low- and high-resolution timers.
402 1.38 riastrad * Actual wakeup time will be somewhere in [t, t + max(e, r) + s)
403 1.38 riastrad * where r is the finest resolution of clock available and s is
404 1.38 riastrad * scheduling delays for scheduler overhead and competing threads.
405 1.38 riastrad * Time is measured by the interrupt source implementing the
406 1.38 riastrad * timeout, not by another timecounter.
407 1.37 riastrad */
408 1.37 riastrad int
409 1.37 riastrad cv_timedwaitbt(kcondvar_t *cv, kmutex_t *mtx, struct bintime *bt,
410 1.38 riastrad const struct bintime *epsilon __diagused)
411 1.37 riastrad {
412 1.37 riastrad struct bintime slept;
413 1.37 riastrad unsigned start, end;
414 1.48 riastrad int timo;
415 1.37 riastrad int error;
416 1.37 riastrad
417 1.38 riastrad KASSERTMSG(bt->sec >= 0, "negative timeout");
418 1.38 riastrad KASSERTMSG(epsilon != NULL, "specify maximum requested delay");
419 1.38 riastrad
420 1.48 riastrad /* If there's nothing left to wait, time out. */
421 1.48 riastrad if (bt->sec == 0 && bt->frac == 0)
422 1.48 riastrad return EWOULDBLOCK;
423 1.48 riastrad
424 1.48 riastrad /* Convert to ticks, but clamp to be >=1. */
425 1.48 riastrad timo = bintime2timo(bt);
426 1.48 riastrad KASSERTMSG(timo >= 0, "negative ticks: %d", timo);
427 1.48 riastrad if (timo == 0)
428 1.48 riastrad timo = 1;
429 1.48 riastrad
430 1.37 riastrad /*
431 1.46 maxv * getticks() is technically int, but nothing special
432 1.37 riastrad * happens instead of overflow, so we assume two's-complement
433 1.37 riastrad * wraparound and just treat it as unsigned.
434 1.37 riastrad */
435 1.46 maxv start = getticks();
436 1.48 riastrad error = cv_timedwait(cv, mtx, timo);
437 1.46 maxv end = getticks();
438 1.37 riastrad
439 1.48 riastrad /*
440 1.48 riastrad * Set it to the time left, or zero, whichever is larger. We
441 1.48 riastrad * do not fail with EWOULDBLOCK here because this may have been
442 1.48 riastrad * an explicit wakeup, so the caller needs to check before they
443 1.48 riastrad * give up or else cv_signal would be lost.
444 1.48 riastrad */
445 1.37 riastrad slept = timo2bintime(end - start);
446 1.48 riastrad if (bintimecmp(bt, &slept, <=)) {
447 1.48 riastrad bt->sec = 0;
448 1.48 riastrad bt->frac = 0;
449 1.48 riastrad } else {
450 1.48 riastrad /* bt := bt - slept */
451 1.48 riastrad bintime_sub(bt, &slept);
452 1.48 riastrad }
453 1.37 riastrad
454 1.37 riastrad return error;
455 1.37 riastrad }
456 1.37 riastrad
457 1.37 riastrad /*
458 1.37 riastrad * cv_timedwaitbt_sig:
459 1.37 riastrad *
460 1.37 riastrad * Wait on a condition variable until awoken, the specified
461 1.37 riastrad * timeout expires, or interrupted by a signal. Returns zero if
462 1.37 riastrad * awoken normally, EWOULDBLOCK if the timeout expires, or
463 1.37 riastrad * EINTR/ERESTART if interrupted by a signal.
464 1.37 riastrad *
465 1.37 riastrad * On entry, bt is a timeout in bintime. cv_timedwaitbt_sig
466 1.37 riastrad * subtracts the time slept, so on exit, bt is the time remaining
467 1.37 riastrad * after sleeping. No infinite timeout; use cv_wait instead.
468 1.37 riastrad *
469 1.37 riastrad * epsilon is a requested maximum error in timeout (excluding
470 1.37 riastrad * spurious wakeups). Currently not used, will be used in the
471 1.37 riastrad * future to choose between low- and high-resolution timers.
472 1.37 riastrad */
473 1.37 riastrad int
474 1.37 riastrad cv_timedwaitbt_sig(kcondvar_t *cv, kmutex_t *mtx, struct bintime *bt,
475 1.39 riastrad const struct bintime *epsilon __diagused)
476 1.37 riastrad {
477 1.37 riastrad struct bintime slept;
478 1.37 riastrad unsigned start, end;
479 1.48 riastrad int timo;
480 1.37 riastrad int error;
481 1.37 riastrad
482 1.39 riastrad KASSERTMSG(bt->sec >= 0, "negative timeout");
483 1.39 riastrad KASSERTMSG(epsilon != NULL, "specify maximum requested delay");
484 1.39 riastrad
485 1.48 riastrad /* If there's nothing left to wait, time out. */
486 1.48 riastrad if (bt->sec == 0 && bt->frac == 0)
487 1.48 riastrad return EWOULDBLOCK;
488 1.48 riastrad
489 1.48 riastrad /* Convert to ticks, but clamp to be >=1. */
490 1.48 riastrad timo = bintime2timo(bt);
491 1.48 riastrad KASSERTMSG(timo >= 0, "negative ticks: %d", timo);
492 1.48 riastrad if (timo == 0)
493 1.48 riastrad timo = 1;
494 1.48 riastrad
495 1.37 riastrad /*
496 1.46 maxv * getticks() is technically int, but nothing special
497 1.37 riastrad * happens instead of overflow, so we assume two's-complement
498 1.37 riastrad * wraparound and just treat it as unsigned.
499 1.37 riastrad */
500 1.46 maxv start = getticks();
501 1.48 riastrad error = cv_timedwait_sig(cv, mtx, timo);
502 1.46 maxv end = getticks();
503 1.37 riastrad
504 1.48 riastrad /*
505 1.48 riastrad * Set it to the time left, or zero, whichever is larger. We
506 1.48 riastrad * do not fail with EWOULDBLOCK here because this may have been
507 1.48 riastrad * an explicit wakeup, so the caller needs to check before they
508 1.48 riastrad * give up or else cv_signal would be lost.
509 1.48 riastrad */
510 1.37 riastrad slept = timo2bintime(end - start);
511 1.48 riastrad if (bintimecmp(bt, &slept, <=)) {
512 1.48 riastrad bt->sec = 0;
513 1.48 riastrad bt->frac = 0;
514 1.48 riastrad } else {
515 1.48 riastrad /* bt := bt - slept */
516 1.48 riastrad bintime_sub(bt, &slept);
517 1.48 riastrad }
518 1.37 riastrad
519 1.37 riastrad return error;
520 1.37 riastrad }
521 1.37 riastrad
522 1.37 riastrad /*
523 1.2 ad * cv_signal:
524 1.2 ad *
525 1.2 ad * Wake the highest priority LWP waiting on a condition variable.
526 1.2 ad * Must be called with the interlocking mutex held.
527 1.2 ad */
528 1.2 ad void
529 1.2 ad cv_signal(kcondvar_t *cv)
530 1.2 ad {
531 1.20 ad
532 1.20 ad KASSERT(cv_is_valid(cv));
533 1.20 ad
534 1.44 ad if (__predict_false(!LIST_EMPTY(CV_SLEEPQ(cv))))
535 1.24 ad cv_wakeup_one(cv);
536 1.20 ad }
537 1.20 ad
538 1.42 ad /*
539 1.42 ad * cv_wakeup_one:
540 1.42 ad *
541 1.42 ad * Slow path for cv_signal(). Deliberately marked __noinline to
542 1.42 ad * prevent the compiler pulling it in to cv_signal(), which adds
543 1.42 ad * extra prologue and epilogue code.
544 1.42 ad */
545 1.42 ad static __noinline void
546 1.20 ad cv_wakeup_one(kcondvar_t *cv)
547 1.20 ad {
548 1.2 ad sleepq_t *sq;
549 1.18 ad kmutex_t *mp;
550 1.20 ad lwp_t *l;
551 1.2 ad
552 1.45 ad /*
553 1.45 ad * Keep waking LWPs until a non-interruptable waiter is found. An
554 1.45 ad * interruptable waiter could fail to do something useful with the
555 1.45 ad * wakeup due to an error return from cv_[timed]wait_sig(), and the
556 1.45 ad * caller of cv_signal() may not expect such a scenario.
557 1.45 ad *
558 1.45 ad * This isn't a problem for non-interruptable waits (untimed and
559 1.45 ad * timed), because if such a waiter is woken here it will not return
560 1.45 ad * an error.
561 1.45 ad */
562 1.24 ad mp = sleepq_hashlock(cv);
563 1.20 ad sq = CV_SLEEPQ(cv);
564 1.45 ad while ((l = LIST_FIRST(sq)) != NULL) {
565 1.45 ad KASSERT(l->l_sleepq == sq);
566 1.45 ad KASSERT(l->l_mutex == mp);
567 1.45 ad KASSERT(l->l_wchan == cv);
568 1.45 ad if ((l->l_flag & LW_SINTR) == 0) {
569 1.45 ad sleepq_remove(sq, l);
570 1.45 ad break;
571 1.45 ad } else
572 1.45 ad sleepq_remove(sq, l);
573 1.20 ad }
574 1.20 ad mutex_spin_exit(mp);
575 1.2 ad }
576 1.2 ad
577 1.2 ad /*
578 1.2 ad * cv_broadcast:
579 1.2 ad *
580 1.2 ad * Wake all LWPs waiting on a condition variable. Must be called
581 1.2 ad * with the interlocking mutex held.
582 1.2 ad */
583 1.2 ad void
584 1.2 ad cv_broadcast(kcondvar_t *cv)
585 1.2 ad {
586 1.20 ad
587 1.20 ad KASSERT(cv_is_valid(cv));
588 1.20 ad
589 1.44 ad if (__predict_false(!LIST_EMPTY(CV_SLEEPQ(cv))))
590 1.24 ad cv_wakeup_all(cv);
591 1.20 ad }
592 1.20 ad
593 1.42 ad /*
594 1.42 ad * cv_wakeup_all:
595 1.42 ad *
596 1.42 ad * Slow path for cv_broadcast(). Deliberately marked __noinline to
597 1.42 ad * prevent the compiler pulling it in to cv_broadcast(), which adds
598 1.42 ad * extra prologue and epilogue code.
599 1.42 ad */
600 1.42 ad static __noinline void
601 1.20 ad cv_wakeup_all(kcondvar_t *cv)
602 1.20 ad {
603 1.2 ad sleepq_t *sq;
604 1.18 ad kmutex_t *mp;
605 1.45 ad lwp_t *l;
606 1.15 ad
607 1.24 ad mp = sleepq_hashlock(cv);
608 1.20 ad sq = CV_SLEEPQ(cv);
609 1.45 ad while ((l = LIST_FIRST(sq)) != NULL) {
610 1.20 ad KASSERT(l->l_sleepq == sq);
611 1.20 ad KASSERT(l->l_mutex == mp);
612 1.20 ad KASSERT(l->l_wchan == cv);
613 1.27 rmind sleepq_remove(sq, l);
614 1.20 ad }
615 1.20 ad mutex_spin_exit(mp);
616 1.2 ad }
617 1.2 ad
618 1.2 ad /*
619 1.2 ad * cv_has_waiters:
620 1.2 ad *
621 1.2 ad * For diagnostic assertions: return non-zero if a condition
622 1.2 ad * variable has waiters.
623 1.2 ad */
624 1.7 ad bool
625 1.2 ad cv_has_waiters(kcondvar_t *cv)
626 1.2 ad {
627 1.23 chris
628 1.44 ad return !LIST_EMPTY(CV_SLEEPQ(cv));
629 1.2 ad }
630 1.15 ad
631 1.15 ad /*
632 1.15 ad * cv_is_valid:
633 1.15 ad *
634 1.15 ad * For diagnostic assertions: return non-zero if a condition
635 1.15 ad * variable appears to be valid. No locks need be held.
636 1.15 ad */
637 1.15 ad bool
638 1.15 ad cv_is_valid(kcondvar_t *cv)
639 1.15 ad {
640 1.15 ad
641 1.26 thorpej return CV_WMESG(cv) != deadcv && CV_WMESG(cv) != NULL;
642 1.15 ad }
643