scheduler.c revision 1.43 1 1.43 pooka /* $NetBSD: scheduler.c,v 1.43 2016/02/08 18:18:19 pooka Exp $ */
2 1.1 pooka
3 1.1 pooka /*
4 1.26 pooka * Copyright (c) 2010, 2011 Antti Kantee. All Rights Reserved.
5 1.1 pooka *
6 1.1 pooka * Redistribution and use in source and binary forms, with or without
7 1.1 pooka * modification, are permitted provided that the following conditions
8 1.1 pooka * are met:
9 1.1 pooka * 1. Redistributions of source code must retain the above copyright
10 1.1 pooka * notice, this list of conditions and the following disclaimer.
11 1.1 pooka * 2. Redistributions in binary form must reproduce the above copyright
12 1.1 pooka * notice, this list of conditions and the following disclaimer in the
13 1.1 pooka * documentation and/or other materials provided with the distribution.
14 1.1 pooka *
15 1.1 pooka * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
16 1.1 pooka * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 1.1 pooka * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 1.1 pooka * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 1.1 pooka * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 1.1 pooka * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 1.1 pooka * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 1.1 pooka * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 1.1 pooka * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 1.1 pooka * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 1.1 pooka * SUCH DAMAGE.
26 1.1 pooka */
27 1.1 pooka
28 1.1 pooka #include <sys/cdefs.h>
29 1.43 pooka __KERNEL_RCSID(0, "$NetBSD: scheduler.c,v 1.43 2016/02/08 18:18:19 pooka Exp $");
30 1.1 pooka
31 1.1 pooka #include <sys/param.h>
32 1.16 pooka #include <sys/atomic.h>
33 1.1 pooka #include <sys/cpu.h>
34 1.2 pooka #include <sys/kmem.h>
35 1.1 pooka #include <sys/mutex.h>
36 1.8 pooka #include <sys/namei.h>
37 1.1 pooka #include <sys/queue.h>
38 1.1 pooka #include <sys/select.h>
39 1.10 pooka #include <sys/systm.h>
40 1.1 pooka
41 1.42 pooka #include <rump-sys/kern.h>
42 1.42 pooka
43 1.1 pooka #include <rump/rumpuser.h>
44 1.1 pooka
/*
 * Per-virtual-CPU scheduler state.  rcpu_storage holds one slot per
 * possible CPU and is indexed by cpu_index() (see cpuinfo_to_rumpcpu()).
 * Fields touched by the scheduling fastpath come first.
 */
45 1.1 pooka static struct rumpcpu {
46 1.15 pooka /* needed in fastpath */
47 1.1 pooka struct cpu_info *rcpu_ci; /* cpu_info backing this slot */
48 1.15 pooka void *rcpu_prevlwp; /* last lwp to release the CPU, or RCPULWP_BUSY / RCPULWP_WANTED */
49 1.15 pooka
50 1.15 pooka /* needed in slowpath */
51 1.15 pooka struct rumpuser_mtx *rcpu_mtx; /* interlock for rcpu_cv and rcpu_wanted */
52 1.8 pooka struct rumpuser_cv *rcpu_cv; /* broadcast on release when rcpu_wanted != 0 */
53 1.15 pooka int rcpu_wanted; /* count of threads currently waiting on rcpu_cv */
54 1.15 pooka
55 1.15 pooka /* offset 20 (P=4) or 36 (P=8) here */
56 1.15 pooka
57 1.15 pooka /*
58 1.15 pooka * Some stats. Not really that necessary, but we should
59 1.15 pooka * have room. Note that these overflow quite fast, so need
60 1.15 pooka * to be collected often.
61 1.15 pooka */
62 1.15 pooka unsigned int rcpu_fastpath; /* bumped by SCHED_FASTPATH() */
63 1.15 pooka unsigned int rcpu_slowpath; /* bumped by SCHED_SLOWPATH() */
64 1.15 pooka unsigned int rcpu_migrated; /* bumped by SCHED_MIGRATED() */
65 1.15 pooka
66 1.15 pooka /* offset 32 (P=4) or 48 (P=8), assuming 4-byte int */
67 1.15 pooka
68 1.15 pooka int rcpu_align[0] __aligned(CACHE_LINE_SIZE); /* zero-length member; carries the CACHE_LINE_SIZE alignment request */
69 1.8 pooka } rcpu_storage[MAXCPUS];
70 1.28 rmind
71 1.43 pooka static inline struct rumpcpu *
72 1.43 pooka cpuinfo_to_rumpcpu(struct cpu_info *ci)
73 1.43 pooka {
74 1.43 pooka
75 1.43 pooka return &rcpu_storage[cpu_index(ci)];
76 1.43 pooka }
77 1.43 pooka
78 1.43 pooka struct cpu_info rump_bootcpu; /* cpu_info used for CPU index 0; attached in rump_cpus_bootstrap() */
79 1.28 rmind kcpuset_t *kcpuset_attached = NULL; /* created in rump_cpus_bootstrap() */
80 1.28 rmind kcpuset_t *kcpuset_running = NULL; /* created in rump_cpus_bootstrap() */
81 1.41 pooka int ncpu, ncpuonline; /* ncpu: set to 1 at bootstrap; modulus for getnextcpu(), gates migration */
82 1.1 pooka
/* Sentinels stored in rcpu_prevlwp in place of an lwp pointer. */
83 1.15 pooka #define RCPULWP_BUSY ((void *)-1) /* CPU is held by a scheduled lwp */
84 1.15 pooka #define RCPULWP_WANTED ((void *)-2) /* a slowpath scheduler has asked for the CPU */
85 1.8 pooka
86 1.15 pooka static struct rumpuser_mtx *lwp0mtx; /* protects lwp0isbusy */
87 1.15 pooka static struct rumpuser_cv *lwp0cv; /* signalled when lwp0 is released */
88 1.15 pooka static unsigned nextcpu; /* round-robin counter advanced by getnextcpu() */
89 1.14 pooka
90 1.25 pooka kmutex_t unruntime_lock; /* unruntime lwp lock. practically unused */
91 1.25 pooka
92 1.19 pooka static bool lwp0isbusy = false; /* true while some host thread borrows lwp0 */
93 1.3 pooka
/*
 * Optional scheduling statistics.
 *
 * Keeping track of them is not really critical for speed, unless the
 * counters happen to land on a different cache line than the fastpath
 * fields (CACHE_LINE_SIZE is really just a coarse estimate), so the
 * default is the performant case: no stats.  Define RUMPSCHED_STATS
 * to enable the counters.
 *
 * Each macro expands to one void expression with no trailing
 * semicolon, so "SCHED_FASTPATH(rcpu);" is exactly one statement and
 * is safe inside an unbraced if/else.  The argument is parenthesized
 * and, when stats are disabled, not evaluated at all.
 */
#ifdef RUMPSCHED_STATS
#define SCHED_FASTPATH(rcpu)	((void)(rcpu)->rcpu_fastpath++)
#define SCHED_SLOWPATH(rcpu)	((void)(rcpu)->rcpu_slowpath++)
#define SCHED_MIGRATED(rcpu)	((void)(rcpu)->rcpu_migrated++)
#else
#define SCHED_FASTPATH(rcpu)	((void)0)
#define SCHED_SLOWPATH(rcpu)	((void)0)
#define SCHED_MIGRATED(rcpu)	((void)0)
#endif
111 1.1 pooka
112 1.1 pooka struct cpu_info *
113 1.1 pooka cpu_lookup(u_int index)
114 1.1 pooka {
115 1.1 pooka
116 1.43 pooka return rcpu_storage[index].rcpu_ci;
117 1.1 pooka }
118 1.1 pooka
119 1.15 pooka static inline struct rumpcpu *
120 1.15 pooka getnextcpu(void)
121 1.15 pooka {
122 1.15 pooka unsigned newcpu;
123 1.15 pooka
124 1.15 pooka newcpu = atomic_inc_uint_nv(&nextcpu);
125 1.15 pooka if (__predict_false(ncpu > UINT_MAX/2))
126 1.15 pooka atomic_and_uint(&nextcpu, 0);
127 1.15 pooka newcpu = newcpu % ncpu;
128 1.15 pooka
129 1.15 pooka return &rcpu_storage[newcpu];
130 1.15 pooka }
131 1.15 pooka
132 1.12 pooka /* this could/should be mi_attach_cpu? */
133 1.12 pooka void
134 1.22 pooka rump_cpus_bootstrap(int *nump)
135 1.12 pooka {
136 1.22 pooka int num = *nump;
137 1.12 pooka
138 1.13 pooka if (num > MAXCPUS) {
139 1.22 pooka aprint_verbose("CPU limit: %d wanted, %d (MAXCPUS) "
140 1.22 pooka "available (adjusted)\n", num, MAXCPUS);
141 1.13 pooka num = MAXCPUS;
142 1.13 pooka }
143 1.13 pooka
144 1.28 rmind kcpuset_create(&kcpuset_attached, true);
145 1.28 rmind kcpuset_create(&kcpuset_running, true);
146 1.28 rmind
147 1.20 pooka /* attach first cpu for bootstrap */
148 1.43 pooka rump_cpu_attach(&rump_bootcpu);
149 1.20 pooka ncpu = 1;
150 1.22 pooka *nump = num;
151 1.12 pooka }
152 1.12 pooka
153 1.1 pooka void
154 1.20 pooka rump_scheduler_init(int numcpu)
155 1.1 pooka {
156 1.1 pooka struct rumpcpu *rcpu;
157 1.1 pooka struct cpu_info *ci;
158 1.1 pooka int i;
159 1.1 pooka
160 1.31 pooka rumpuser_mutex_init(&lwp0mtx, RUMPUSER_MTX_SPIN);
161 1.3 pooka rumpuser_cv_init(&lwp0cv);
162 1.20 pooka for (i = 0; i < numcpu; i++) {
163 1.43 pooka if (i == 0) {
164 1.43 pooka ci = &rump_bootcpu;
165 1.43 pooka } else {
166 1.43 pooka ci = kmem_zalloc(sizeof(*ci), KM_SLEEP);
167 1.43 pooka ci->ci_index = i;
168 1.43 pooka }
169 1.43 pooka
170 1.1 pooka rcpu = &rcpu_storage[i];
171 1.12 pooka rcpu->rcpu_ci = ci;
172 1.43 pooka rcpu->rcpu_wanted = 0;
173 1.43 pooka rumpuser_cv_init(&rcpu->rcpu_cv);
174 1.43 pooka rumpuser_mutex_init(&rcpu->rcpu_mtx, RUMPUSER_MTX_SPIN);
175 1.43 pooka
176 1.4 pooka ci->ci_schedstate.spc_mutex =
177 1.32 pooka mutex_obj_alloc(MUTEX_DEFAULT, IPL_SCHED);
178 1.9 pooka ci->ci_schedstate.spc_flags = SPCF_RUNNING;
179 1.1 pooka }
180 1.25 pooka
181 1.32 pooka mutex_init(&unruntime_lock, MUTEX_DEFAULT, IPL_SCHED);
182 1.1 pooka }
183 1.1 pooka
184 1.14 pooka /*
185 1.14 pooka * condvar ops using scheduler lock as the rumpuser interlock.
186 1.14 pooka */
187 1.14 pooka void
188 1.14 pooka rump_schedlock_cv_wait(struct rumpuser_cv *cv)
189 1.14 pooka {
190 1.15 pooka struct lwp *l = curlwp;
191 1.43 pooka struct rumpcpu *rcpu = cpuinfo_to_rumpcpu(l->l_cpu);
192 1.14 pooka
193 1.15 pooka /* mutex will be taken and released in cpu schedule/unschedule */
194 1.15 pooka rumpuser_cv_wait(cv, rcpu->rcpu_mtx);
195 1.14 pooka }
196 1.14 pooka
197 1.14 pooka int
198 1.14 pooka rump_schedlock_cv_timedwait(struct rumpuser_cv *cv, const struct timespec *ts)
199 1.14 pooka {
200 1.15 pooka struct lwp *l = curlwp;
201 1.43 pooka struct rumpcpu *rcpu = cpuinfo_to_rumpcpu(l->l_cpu);
202 1.14 pooka
203 1.15 pooka /* mutex will be taken and released in cpu schedule/unschedule */
204 1.15 pooka return rumpuser_cv_timedwait(cv, rcpu->rcpu_mtx,
205 1.15 pooka ts->tv_sec, ts->tv_nsec);
206 1.14 pooka }
207 1.14 pooka
208 1.19 pooka static void
209 1.19 pooka lwp0busy(void)
210 1.19 pooka {
211 1.19 pooka
212 1.19 pooka /* busy lwp0 */
213 1.25 pooka KASSERT(curlwp == NULL || curlwp->l_stat != LSONPROC);
214 1.19 pooka rumpuser_mutex_enter_nowrap(lwp0mtx);
215 1.19 pooka while (lwp0isbusy)
216 1.19 pooka rumpuser_cv_wait_nowrap(lwp0cv, lwp0mtx);
217 1.19 pooka lwp0isbusy = true;
218 1.19 pooka rumpuser_mutex_exit(lwp0mtx);
219 1.19 pooka }
220 1.19 pooka
221 1.19 pooka static void
222 1.19 pooka lwp0rele(void)
223 1.19 pooka {
224 1.19 pooka
225 1.19 pooka rumpuser_mutex_enter_nowrap(lwp0mtx);
226 1.19 pooka KASSERT(lwp0isbusy == true);
227 1.19 pooka lwp0isbusy = false;
228 1.19 pooka rumpuser_cv_signal(lwp0cv);
229 1.19 pooka rumpuser_mutex_exit(lwp0mtx);
230 1.19 pooka }
231 1.19 pooka
232 1.27 yamt /*
233 1.27 yamt * rump_schedule: ensure that the calling host thread has a valid lwp context.
234 1.33 pooka * ie. ensure that curlwp != NULL. Also, ensure that there
235 1.33 pooka * a 1:1 mapping between the lwp and rump kernel cpu.
236 1.27 yamt */
237 1.1 pooka void
238 1.1 pooka rump_schedule()
239 1.1 pooka {
240 1.3 pooka struct lwp *l;
241 1.2 pooka
242 1.2 pooka /*
243 1.2 pooka * If there is no dedicated lwp, allocate a temp one and
244 1.3 pooka * set it to be free'd upon unschedule(). Use lwp0 context
245 1.15 pooka * for reserving the necessary resources. Don't optimize
246 1.15 pooka * for this case -- anyone who cares about performance will
247 1.15 pooka * start a real thread.
248 1.2 pooka */
249 1.36 pooka if (__predict_true((l = curlwp) != NULL)) {
250 1.19 pooka rump_schedule_cpu(l);
251 1.19 pooka LWP_CACHE_CREDS(l, l->l_proc);
252 1.19 pooka } else {
253 1.19 pooka lwp0busy();
254 1.3 pooka
255 1.3 pooka /* schedule cpu and use lwp0 */
256 1.4 pooka rump_schedule_cpu(&lwp0);
257 1.36 pooka rump_lwproc_curlwp_set(&lwp0);
258 1.3 pooka
259 1.19 pooka /* allocate thread, switch to it, and release lwp0 */
260 1.21 pooka l = rump__lwproc_alloclwp(initproc);
261 1.19 pooka rump_lwproc_switch(l);
262 1.19 pooka lwp0rele();
263 1.3 pooka
264 1.19 pooka /*
265 1.19 pooka * mark new thread dead-on-unschedule. this
266 1.19 pooka * means that we'll be running with l_refcnt == 0.
267 1.19 pooka * relax, it's fine.
268 1.19 pooka */
269 1.19 pooka rump_lwproc_releaselwp();
270 1.2 pooka }
271 1.2 pooka }
272 1.2 pooka
273 1.4 pooka void
274 1.4 pooka rump_schedule_cpu(struct lwp *l)
275 1.2 pooka {
276 1.14 pooka
277 1.14 pooka rump_schedule_cpu_interlock(l, NULL);
278 1.14 pooka }
279 1.14 pooka
280 1.15 pooka /*
281 1.15 pooka * Schedule a CPU. This optimizes for the case where we schedule
282 1.15 pooka * the same thread often, and we have nCPU >= nFrequently-Running-Thread
283 1.15 pooka * (where CPU is virtual rump cpu, not host CPU).
284 1.15 pooka */
285 1.14 pooka void
286 1.14 pooka rump_schedule_cpu_interlock(struct lwp *l, void *interlock)
287 1.14 pooka {
288 1.1 pooka struct rumpcpu *rcpu;
289 1.40 pooka struct cpu_info *ci;
290 1.15 pooka void *old;
291 1.15 pooka bool domigrate;
292 1.15 pooka bool bound = l->l_pflag & LP_BOUND;
293 1.15 pooka
294 1.25 pooka l->l_stat = LSRUN;
295 1.25 pooka
296 1.15 pooka /*
297 1.15 pooka * First, try fastpath: if we were the previous user of the
298 1.15 pooka * CPU, everything is in order cachewise and we can just
299 1.15 pooka * proceed to use it.
300 1.15 pooka *
301 1.15 pooka * If we are a different thread (i.e. CAS fails), we must go
302 1.15 pooka * through a memory barrier to ensure we get a truthful
303 1.15 pooka * view of the world.
304 1.15 pooka */
305 1.14 pooka
306 1.17 pooka KASSERT(l->l_target_cpu != NULL);
307 1.43 pooka rcpu = cpuinfo_to_rumpcpu(l->l_target_cpu);
308 1.15 pooka if (atomic_cas_ptr(&rcpu->rcpu_prevlwp, l, RCPULWP_BUSY) == l) {
309 1.29 pooka if (interlock == rcpu->rcpu_mtx)
310 1.15 pooka rumpuser_mutex_exit(rcpu->rcpu_mtx);
311 1.15 pooka SCHED_FASTPATH(rcpu);
312 1.15 pooka /* jones, you're the man */
313 1.15 pooka goto fastlane;
314 1.15 pooka }
315 1.1 pooka
316 1.15 pooka /*
317 1.15 pooka * Else, it's the slowpath for us. First, determine if we
318 1.15 pooka * can migrate.
319 1.15 pooka */
320 1.15 pooka if (ncpu == 1)
321 1.15 pooka domigrate = false;
322 1.15 pooka else
323 1.15 pooka domigrate = true;
324 1.15 pooka
325 1.15 pooka /* Take lock. This acts as a load barrier too. */
326 1.29 pooka if (interlock != rcpu->rcpu_mtx)
327 1.15 pooka rumpuser_mutex_enter_nowrap(rcpu->rcpu_mtx);
328 1.15 pooka
329 1.15 pooka for (;;) {
330 1.15 pooka SCHED_SLOWPATH(rcpu);
331 1.15 pooka old = atomic_swap_ptr(&rcpu->rcpu_prevlwp, RCPULWP_WANTED);
332 1.15 pooka
333 1.15 pooka /* CPU is free? */
334 1.15 pooka if (old != RCPULWP_BUSY && old != RCPULWP_WANTED) {
335 1.15 pooka if (atomic_cas_ptr(&rcpu->rcpu_prevlwp,
336 1.15 pooka RCPULWP_WANTED, RCPULWP_BUSY) == RCPULWP_WANTED) {
337 1.15 pooka break;
338 1.8 pooka }
339 1.8 pooka }
340 1.15 pooka
341 1.15 pooka /*
342 1.15 pooka * Do we want to migrate once?
343 1.15 pooka * This may need a slightly better algorithm, or we
344 1.15 pooka * might cache pingpong eternally for non-frequent
345 1.15 pooka * threads.
346 1.15 pooka */
347 1.15 pooka if (domigrate && !bound) {
348 1.15 pooka domigrate = false;
349 1.15 pooka SCHED_MIGRATED(rcpu);
350 1.15 pooka rumpuser_mutex_exit(rcpu->rcpu_mtx);
351 1.15 pooka rcpu = getnextcpu();
352 1.15 pooka rumpuser_mutex_enter_nowrap(rcpu->rcpu_mtx);
353 1.15 pooka continue;
354 1.8 pooka }
355 1.15 pooka
356 1.15 pooka /* Want CPU, wait until it's released an retry */
357 1.15 pooka rcpu->rcpu_wanted++;
358 1.15 pooka rumpuser_cv_wait_nowrap(rcpu->rcpu_cv, rcpu->rcpu_mtx);
359 1.15 pooka rcpu->rcpu_wanted--;
360 1.8 pooka }
361 1.15 pooka rumpuser_mutex_exit(rcpu->rcpu_mtx);
362 1.15 pooka
363 1.15 pooka fastlane:
364 1.40 pooka ci = rcpu->rcpu_ci;
365 1.40 pooka l->l_cpu = l->l_target_cpu = ci;
366 1.4 pooka l->l_mutex = rcpu->rcpu_ci->ci_schedstate.spc_mutex;
367 1.18 pooka l->l_ncsw++;
368 1.25 pooka l->l_stat = LSONPROC;
369 1.23 pooka
370 1.40 pooka /*
371 1.40 pooka * No interrupts, so ci_curlwp === cpu_onproc.
372 1.40 pooka * Okay, we could make an attempt to not set cpu_onproc
373 1.40 pooka * in the case that an interrupt is scheduled immediately
374 1.40 pooka * after a user proc, but leave that for later.
375 1.40 pooka */
376 1.40 pooka ci->ci_curlwp = ci->ci_data.cpu_onproc = l;
377 1.1 pooka }
378 1.1 pooka
379 1.1 pooka void
380 1.1 pooka rump_unschedule()
381 1.1 pooka {
382 1.36 pooka struct lwp *l = curlwp;
383 1.24 pooka #ifdef DIAGNOSTIC
384 1.24 pooka int nlock;
385 1.24 pooka
386 1.24 pooka KERNEL_UNLOCK_ALL(l, &nlock);
387 1.24 pooka KASSERT(nlock == 0);
388 1.24 pooka #endif
389 1.2 pooka
390 1.4 pooka KASSERT(l->l_mutex == l->l_cpu->ci_schedstate.spc_mutex);
391 1.2 pooka rump_unschedule_cpu(l);
392 1.25 pooka l->l_mutex = &unruntime_lock;
393 1.25 pooka l->l_stat = LSSTOP;
394 1.6 pooka
395 1.6 pooka /*
396 1.19 pooka * Check special conditions:
397 1.19 pooka * 1) do we need to free the lwp which just unscheduled?
398 1.19 pooka * (locking order: lwp0, cpu)
399 1.19 pooka * 2) do we want to clear curlwp for the current host thread
400 1.6 pooka */
401 1.19 pooka if (__predict_false(l->l_flag & LW_WEXIT)) {
402 1.19 pooka lwp0busy();
403 1.19 pooka
404 1.19 pooka /* Now that we have lwp0, we can schedule a CPU again */
405 1.19 pooka rump_schedule_cpu(l);
406 1.6 pooka
407 1.19 pooka /* switch to lwp0. this frees the old thread */
408 1.19 pooka KASSERT(l->l_flag & LW_WEXIT);
409 1.19 pooka rump_lwproc_switch(&lwp0);
410 1.6 pooka
411 1.19 pooka /* release lwp0 */
412 1.6 pooka rump_unschedule_cpu(&lwp0);
413 1.25 pooka lwp0.l_mutex = &unruntime_lock;
414 1.19 pooka lwp0.l_pflag &= ~LP_RUNNING;
415 1.19 pooka lwp0rele();
416 1.36 pooka rump_lwproc_curlwp_clear(&lwp0);
417 1.6 pooka
418 1.19 pooka } else if (__predict_false(l->l_flag & LW_RUMP_CLEAR)) {
419 1.36 pooka rump_lwproc_curlwp_clear(l);
420 1.19 pooka l->l_flag &= ~LW_RUMP_CLEAR;
421 1.2 pooka }
422 1.2 pooka }
423 1.2 pooka
424 1.2 pooka void
425 1.2 pooka rump_unschedule_cpu(struct lwp *l)
426 1.2 pooka {
427 1.8 pooka
428 1.14 pooka rump_unschedule_cpu_interlock(l, NULL);
429 1.14 pooka }
430 1.14 pooka
431 1.14 pooka void
432 1.14 pooka rump_unschedule_cpu_interlock(struct lwp *l, void *interlock)
433 1.14 pooka {
434 1.14 pooka
435 1.8 pooka if ((l->l_pflag & LP_INTR) == 0)
436 1.8 pooka rump_softint_run(l->l_cpu);
437 1.14 pooka rump_unschedule_cpu1(l, interlock);
438 1.8 pooka }
439 1.8 pooka
440 1.8 pooka void
441 1.14 pooka rump_unschedule_cpu1(struct lwp *l, void *interlock)
442 1.8 pooka {
443 1.1 pooka struct rumpcpu *rcpu;
444 1.1 pooka struct cpu_info *ci;
445 1.15 pooka void *old;
446 1.1 pooka
447 1.1 pooka ci = l->l_cpu;
448 1.40 pooka ci->ci_curlwp = ci->ci_data.cpu_onproc = NULL;
449 1.43 pooka rcpu = cpuinfo_to_rumpcpu(ci);
450 1.15 pooka
451 1.1 pooka KASSERT(rcpu->rcpu_ci == ci);
452 1.1 pooka
453 1.15 pooka /*
454 1.15 pooka * Make sure all stores are seen before the CPU release. This
455 1.15 pooka * is relevant only in the non-fastpath scheduling case, but
456 1.15 pooka * we don't know here if that's going to happen, so need to
457 1.15 pooka * expect the worst.
458 1.29 pooka *
459 1.29 pooka * If the scheduler interlock was requested by the caller, we
460 1.29 pooka * need to obtain it before we release the CPU. Otherwise, we risk a
461 1.29 pooka * race condition where another thread is scheduled onto the
462 1.29 pooka * rump kernel CPU before our current thread can
463 1.29 pooka * grab the interlock.
464 1.15 pooka */
465 1.29 pooka if (interlock == rcpu->rcpu_mtx)
466 1.29 pooka rumpuser_mutex_enter_nowrap(rcpu->rcpu_mtx);
467 1.29 pooka else
468 1.29 pooka membar_exit();
469 1.15 pooka
470 1.15 pooka /* Release the CPU. */
471 1.15 pooka old = atomic_swap_ptr(&rcpu->rcpu_prevlwp, l);
472 1.15 pooka
473 1.15 pooka /* No waiters? No problems. We're outta here. */
474 1.15 pooka if (old == RCPULWP_BUSY) {
475 1.15 pooka return;
476 1.15 pooka }
477 1.15 pooka
478 1.15 pooka KASSERT(old == RCPULWP_WANTED);
479 1.15 pooka
480 1.15 pooka /*
481 1.15 pooka * Ok, things weren't so snappy.
482 1.15 pooka *
483 1.15 pooka * Snailpath: take lock and signal anyone waiting for this CPU.
484 1.15 pooka */
485 1.14 pooka
486 1.29 pooka if (interlock != rcpu->rcpu_mtx)
487 1.29 pooka rumpuser_mutex_enter_nowrap(rcpu->rcpu_mtx);
488 1.15 pooka if (rcpu->rcpu_wanted)
489 1.8 pooka rumpuser_cv_broadcast(rcpu->rcpu_cv);
490 1.29 pooka if (interlock != rcpu->rcpu_mtx)
491 1.15 pooka rumpuser_mutex_exit(rcpu->rcpu_mtx);
492 1.1 pooka }
493 1.5 pooka
494 1.5 pooka /* Give up and retake CPU (perhaps a different one) */
495 1.5 pooka void
496 1.5 pooka yield()
497 1.5 pooka {
498 1.5 pooka struct lwp *l = curlwp;
499 1.5 pooka int nlocks;
500 1.5 pooka
501 1.5 pooka KERNEL_UNLOCK_ALL(l, &nlocks);
502 1.5 pooka rump_unschedule_cpu(l);
503 1.5 pooka rump_schedule_cpu(l);
504 1.5 pooka KERNEL_LOCK(nlocks, l);
505 1.5 pooka }
506 1.5 pooka
/*
 * preempt: implemented as a plain yield() of the virtual CPU.
 */
void
preempt(void)
{

	yield();
}
513 1.10 pooka
/*
 * kpreempt: always reports false; the "where" argument is ignored.
 */
bool
kpreempt(uintptr_t where)
{
	const bool preempted = false;

	return preempted;
}
520 1.10 pooka
521 1.10 pooka /*
522 1.10 pooka * There is no kernel thread preemption in rump currently. But call
523 1.10 pooka * the implementing macros anyway in case they grow some side-effects
524 1.10 pooka * down the road.
525 1.10 pooka */
526 1.10 pooka void
527 1.10 pooka kpreempt_disable(void)
528 1.10 pooka {
529 1.10 pooka
530 1.35 pooka KPREEMPT_DISABLE(curlwp);
531 1.10 pooka }
532 1.10 pooka
533 1.10 pooka void
534 1.10 pooka kpreempt_enable(void)
535 1.10 pooka {
536 1.10 pooka
537 1.35 pooka KPREEMPT_ENABLE(curlwp);
538 1.10 pooka }
539 1.10 pooka
/*
 * kpreempt_disabled: always reports true.
 *
 * XXX: emulate cpu_kpreempt_disabled().  The previously disabled
 * reference check, for the record, was:
 *
 *	l->l_nopreempt != 0 || l->l_stat == LSZOMB ||
 *	    (l->l_flag & LW_IDLE) != 0 || cpu_kpreempt_disabled()
 *
 * with l being curlwp.
 */
bool
kpreempt_disabled(void)
{
	const bool disabled = true;

	return disabled;
}
552 1.38 rmind
/*
 * suspendsched: intentionally a no-op.
 *
 * Could wait until everyone is out and block further entries,
 * but skip that for now.
 */
void
suspendsched(void)
{

	return;
}
562 1.11 pooka
/*
 * sched_nice: nothing to do for now; both arguments are ignored.
 */
void
sched_nice(struct proc *p, int level)
{

	return;
}
569 1.37 pooka
570 1.37 pooka void
571 1.37 pooka sched_enqueue(struct lwp *l, bool swtch)
572 1.37 pooka {
573 1.37 pooka
574 1.37 pooka if (swtch)
575 1.37 pooka panic("sched_enqueue with switcheroo");
576 1.37 pooka rump_thread_allow(l);
577 1.37 pooka }
578 1.37 pooka
/*
 * sched_dequeue: unsupported; any call panics.
 */
void
sched_dequeue(struct lwp *l)
{

	/* l is never looked at */
	panic("sched_dequeue not implemented");
}
585