kern_cpu.c revision 1.40 1 1.40 christos /* $NetBSD: kern_cpu.c,v 1.40 2009/01/19 17:39:02 christos Exp $ */
2 1.3 ad
3 1.3 ad /*-
4 1.21 ad * Copyright (c) 2007, 2008 The NetBSD Foundation, Inc.
5 1.3 ad * All rights reserved.
6 1.3 ad *
7 1.3 ad * This code is derived from software contributed to The NetBSD Foundation
8 1.3 ad * by Andrew Doran.
9 1.3 ad *
10 1.3 ad * Redistribution and use in source and binary forms, with or without
11 1.3 ad * modification, are permitted provided that the following conditions
12 1.3 ad * are met:
13 1.3 ad * 1. Redistributions of source code must retain the above copyright
14 1.3 ad * notice, this list of conditions and the following disclaimer.
15 1.3 ad * 2. Redistributions in binary form must reproduce the above copyright
16 1.3 ad * notice, this list of conditions and the following disclaimer in the
17 1.3 ad * documentation and/or other materials provided with the distribution.
18 1.3 ad *
19 1.3 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.3 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.3 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.3 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.3 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.3 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.3 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.3 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.3 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.3 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.3 ad * POSSIBILITY OF SUCH DAMAGE.
30 1.3 ad */
31 1.2 yamt
32 1.2 yamt /*-
33 1.2 yamt * Copyright (c)2007 YAMAMOTO Takashi,
34 1.2 yamt * All rights reserved.
35 1.2 yamt *
36 1.2 yamt * Redistribution and use in source and binary forms, with or without
37 1.2 yamt * modification, are permitted provided that the following conditions
38 1.2 yamt * are met:
39 1.2 yamt * 1. Redistributions of source code must retain the above copyright
40 1.2 yamt * notice, this list of conditions and the following disclaimer.
41 1.2 yamt * 2. Redistributions in binary form must reproduce the above copyright
42 1.2 yamt * notice, this list of conditions and the following disclaimer in the
43 1.2 yamt * documentation and/or other materials provided with the distribution.
44 1.2 yamt *
45 1.2 yamt * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
46 1.2 yamt * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
47 1.2 yamt * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
48 1.2 yamt * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
49 1.2 yamt * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
50 1.2 yamt * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
51 1.2 yamt * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
52 1.2 yamt * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
53 1.2 yamt * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
54 1.2 yamt * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
55 1.2 yamt * SUCH DAMAGE.
56 1.2 yamt */
57 1.2 yamt
58 1.2 yamt #include <sys/cdefs.h>
59 1.40 christos __KERNEL_RCSID(0, "$NetBSD: kern_cpu.c,v 1.40 2009/01/19 17:39:02 christos Exp $");
60 1.40 christos
61 1.40 christos #include "opt_compat_netbsd.h"
62 1.2 yamt
63 1.2 yamt #include <sys/param.h>
64 1.2 yamt #include <sys/systm.h>
65 1.2 yamt #include <sys/idle.h>
66 1.2 yamt #include <sys/sched.h>
67 1.8 ad #include <sys/intr.h>
68 1.3 ad #include <sys/conf.h>
69 1.3 ad #include <sys/cpu.h>
70 1.3 ad #include <sys/cpuio.h>
71 1.3 ad #include <sys/proc.h>
72 1.17 yamt #include <sys/percpu.h>
73 1.3 ad #include <sys/kernel.h>
74 1.3 ad #include <sys/kauth.h>
75 1.7 ad #include <sys/xcall.h>
76 1.7 ad #include <sys/pool.h>
77 1.21 ad #include <sys/kmem.h>
78 1.22 ad #include <sys/select.h>
79 1.23 ad #include <sys/namei.h>
80 1.27 ad #include <sys/callout.h>
81 1.3 ad
82 1.6 ad #include <uvm/uvm_extern.h>
83 1.6 ad
84 1.40 christos #ifdef COMPAT_50
85 1.40 christos #include <compat/sys/cpuio.h>
86 1.40 christos #endif
87 1.40 christos
88 1.3 ad void cpuctlattach(int);
89 1.3 ad
90 1.11 rmind static void cpu_xc_online(struct cpu_info *);
91 1.11 rmind static void cpu_xc_offline(struct cpu_info *);
92 1.7 ad
93 1.3 ad dev_type_ioctl(cpuctl_ioctl);
94 1.3 ad
95 1.3 ad const struct cdevsw cpuctl_cdevsw = {
96 1.3 ad nullopen, nullclose, nullread, nullwrite, cpuctl_ioctl,
97 1.3 ad nullstop, notty, nopoll, nommap, nokqfilter,
98 1.3 ad D_OTHER | D_MPSAFE
99 1.3 ad };
100 1.11 rmind
101 1.3 ad kmutex_t cpu_lock;
102 1.9 ad int ncpu;
103 1.9 ad int ncpuonline;
104 1.17 yamt bool mp_online;
105 1.24 ad struct cpuqueue cpu_queue = CIRCLEQ_HEAD_INITIALIZER(cpu_queue);
106 1.2 yamt
107 1.16 yamt static struct cpu_info *cpu_infos[MAXCPUS];
108 1.16 yamt
109 1.2 yamt int
110 1.2 yamt mi_cpu_attach(struct cpu_info *ci)
111 1.2 yamt {
112 1.2 yamt int error;
113 1.2 yamt
114 1.5 rmind ci->ci_index = ncpu;
115 1.24 ad cpu_infos[cpu_index(ci)] = ci;
116 1.24 ad CIRCLEQ_INSERT_TAIL(&cpu_queue, ci, ci_data.cpu_qchain);
117 1.30 ad TAILQ_INIT(&ci->ci_data.cpu_ld_locks);
118 1.30 ad __cpu_simple_lock_init(&ci->ci_data.cpu_ld_lock);
119 1.5 rmind
120 1.2 yamt sched_cpuattach(ci);
121 1.2 yamt
122 1.2 yamt error = create_idle_lwp(ci);
123 1.2 yamt if (error != 0) {
124 1.2 yamt /* XXX revert sched_cpuattach */
125 1.2 yamt return error;
126 1.2 yamt }
127 1.2 yamt
128 1.13 ad if (ci == curcpu())
129 1.13 ad ci->ci_data.cpu_onproc = curlwp;
130 1.13 ad else
131 1.13 ad ci->ci_data.cpu_onproc = ci->ci_data.cpu_idlelwp;
132 1.13 ad
133 1.17 yamt percpu_init_cpu(ci);
134 1.8 ad softint_init(ci);
135 1.27 ad callout_init_cpu(ci);
136 1.7 ad xc_init_cpu(ci);
137 1.14 ad pool_cache_cpu_init(ci);
138 1.22 ad selsysinit(ci);
139 1.23 ad cache_cpu_init(ci);
140 1.7 ad TAILQ_INIT(&ci->ci_data.cpu_biodone);
141 1.2 yamt ncpu++;
142 1.9 ad ncpuonline++;
143 1.2 yamt
144 1.2 yamt return 0;
145 1.2 yamt }
146 1.3 ad
/*
 * cpuctlattach:
 *
 *	Attach routine for cpuctl.  There is nothing to set up, so the
 *	argument is ignored.
 */
void
cpuctlattach(int dummy)
{

	/* Nothing to do. */
	(void)dummy;
}
152 1.3 ad
153 1.3 ad int
154 1.3 ad cpuctl_ioctl(dev_t dev, u_long cmd, void *data, int flag, lwp_t *l)
155 1.3 ad {
156 1.3 ad CPU_INFO_ITERATOR cii;
157 1.3 ad cpustate_t *cs;
158 1.3 ad struct cpu_info *ci;
159 1.3 ad int error, i;
160 1.3 ad u_int id;
161 1.3 ad
162 1.3 ad error = 0;
163 1.3 ad
164 1.3 ad mutex_enter(&cpu_lock);
165 1.3 ad switch (cmd) {
166 1.40 christos #ifdef IOC_CPU_OSETSTATE
167 1.40 christos cpustate_t csb;
168 1.40 christos
169 1.40 christos case IOC_CPU_OSETSTATE: {
170 1.40 christos cpustate50_t *ocs = data;
171 1.40 christos cpustate50_to_cpustate(ocs, &csb);
172 1.40 christos cs = &csb;
173 1.40 christos error = 1;
174 1.40 christos /*FALLTHROUGH*/
175 1.40 christos }
176 1.40 christos #endif
177 1.3 ad case IOC_CPU_SETSTATE:
178 1.40 christos if (error == 0)
179 1.40 christos cs = data;
180 1.20 elad error = kauth_authorize_system(l->l_cred,
181 1.20 elad KAUTH_SYSTEM_CPU, KAUTH_REQ_SYSTEM_CPU_SETSTATE, cs, NULL,
182 1.20 elad NULL);
183 1.3 ad if (error != 0)
184 1.3 ad break;
185 1.36 ad if (cs->cs_id >= __arraycount(cpu_infos) ||
186 1.36 ad (ci = cpu_lookup(cs->cs_id)) == NULL) {
187 1.3 ad error = ESRCH;
188 1.3 ad break;
189 1.3 ad }
190 1.3 ad if (!cs->cs_intr) {
191 1.3 ad error = EOPNOTSUPP;
192 1.3 ad break;
193 1.3 ad }
194 1.37 rmind error = cpu_setstate(ci, cs->cs_online);
195 1.3 ad break;
196 1.3 ad
197 1.40 christos #ifdef IOC_CPU_OGETSTATE
198 1.40 christos case IOC_CPU_OGETSTATE: {
199 1.40 christos cpustate50_t *ocs = data;
200 1.40 christos cpustate50_to_cpustate(ocs, &csb);
201 1.40 christos cs = &csb;
202 1.40 christos error = 1;
203 1.40 christos /*FALLTHROUGH*/
204 1.40 christos }
205 1.40 christos #endif
206 1.3 ad case IOC_CPU_GETSTATE:
207 1.40 christos if (error == 0)
208 1.40 christos cs = data;
209 1.3 ad id = cs->cs_id;
210 1.10 ad memset(cs, 0, sizeof(*cs));
211 1.3 ad cs->cs_id = id;
212 1.36 ad if (cs->cs_id >= __arraycount(cpu_infos) ||
213 1.36 ad (ci = cpu_lookup(id)) == NULL) {
214 1.3 ad error = ESRCH;
215 1.3 ad break;
216 1.3 ad }
217 1.3 ad if ((ci->ci_schedstate.spc_flags & SPCF_OFFLINE) != 0)
218 1.3 ad cs->cs_online = false;
219 1.3 ad else
220 1.3 ad cs->cs_online = true;
221 1.3 ad cs->cs_intr = true;
222 1.3 ad cs->cs_lastmod = ci->ci_schedstate.spc_lastmod;
223 1.40 christos #ifdef IOC_CPU_OGETSTATE
224 1.40 christos if (cmd == IOC_CPU_OGETSTATE) {
225 1.40 christos cpustate50_t *ocs = data;
226 1.40 christos cpustate_to_cpustate50(cs, ocs);
227 1.40 christos }
228 1.40 christos #endif
229 1.3 ad break;
230 1.3 ad
231 1.3 ad case IOC_CPU_MAPID:
232 1.3 ad i = 0;
233 1.3 ad for (CPU_INFO_FOREACH(cii, ci)) {
234 1.3 ad if (i++ == *(int *)data)
235 1.3 ad break;
236 1.3 ad }
237 1.3 ad if (ci == NULL)
238 1.3 ad error = ESRCH;
239 1.3 ad else
240 1.38 rmind *(int *)data = cpu_index(ci);
241 1.3 ad break;
242 1.3 ad
243 1.3 ad case IOC_CPU_GETCOUNT:
244 1.3 ad *(int *)data = ncpu;
245 1.3 ad break;
246 1.3 ad
247 1.3 ad default:
248 1.3 ad error = ENOTTY;
249 1.3 ad break;
250 1.3 ad }
251 1.3 ad mutex_exit(&cpu_lock);
252 1.3 ad
253 1.3 ad return error;
254 1.3 ad }
255 1.3 ad
256 1.3 ad struct cpu_info *
257 1.36 ad cpu_lookup(u_int idx)
258 1.16 yamt {
259 1.16 yamt struct cpu_info *ci = cpu_infos[idx];
260 1.16 yamt
261 1.36 ad KASSERT(idx < __arraycount(cpu_infos));
262 1.16 yamt KASSERT(ci == NULL || cpu_index(ci) == idx);
263 1.16 yamt
264 1.16 yamt return ci;
265 1.16 yamt }
266 1.16 yamt
267 1.7 ad static void
268 1.11 rmind cpu_xc_offline(struct cpu_info *ci)
269 1.7 ad {
270 1.11 rmind struct schedstate_percpu *spc, *mspc = NULL;
271 1.37 rmind struct cpu_info *target_ci;
272 1.11 rmind struct lwp *l;
273 1.11 rmind CPU_INFO_ITERATOR cii;
274 1.7 ad int s;
275 1.7 ad
276 1.37 rmind /*
277 1.37 rmind * Thread which sent unicast (separate context) is holding
278 1.37 rmind * the cpu_lock for us.
279 1.37 rmind */
280 1.11 rmind spc = &ci->ci_schedstate;
281 1.7 ad s = splsched();
282 1.7 ad spc->spc_flags |= SPCF_OFFLINE;
283 1.7 ad splx(s);
284 1.11 rmind
285 1.11 rmind /* Take the first available CPU for the migration */
286 1.37 rmind for (CPU_INFO_FOREACH(cii, target_ci)) {
287 1.37 rmind mspc = &target_ci->ci_schedstate;
288 1.11 rmind if ((mspc->spc_flags & SPCF_OFFLINE) == 0)
289 1.11 rmind break;
290 1.11 rmind }
291 1.37 rmind KASSERT(target_ci != NULL);
292 1.11 rmind
293 1.11 rmind /*
294 1.37 rmind * Migrate all non-bound threads to the other CPU. Note that this
295 1.37 rmind * runs from the xcall thread, thus handling of LSONPROC is not needed.
296 1.11 rmind */
297 1.28 ad mutex_enter(proc_lock);
298 1.11 rmind LIST_FOREACH(l, &alllwp, l_list) {
299 1.37 rmind struct cpu_info *mci;
300 1.37 rmind
301 1.35 yamt lwp_lock(l);
302 1.37 rmind if (l->l_cpu != ci || (l->l_pflag & (LP_BOUND | LP_INTR))) {
303 1.35 yamt lwp_unlock(l);
304 1.37 rmind continue;
305 1.11 rmind }
306 1.37 rmind /* Normal case - no affinity */
307 1.37 rmind if ((l->l_flag & LW_AFFINITY) == 0) {
308 1.37 rmind lwp_migrate(l, target_ci);
309 1.37 rmind continue;
310 1.37 rmind }
311 1.37 rmind /* Affinity is set, find an online CPU in the set */
312 1.37 rmind KASSERT(l->l_affinity != NULL);
313 1.37 rmind for (CPU_INFO_FOREACH(cii, mci)) {
314 1.37 rmind mspc = &mci->ci_schedstate;
315 1.37 rmind if ((mspc->spc_flags & SPCF_OFFLINE) == 0 &&
316 1.37 rmind kcpuset_isset(cpu_index(mci), l->l_affinity))
317 1.37 rmind break;
318 1.37 rmind }
319 1.37 rmind if (mci == NULL) {
320 1.37 rmind lwp_unlock(l);
321 1.37 rmind mutex_exit(proc_lock);
322 1.37 rmind goto fail;
323 1.37 rmind }
324 1.37 rmind lwp_migrate(l, mci);
325 1.11 rmind }
326 1.28 ad mutex_exit(proc_lock);
327 1.19 joerg
328 1.19 joerg #ifdef __HAVE_MD_CPU_OFFLINE
329 1.19 joerg cpu_offline_md();
330 1.19 joerg #endif
331 1.37 rmind return;
332 1.37 rmind fail:
333 1.37 rmind /* Just unset the SPCF_OFFLINE flag, caller will check */
334 1.37 rmind s = splsched();
335 1.37 rmind spc->spc_flags &= ~SPCF_OFFLINE;
336 1.37 rmind splx(s);
337 1.7 ad }
338 1.7 ad
339 1.7 ad static void
340 1.11 rmind cpu_xc_online(struct cpu_info *ci)
341 1.7 ad {
342 1.11 rmind struct schedstate_percpu *spc;
343 1.7 ad int s;
344 1.7 ad
345 1.11 rmind spc = &ci->ci_schedstate;
346 1.7 ad s = splsched();
347 1.7 ad spc->spc_flags &= ~SPCF_OFFLINE;
348 1.7 ad splx(s);
349 1.7 ad }
350 1.7 ad
351 1.3 ad int
352 1.37 rmind cpu_setstate(struct cpu_info *ci, bool online)
353 1.3 ad {
354 1.3 ad struct schedstate_percpu *spc;
355 1.3 ad CPU_INFO_ITERATOR cii;
356 1.3 ad struct cpu_info *ci2;
357 1.7 ad uint64_t where;
358 1.7 ad xcfunc_t func;
359 1.3 ad int nonline;
360 1.3 ad
361 1.3 ad spc = &ci->ci_schedstate;
362 1.3 ad
363 1.3 ad KASSERT(mutex_owned(&cpu_lock));
364 1.3 ad
365 1.3 ad if (online) {
366 1.3 ad if ((spc->spc_flags & SPCF_OFFLINE) == 0)
367 1.3 ad return 0;
368 1.7 ad func = (xcfunc_t)cpu_xc_online;
369 1.9 ad ncpuonline++;
370 1.3 ad } else {
371 1.3 ad if ((spc->spc_flags & SPCF_OFFLINE) != 0)
372 1.3 ad return 0;
373 1.3 ad nonline = 0;
374 1.33 ad /*
375 1.33 ad * Ensure that at least one CPU within the processor set
376 1.33 ad * stays online. Revisit this later.
377 1.33 ad */
378 1.3 ad for (CPU_INFO_FOREACH(cii, ci2)) {
379 1.33 ad if ((ci2->ci_schedstate.spc_flags & SPCF_OFFLINE) != 0)
380 1.33 ad continue;
381 1.33 ad if (ci2->ci_schedstate.spc_psid != spc->spc_psid)
382 1.33 ad continue;
383 1.33 ad nonline++;
384 1.3 ad }
385 1.3 ad if (nonline == 1)
386 1.3 ad return EBUSY;
387 1.7 ad func = (xcfunc_t)cpu_xc_offline;
388 1.9 ad ncpuonline--;
389 1.3 ad }
390 1.3 ad
391 1.11 rmind where = xc_unicast(0, func, ci, NULL, ci);
392 1.7 ad xc_wait(where);
393 1.11 rmind if (online) {
394 1.11 rmind KASSERT((spc->spc_flags & SPCF_OFFLINE) == 0);
395 1.37 rmind } else if ((spc->spc_flags & SPCF_OFFLINE) == 0) {
396 1.37 rmind /* If was not set offline, then it is busy */
397 1.37 rmind return EBUSY;
398 1.11 rmind }
399 1.37 rmind
400 1.7 ad spc->spc_lastmod = time_second;
401 1.3 ad return 0;
402 1.3 ad }
403 1.39 ad
404 1.39 ad bool
405 1.39 ad cpu_softintr_p(void)
406 1.39 ad {
407 1.39 ad
408 1.39 ad return (curlwp->l_pflag & LP_INTR) != 0;
409 1.39 ad }
410