Home | History | Annotate | Line # | Download | only in kern
kern_cpu.c revision 1.33
      1  1.33     ad /*	$NetBSD: kern_cpu.c,v 1.33 2008/06/22 13:59:06 ad Exp $	*/
      2   1.3     ad 
      3   1.3     ad /*-
      4  1.21     ad  * Copyright (c) 2007, 2008 The NetBSD Foundation, Inc.
      5   1.3     ad  * All rights reserved.
      6   1.3     ad  *
      7   1.3     ad  * This code is derived from software contributed to The NetBSD Foundation
      8   1.3     ad  * by Andrew Doran.
      9   1.3     ad  *
     10   1.3     ad  * Redistribution and use in source and binary forms, with or without
     11   1.3     ad  * modification, are permitted provided that the following conditions
     12   1.3     ad  * are met:
     13   1.3     ad  * 1. Redistributions of source code must retain the above copyright
     14   1.3     ad  *    notice, this list of conditions and the following disclaimer.
     15   1.3     ad  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.3     ad  *    notice, this list of conditions and the following disclaimer in the
     17   1.3     ad  *    documentation and/or other materials provided with the distribution.
     18   1.3     ad  *
     19   1.3     ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.3     ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.3     ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.3     ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.3     ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.3     ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.3     ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.3     ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.3     ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.3     ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.3     ad  * POSSIBILITY OF SUCH DAMAGE.
     30   1.3     ad  */
     31   1.2   yamt 
     32   1.2   yamt /*-
     33   1.2   yamt  * Copyright (c)2007 YAMAMOTO Takashi,
     34   1.2   yamt  * All rights reserved.
     35   1.2   yamt  *
     36   1.2   yamt  * Redistribution and use in source and binary forms, with or without
     37   1.2   yamt  * modification, are permitted provided that the following conditions
     38   1.2   yamt  * are met:
     39   1.2   yamt  * 1. Redistributions of source code must retain the above copyright
     40   1.2   yamt  *    notice, this list of conditions and the following disclaimer.
     41   1.2   yamt  * 2. Redistributions in binary form must reproduce the above copyright
     42   1.2   yamt  *    notice, this list of conditions and the following disclaimer in the
     43   1.2   yamt  *    documentation and/or other materials provided with the distribution.
     44   1.2   yamt  *
     45   1.2   yamt  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     46   1.2   yamt  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     47   1.2   yamt  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     48   1.2   yamt  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     49   1.2   yamt  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     50   1.2   yamt  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     51   1.2   yamt  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     52   1.2   yamt  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     53   1.2   yamt  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     54   1.2   yamt  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     55   1.2   yamt  * SUCH DAMAGE.
     56   1.2   yamt  */
     57   1.2   yamt 
     58   1.2   yamt #include <sys/cdefs.h>
     59   1.2   yamt 
     60  1.33     ad __KERNEL_RCSID(0, "$NetBSD: kern_cpu.c,v 1.33 2008/06/22 13:59:06 ad Exp $");
     61   1.2   yamt 
     62   1.2   yamt #include <sys/param.h>
     63   1.2   yamt #include <sys/systm.h>
     64   1.2   yamt #include <sys/idle.h>
     65   1.2   yamt #include <sys/sched.h>
     66   1.8     ad #include <sys/intr.h>
     67   1.3     ad #include <sys/conf.h>
     68   1.3     ad #include <sys/cpu.h>
     69   1.3     ad #include <sys/cpuio.h>
     70   1.3     ad #include <sys/proc.h>
     71  1.17   yamt #include <sys/percpu.h>
     72   1.3     ad #include <sys/kernel.h>
     73   1.3     ad #include <sys/kauth.h>
     74   1.7     ad #include <sys/xcall.h>
     75   1.7     ad #include <sys/pool.h>
     76  1.21     ad #include <sys/kmem.h>
     77  1.22     ad #include <sys/select.h>
     78  1.23     ad #include <sys/namei.h>
     79  1.27     ad #include <sys/callout.h>
     80   1.3     ad 
     81   1.6     ad #include <uvm/uvm_extern.h>
     82   1.6     ad 
/* Attach hook for the cpuctl device; defined later in this file as a no-op. */
void	cpuctlattach(int);

/* Handlers that cpu_setonline() dispatches through xc_unicast(). */
static void	cpu_xc_online(struct cpu_info *);
static void	cpu_xc_offline(struct cpu_info *);

/* Declare cpuctl_ioctl() with the standard device ioctl prototype. */
dev_type_ioctl(cpuctl_ioctl);

/*
 * Character device switch for cpuctl.  cpuctl_ioctl is the only handler
 * defined in this file; every other slot is filled with one of the
 * null*/no* entries.
 */
const struct cdevsw cpuctl_cdevsw = {
	nullopen, nullclose, nullread, nullwrite, cpuctl_ioctl,
	nullstop, notty, nopoll, nommap, nokqfilter,
	D_OTHER | D_MPSAFE
};

/*
 * cpu_lock:	held across every cpuctl ioctl; cpu_setonline() asserts that
 *		the caller owns it.
 * ncpu:	number of CPUs attached through mi_cpu_attach(); its current
 *		value is handed out as the next ci_index.
 * ncpuonline:	bumped on attach and adjusted by cpu_setonline().
 * mp_online:	not referenced anywhere else in this file.
 * cpu_queue:	queue of attached CPUs; mi_cpu_attach() appends to its tail.
 */
kmutex_t cpu_lock;
int	ncpu;
int	ncpuonline;
bool	mp_online;
struct	cpuqueue cpu_queue = CIRCLEQ_HEAD_INITIALIZER(cpu_queue);

/*
 * Table mapping cpu_index(ci) to its cpu_info.  Slots are filled by
 * mi_cpu_attach() and read by cpu_lookup_byindex().
 */
static struct cpu_info *cpu_infos[MAXCPUS];
    103  1.16   yamt 
    104   1.2   yamt int
    105   1.2   yamt mi_cpu_attach(struct cpu_info *ci)
    106   1.2   yamt {
    107   1.2   yamt 	int error;
    108   1.2   yamt 
    109   1.5  rmind 	ci->ci_index = ncpu;
    110  1.24     ad 	cpu_infos[cpu_index(ci)] = ci;
    111  1.24     ad 	CIRCLEQ_INSERT_TAIL(&cpu_queue, ci, ci_data.cpu_qchain);
    112  1.30     ad 	TAILQ_INIT(&ci->ci_data.cpu_ld_locks);
    113  1.30     ad 	__cpu_simple_lock_init(&ci->ci_data.cpu_ld_lock);
    114   1.5  rmind 
    115   1.2   yamt 	sched_cpuattach(ci);
    116   1.2   yamt 
    117   1.2   yamt 	error = create_idle_lwp(ci);
    118   1.2   yamt 	if (error != 0) {
    119   1.2   yamt 		/* XXX revert sched_cpuattach */
    120   1.2   yamt 		return error;
    121   1.2   yamt 	}
    122   1.2   yamt 
    123  1.13     ad 	if (ci == curcpu())
    124  1.13     ad 		ci->ci_data.cpu_onproc = curlwp;
    125  1.13     ad 	else
    126  1.13     ad 		ci->ci_data.cpu_onproc = ci->ci_data.cpu_idlelwp;
    127  1.13     ad 
    128  1.17   yamt 	percpu_init_cpu(ci);
    129   1.8     ad 	softint_init(ci);
    130  1.27     ad 	callout_init_cpu(ci);
    131   1.7     ad 	xc_init_cpu(ci);
    132  1.14     ad 	pool_cache_cpu_init(ci);
    133  1.22     ad 	selsysinit(ci);
    134  1.23     ad 	cache_cpu_init(ci);
    135   1.7     ad 	TAILQ_INIT(&ci->ci_data.cpu_biodone);
    136   1.2   yamt 	ncpu++;
    137   1.9     ad 	ncpuonline++;
    138   1.2   yamt 
    139   1.2   yamt 	return 0;
    140   1.2   yamt }
    141   1.3     ad 
/*
 * cpuctlattach: attach hook for the cpuctl device.  Nothing needs to be
 * set up here, so the argument is ignored.
 */
void
cpuctlattach(int dummy)
{
	(void)dummy;
}
    147   1.3     ad 
    148   1.3     ad int
    149   1.3     ad cpuctl_ioctl(dev_t dev, u_long cmd, void *data, int flag, lwp_t *l)
    150   1.3     ad {
    151   1.3     ad 	CPU_INFO_ITERATOR cii;
    152   1.3     ad 	cpustate_t *cs;
    153   1.3     ad 	struct cpu_info *ci;
    154   1.3     ad 	int error, i;
    155   1.3     ad 	u_int id;
    156   1.3     ad 
    157   1.3     ad 	error = 0;
    158   1.3     ad 
    159   1.3     ad 	mutex_enter(&cpu_lock);
    160   1.3     ad 	switch (cmd) {
    161   1.3     ad 	case IOC_CPU_SETSTATE:
    162  1.20   elad 		cs = data;
    163  1.20   elad 		error = kauth_authorize_system(l->l_cred,
    164  1.20   elad 		    KAUTH_SYSTEM_CPU, KAUTH_REQ_SYSTEM_CPU_SETSTATE, cs, NULL,
    165  1.20   elad 		    NULL);
    166   1.3     ad 		if (error != 0)
    167   1.3     ad 			break;
    168   1.3     ad 		if ((ci = cpu_lookup(cs->cs_id)) == NULL) {
    169   1.3     ad 			error = ESRCH;
    170   1.3     ad 			break;
    171   1.3     ad 		}
    172   1.3     ad 		if (!cs->cs_intr) {
    173   1.3     ad 			error = EOPNOTSUPP;
    174   1.3     ad 			break;
    175   1.3     ad 		}
    176   1.3     ad 		error = cpu_setonline(ci, cs->cs_online);
    177   1.3     ad 		break;
    178   1.3     ad 
    179   1.3     ad 	case IOC_CPU_GETSTATE:
    180   1.3     ad 		cs = data;
    181   1.3     ad 		id = cs->cs_id;
    182  1.10     ad 		memset(cs, 0, sizeof(*cs));
    183   1.3     ad 		cs->cs_id = id;
    184   1.3     ad 		if ((ci = cpu_lookup(id)) == NULL) {
    185   1.3     ad 			error = ESRCH;
    186   1.3     ad 			break;
    187   1.3     ad 		}
    188   1.3     ad 		if ((ci->ci_schedstate.spc_flags & SPCF_OFFLINE) != 0)
    189   1.3     ad 			cs->cs_online = false;
    190   1.3     ad 		else
    191   1.3     ad 			cs->cs_online = true;
    192   1.3     ad 		cs->cs_intr = true;
    193   1.3     ad 		cs->cs_lastmod = ci->ci_schedstate.spc_lastmod;
    194   1.3     ad 		break;
    195   1.3     ad 
    196   1.3     ad 	case IOC_CPU_MAPID:
    197   1.3     ad 		i = 0;
    198   1.3     ad 		for (CPU_INFO_FOREACH(cii, ci)) {
    199   1.3     ad 			if (i++ == *(int *)data)
    200   1.3     ad 				break;
    201   1.3     ad 		}
    202   1.3     ad 		if (ci == NULL)
    203   1.3     ad 			error = ESRCH;
    204   1.3     ad 		else
    205   1.3     ad 			*(int *)data = ci->ci_cpuid;
    206   1.3     ad 		break;
    207   1.3     ad 
    208   1.3     ad 	case IOC_CPU_GETCOUNT:
    209   1.3     ad 		*(int *)data = ncpu;
    210   1.3     ad 		break;
    211   1.3     ad 
    212   1.3     ad 	default:
    213   1.3     ad 		error = ENOTTY;
    214   1.3     ad 		break;
    215   1.3     ad 	}
    216   1.3     ad 	mutex_exit(&cpu_lock);
    217   1.3     ad 
    218   1.3     ad 	return error;
    219   1.3     ad }
    220   1.3     ad 
    221   1.3     ad struct cpu_info *
    222   1.3     ad cpu_lookup(cpuid_t id)
    223   1.3     ad {
    224   1.3     ad 	CPU_INFO_ITERATOR cii;
    225   1.3     ad 	struct cpu_info *ci;
    226   1.3     ad 
    227   1.3     ad 	for (CPU_INFO_FOREACH(cii, ci)) {
    228   1.3     ad 		if (ci->ci_cpuid == id)
    229   1.3     ad 			return ci;
    230   1.3     ad 	}
    231   1.3     ad 
    232   1.3     ad 	return NULL;
    233   1.3     ad }
    234   1.3     ad 
    235  1.16   yamt struct cpu_info *
    236  1.16   yamt cpu_lookup_byindex(u_int idx)
    237  1.16   yamt {
    238  1.16   yamt 	struct cpu_info *ci = cpu_infos[idx];
    239  1.16   yamt 
    240  1.16   yamt 	KASSERT(idx < MAXCPUS);
    241  1.16   yamt 	KASSERT(ci == NULL || cpu_index(ci) == idx);
    242  1.16   yamt 
    243  1.16   yamt 	return ci;
    244  1.16   yamt }
    245  1.16   yamt 
    246   1.7     ad static void
    247  1.11  rmind cpu_xc_offline(struct cpu_info *ci)
    248   1.7     ad {
    249  1.11  rmind 	struct schedstate_percpu *spc, *mspc = NULL;
    250  1.11  rmind 	struct cpu_info *mci;
    251  1.11  rmind 	struct lwp *l;
    252  1.11  rmind 	CPU_INFO_ITERATOR cii;
    253   1.7     ad 	int s;
    254   1.7     ad 
    255  1.11  rmind 	spc = &ci->ci_schedstate;
    256   1.7     ad 	s = splsched();
    257   1.7     ad 	spc->spc_flags |= SPCF_OFFLINE;
    258   1.7     ad 	splx(s);
    259  1.11  rmind 
    260  1.11  rmind 	/* Take the first available CPU for the migration */
    261  1.11  rmind 	for (CPU_INFO_FOREACH(cii, mci)) {
    262  1.11  rmind 		mspc = &mci->ci_schedstate;
    263  1.11  rmind 		if ((mspc->spc_flags & SPCF_OFFLINE) == 0)
    264  1.11  rmind 			break;
    265  1.11  rmind 	}
    266  1.11  rmind 	KASSERT(mci != NULL);
    267  1.11  rmind 
    268  1.11  rmind 	/*
    269  1.11  rmind 	 * Migrate all non-bound threads to the other CPU.
    270  1.31  rmind 	 *
    271  1.11  rmind 	 * Please note, that this runs from the xcall thread, thus handling
    272  1.31  rmind 	 * of LSONPROC is not needed.  Threads which change the state will
    273  1.31  rmind 	 * be handled by sched_takecpu().
    274  1.11  rmind 	 */
    275  1.28     ad 	mutex_enter(proc_lock);
    276  1.31  rmind 	spc_dlock(ci, mci);
    277  1.11  rmind 	LIST_FOREACH(l, &alllwp, l_list) {
    278  1.11  rmind 		lwp_lock(l);
    279  1.31  rmind 		if (l->l_cpu != ci || (l->l_pflag & LP_BOUND) != 0) {
    280  1.31  rmind 			lwp_unlock(l);
    281  1.31  rmind 			continue;
    282  1.11  rmind 		}
    283  1.11  rmind 		if (l->l_stat == LSRUN && (l->l_flag & LW_INMEM) != 0) {
    284  1.11  rmind 			sched_dequeue(l);
    285  1.11  rmind 			l->l_cpu = mci;
    286  1.11  rmind 			lwp_setlock(l, mspc->spc_mutex);
    287  1.11  rmind 			sched_enqueue(l, false);
    288  1.31  rmind 			lwp_unlock(l);
    289  1.31  rmind 		} else {
    290  1.31  rmind 			lwp_migrate(l, mci);
    291  1.11  rmind 		}
    292  1.11  rmind 	}
    293  1.18  rmind 	spc_dunlock(ci, mci);
    294  1.28     ad 	mutex_exit(proc_lock);
    295  1.19  joerg 
    296  1.19  joerg #ifdef __HAVE_MD_CPU_OFFLINE
    297  1.19  joerg 	cpu_offline_md();
    298  1.19  joerg #endif
    299   1.7     ad }
    300   1.7     ad 
    301   1.7     ad static void
    302  1.11  rmind cpu_xc_online(struct cpu_info *ci)
    303   1.7     ad {
    304  1.11  rmind 	struct schedstate_percpu *spc;
    305   1.7     ad 	int s;
    306   1.7     ad 
    307  1.11  rmind 	spc = &ci->ci_schedstate;
    308   1.7     ad 	s = splsched();
    309   1.7     ad 	spc->spc_flags &= ~SPCF_OFFLINE;
    310   1.7     ad 	splx(s);
    311   1.7     ad }
    312   1.7     ad 
    313   1.3     ad int
    314   1.3     ad cpu_setonline(struct cpu_info *ci, bool online)
    315   1.3     ad {
    316   1.3     ad 	struct schedstate_percpu *spc;
    317   1.3     ad 	CPU_INFO_ITERATOR cii;
    318   1.3     ad 	struct cpu_info *ci2;
    319   1.7     ad 	uint64_t where;
    320   1.7     ad 	xcfunc_t func;
    321   1.3     ad 	int nonline;
    322   1.3     ad 
    323   1.3     ad 	spc = &ci->ci_schedstate;
    324   1.3     ad 
    325   1.3     ad 	KASSERT(mutex_owned(&cpu_lock));
    326   1.3     ad 
    327   1.3     ad 	if (online) {
    328   1.3     ad 		if ((spc->spc_flags & SPCF_OFFLINE) == 0)
    329   1.3     ad 			return 0;
    330   1.7     ad 		func = (xcfunc_t)cpu_xc_online;
    331   1.9     ad 		ncpuonline++;
    332   1.3     ad 	} else {
    333   1.3     ad 		if ((spc->spc_flags & SPCF_OFFLINE) != 0)
    334   1.3     ad 			return 0;
    335   1.3     ad 		nonline = 0;
    336  1.33     ad 		/*
    337  1.33     ad 		 * Ensure that at least one CPU within the processor set
    338  1.33     ad 		 * stays online.  Revisit this later.
    339  1.33     ad 		 */
    340   1.3     ad 		for (CPU_INFO_FOREACH(cii, ci2)) {
    341  1.33     ad 			if ((ci2->ci_schedstate.spc_flags & SPCF_OFFLINE) != 0)
    342  1.33     ad 				continue;
    343  1.33     ad 			if (ci2->ci_schedstate.spc_psid != spc->spc_psid)
    344  1.33     ad 				continue;
    345  1.33     ad 			nonline++;
    346   1.3     ad 		}
    347   1.3     ad 		if (nonline == 1)
    348   1.3     ad 			return EBUSY;
    349   1.7     ad 		func = (xcfunc_t)cpu_xc_offline;
    350   1.9     ad 		ncpuonline--;
    351   1.3     ad 	}
    352   1.3     ad 
    353  1.11  rmind 	where = xc_unicast(0, func, ci, NULL, ci);
    354   1.7     ad 	xc_wait(where);
    355  1.11  rmind 	if (online) {
    356  1.11  rmind 		KASSERT((spc->spc_flags & SPCF_OFFLINE) == 0);
    357  1.11  rmind 	} else {
    358  1.11  rmind 		KASSERT(spc->spc_flags & SPCF_OFFLINE);
    359  1.11  rmind 	}
    360   1.7     ad 	spc->spc_lastmod = time_second;
    361   1.7     ad 
    362   1.3     ad 	return 0;
    363   1.3     ad }
    364