Home | History | Annotate | Line # | Download | only in kern
kern_cpu.c revision 1.38
      1  1.38  rmind /*	$NetBSD: kern_cpu.c,v 1.38 2008/11/06 16:48:51 rmind Exp $	*/
      2   1.3     ad 
      3   1.3     ad /*-
      4  1.21     ad  * Copyright (c) 2007, 2008 The NetBSD Foundation, Inc.
      5   1.3     ad  * All rights reserved.
      6   1.3     ad  *
      7   1.3     ad  * This code is derived from software contributed to The NetBSD Foundation
      8   1.3     ad  * by Andrew Doran.
      9   1.3     ad  *
     10   1.3     ad  * Redistribution and use in source and binary forms, with or without
     11   1.3     ad  * modification, are permitted provided that the following conditions
     12   1.3     ad  * are met:
     13   1.3     ad  * 1. Redistributions of source code must retain the above copyright
     14   1.3     ad  *    notice, this list of conditions and the following disclaimer.
     15   1.3     ad  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.3     ad  *    notice, this list of conditions and the following disclaimer in the
     17   1.3     ad  *    documentation and/or other materials provided with the distribution.
     18   1.3     ad  *
     19   1.3     ad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.3     ad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.3     ad  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.3     ad  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.3     ad  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.3     ad  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.3     ad  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.3     ad  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.3     ad  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.3     ad  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.3     ad  * POSSIBILITY OF SUCH DAMAGE.
     30   1.3     ad  */
     31   1.2   yamt 
     32   1.2   yamt /*-
     33   1.2   yamt  * Copyright (c)2007 YAMAMOTO Takashi,
     34   1.2   yamt  * All rights reserved.
     35   1.2   yamt  *
     36   1.2   yamt  * Redistribution and use in source and binary forms, with or without
     37   1.2   yamt  * modification, are permitted provided that the following conditions
     38   1.2   yamt  * are met:
     39   1.2   yamt  * 1. Redistributions of source code must retain the above copyright
     40   1.2   yamt  *    notice, this list of conditions and the following disclaimer.
     41   1.2   yamt  * 2. Redistributions in binary form must reproduce the above copyright
     42   1.2   yamt  *    notice, this list of conditions and the following disclaimer in the
     43   1.2   yamt  *    documentation and/or other materials provided with the distribution.
     44   1.2   yamt  *
     45   1.2   yamt  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     46   1.2   yamt  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     47   1.2   yamt  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     48   1.2   yamt  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     49   1.2   yamt  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     50   1.2   yamt  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     51   1.2   yamt  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     52   1.2   yamt  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     53   1.2   yamt  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     54   1.2   yamt  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     55   1.2   yamt  * SUCH DAMAGE.
     56   1.2   yamt  */
     57   1.2   yamt 
     58   1.2   yamt #include <sys/cdefs.h>
     59  1.38  rmind __KERNEL_RCSID(0, "$NetBSD: kern_cpu.c,v 1.38 2008/11/06 16:48:51 rmind Exp $");
     60   1.2   yamt 
     61   1.2   yamt #include <sys/param.h>
     62   1.2   yamt #include <sys/systm.h>
     63   1.2   yamt #include <sys/idle.h>
     64   1.2   yamt #include <sys/sched.h>
     65   1.8     ad #include <sys/intr.h>
     66   1.3     ad #include <sys/conf.h>
     67   1.3     ad #include <sys/cpu.h>
     68   1.3     ad #include <sys/cpuio.h>
     69   1.3     ad #include <sys/proc.h>
     70  1.17   yamt #include <sys/percpu.h>
     71   1.3     ad #include <sys/kernel.h>
     72   1.3     ad #include <sys/kauth.h>
     73   1.7     ad #include <sys/xcall.h>
     74   1.7     ad #include <sys/pool.h>
     75  1.21     ad #include <sys/kmem.h>
     76  1.22     ad #include <sys/select.h>
     77  1.23     ad #include <sys/namei.h>
     78  1.27     ad #include <sys/callout.h>
     79   1.3     ad 
     80   1.6     ad #include <uvm/uvm_extern.h>
     81   1.6     ad 
     82   1.3     ad void	cpuctlattach(int);
     83   1.3     ad 
     84  1.11  rmind static void	cpu_xc_online(struct cpu_info *);
     85  1.11  rmind static void	cpu_xc_offline(struct cpu_info *);
     86   1.7     ad 
     87   1.3     ad dev_type_ioctl(cpuctl_ioctl);
     88   1.3     ad 
     89   1.3     ad const struct cdevsw cpuctl_cdevsw = {
     90   1.3     ad 	nullopen, nullclose, nullread, nullwrite, cpuctl_ioctl,
     91   1.3     ad 	nullstop, notty, nopoll, nommap, nokqfilter,
     92   1.3     ad 	D_OTHER | D_MPSAFE
     93   1.3     ad };
     94  1.11  rmind 
     95   1.3     ad kmutex_t cpu_lock;
     96   1.9     ad int	ncpu;
     97   1.9     ad int	ncpuonline;
     98  1.17   yamt bool	mp_online;
     99  1.24     ad struct	cpuqueue cpu_queue = CIRCLEQ_HEAD_INITIALIZER(cpu_queue);
    100   1.2   yamt 
    101  1.16   yamt static struct cpu_info *cpu_infos[MAXCPUS];
    102  1.16   yamt 
    103   1.2   yamt int
    104   1.2   yamt mi_cpu_attach(struct cpu_info *ci)
    105   1.2   yamt {
    106   1.2   yamt 	int error;
    107   1.2   yamt 
    108   1.5  rmind 	ci->ci_index = ncpu;
    109  1.24     ad 	cpu_infos[cpu_index(ci)] = ci;
    110  1.24     ad 	CIRCLEQ_INSERT_TAIL(&cpu_queue, ci, ci_data.cpu_qchain);
    111  1.30     ad 	TAILQ_INIT(&ci->ci_data.cpu_ld_locks);
    112  1.30     ad 	__cpu_simple_lock_init(&ci->ci_data.cpu_ld_lock);
    113   1.5  rmind 
    114   1.2   yamt 	sched_cpuattach(ci);
    115   1.2   yamt 
    116   1.2   yamt 	error = create_idle_lwp(ci);
    117   1.2   yamt 	if (error != 0) {
    118   1.2   yamt 		/* XXX revert sched_cpuattach */
    119   1.2   yamt 		return error;
    120   1.2   yamt 	}
    121   1.2   yamt 
    122  1.13     ad 	if (ci == curcpu())
    123  1.13     ad 		ci->ci_data.cpu_onproc = curlwp;
    124  1.13     ad 	else
    125  1.13     ad 		ci->ci_data.cpu_onproc = ci->ci_data.cpu_idlelwp;
    126  1.13     ad 
    127  1.17   yamt 	percpu_init_cpu(ci);
    128   1.8     ad 	softint_init(ci);
    129  1.27     ad 	callout_init_cpu(ci);
    130   1.7     ad 	xc_init_cpu(ci);
    131  1.14     ad 	pool_cache_cpu_init(ci);
    132  1.22     ad 	selsysinit(ci);
    133  1.23     ad 	cache_cpu_init(ci);
    134   1.7     ad 	TAILQ_INIT(&ci->ci_data.cpu_biodone);
    135   1.2   yamt 	ncpu++;
    136   1.9     ad 	ncpuonline++;
    137   1.2   yamt 
    138   1.2   yamt 	return 0;
    139   1.2   yamt }
    140   1.3     ad 
/*
 * cpuctlattach:
 *
 *	Attach routine for cpuctl.  Performs no work; the argument is
 *	ignored.
 */
void
cpuctlattach(int dummy)
{

	(void)dummy;
}
    146   1.3     ad 
    147   1.3     ad int
    148   1.3     ad cpuctl_ioctl(dev_t dev, u_long cmd, void *data, int flag, lwp_t *l)
    149   1.3     ad {
    150   1.3     ad 	CPU_INFO_ITERATOR cii;
    151   1.3     ad 	cpustate_t *cs;
    152   1.3     ad 	struct cpu_info *ci;
    153   1.3     ad 	int error, i;
    154   1.3     ad 	u_int id;
    155   1.3     ad 
    156   1.3     ad 	error = 0;
    157   1.3     ad 
    158   1.3     ad 	mutex_enter(&cpu_lock);
    159   1.3     ad 	switch (cmd) {
    160   1.3     ad 	case IOC_CPU_SETSTATE:
    161  1.20   elad 		cs = data;
    162  1.20   elad 		error = kauth_authorize_system(l->l_cred,
    163  1.20   elad 		    KAUTH_SYSTEM_CPU, KAUTH_REQ_SYSTEM_CPU_SETSTATE, cs, NULL,
    164  1.20   elad 		    NULL);
    165   1.3     ad 		if (error != 0)
    166   1.3     ad 			break;
    167  1.36     ad 		if (cs->cs_id >= __arraycount(cpu_infos) ||
    168  1.36     ad 		    (ci = cpu_lookup(cs->cs_id)) == NULL) {
    169   1.3     ad 			error = ESRCH;
    170   1.3     ad 			break;
    171   1.3     ad 		}
    172   1.3     ad 		if (!cs->cs_intr) {
    173   1.3     ad 			error = EOPNOTSUPP;
    174   1.3     ad 			break;
    175   1.3     ad 		}
    176  1.37  rmind 		error = cpu_setstate(ci, cs->cs_online);
    177   1.3     ad 		break;
    178   1.3     ad 
    179   1.3     ad 	case IOC_CPU_GETSTATE:
    180   1.3     ad 		cs = data;
    181   1.3     ad 		id = cs->cs_id;
    182  1.10     ad 		memset(cs, 0, sizeof(*cs));
    183   1.3     ad 		cs->cs_id = id;
    184  1.36     ad 		if (cs->cs_id >= __arraycount(cpu_infos) ||
    185  1.36     ad 		    (ci = cpu_lookup(id)) == NULL) {
    186   1.3     ad 			error = ESRCH;
    187   1.3     ad 			break;
    188   1.3     ad 		}
    189   1.3     ad 		if ((ci->ci_schedstate.spc_flags & SPCF_OFFLINE) != 0)
    190   1.3     ad 			cs->cs_online = false;
    191   1.3     ad 		else
    192   1.3     ad 			cs->cs_online = true;
    193   1.3     ad 		cs->cs_intr = true;
    194   1.3     ad 		cs->cs_lastmod = ci->ci_schedstate.spc_lastmod;
    195   1.3     ad 		break;
    196   1.3     ad 
    197   1.3     ad 	case IOC_CPU_MAPID:
    198   1.3     ad 		i = 0;
    199   1.3     ad 		for (CPU_INFO_FOREACH(cii, ci)) {
    200   1.3     ad 			if (i++ == *(int *)data)
    201   1.3     ad 				break;
    202   1.3     ad 		}
    203   1.3     ad 		if (ci == NULL)
    204   1.3     ad 			error = ESRCH;
    205   1.3     ad 		else
    206  1.38  rmind 			*(int *)data = cpu_index(ci);
    207   1.3     ad 		break;
    208   1.3     ad 
    209   1.3     ad 	case IOC_CPU_GETCOUNT:
    210   1.3     ad 		*(int *)data = ncpu;
    211   1.3     ad 		break;
    212   1.3     ad 
    213   1.3     ad 	default:
    214   1.3     ad 		error = ENOTTY;
    215   1.3     ad 		break;
    216   1.3     ad 	}
    217   1.3     ad 	mutex_exit(&cpu_lock);
    218   1.3     ad 
    219   1.3     ad 	return error;
    220   1.3     ad }
    221   1.3     ad 
    222   1.3     ad struct cpu_info *
    223  1.36     ad cpu_lookup(u_int idx)
    224  1.16   yamt {
    225  1.16   yamt 	struct cpu_info *ci = cpu_infos[idx];
    226  1.16   yamt 
    227  1.36     ad 	KASSERT(idx < __arraycount(cpu_infos));
    228  1.16   yamt 	KASSERT(ci == NULL || cpu_index(ci) == idx);
    229  1.16   yamt 
    230  1.16   yamt 	return ci;
    231  1.16   yamt }
    232  1.16   yamt 
    233   1.7     ad static void
    234  1.11  rmind cpu_xc_offline(struct cpu_info *ci)
    235   1.7     ad {
    236  1.11  rmind 	struct schedstate_percpu *spc, *mspc = NULL;
    237  1.37  rmind 	struct cpu_info *target_ci;
    238  1.11  rmind 	struct lwp *l;
    239  1.11  rmind 	CPU_INFO_ITERATOR cii;
    240   1.7     ad 	int s;
    241   1.7     ad 
    242  1.37  rmind 	/*
    243  1.37  rmind 	 * Thread which sent unicast (separate context) is holding
    244  1.37  rmind 	 * the cpu_lock for us.
    245  1.37  rmind 	 */
    246  1.11  rmind 	spc = &ci->ci_schedstate;
    247   1.7     ad 	s = splsched();
    248   1.7     ad 	spc->spc_flags |= SPCF_OFFLINE;
    249   1.7     ad 	splx(s);
    250  1.11  rmind 
    251  1.11  rmind 	/* Take the first available CPU for the migration */
    252  1.37  rmind 	for (CPU_INFO_FOREACH(cii, target_ci)) {
    253  1.37  rmind 		mspc = &target_ci->ci_schedstate;
    254  1.11  rmind 		if ((mspc->spc_flags & SPCF_OFFLINE) == 0)
    255  1.11  rmind 			break;
    256  1.11  rmind 	}
    257  1.37  rmind 	KASSERT(target_ci != NULL);
    258  1.11  rmind 
    259  1.11  rmind 	/*
    260  1.37  rmind 	 * Migrate all non-bound threads to the other CPU.  Note that this
    261  1.37  rmind 	 * runs from the xcall thread, thus handling of LSONPROC is not needed.
    262  1.11  rmind 	 */
    263  1.28     ad 	mutex_enter(proc_lock);
    264  1.11  rmind 	LIST_FOREACH(l, &alllwp, l_list) {
    265  1.37  rmind 		struct cpu_info *mci;
    266  1.37  rmind 
    267  1.35   yamt 		lwp_lock(l);
    268  1.37  rmind 		if (l->l_cpu != ci || (l->l_pflag & (LP_BOUND | LP_INTR))) {
    269  1.35   yamt 			lwp_unlock(l);
    270  1.37  rmind 			continue;
    271  1.11  rmind 		}
    272  1.37  rmind 		/* Normal case - no affinity */
    273  1.37  rmind 		if ((l->l_flag & LW_AFFINITY) == 0) {
    274  1.37  rmind 			lwp_migrate(l, target_ci);
    275  1.37  rmind 			continue;
    276  1.37  rmind 		}
    277  1.37  rmind 		/* Affinity is set, find an online CPU in the set */
    278  1.37  rmind 		KASSERT(l->l_affinity != NULL);
    279  1.37  rmind 		for (CPU_INFO_FOREACH(cii, mci)) {
    280  1.37  rmind 			mspc = &mci->ci_schedstate;
    281  1.37  rmind 			if ((mspc->spc_flags & SPCF_OFFLINE) == 0 &&
    282  1.37  rmind 			    kcpuset_isset(cpu_index(mci), l->l_affinity))
    283  1.37  rmind 				break;
    284  1.37  rmind 		}
    285  1.37  rmind 		if (mci == NULL) {
    286  1.37  rmind 			lwp_unlock(l);
    287  1.37  rmind 			mutex_exit(proc_lock);
    288  1.37  rmind 			goto fail;
    289  1.37  rmind 		}
    290  1.37  rmind 		lwp_migrate(l, mci);
    291  1.11  rmind 	}
    292  1.28     ad 	mutex_exit(proc_lock);
    293  1.19  joerg 
    294  1.19  joerg #ifdef __HAVE_MD_CPU_OFFLINE
    295  1.19  joerg 	cpu_offline_md();
    296  1.19  joerg #endif
    297  1.37  rmind 	return;
    298  1.37  rmind fail:
    299  1.37  rmind 	/* Just unset the SPCF_OFFLINE flag, caller will check */
    300  1.37  rmind 	s = splsched();
    301  1.37  rmind 	spc->spc_flags &= ~SPCF_OFFLINE;
    302  1.37  rmind 	splx(s);
    303   1.7     ad }
    304   1.7     ad 
    305   1.7     ad static void
    306  1.11  rmind cpu_xc_online(struct cpu_info *ci)
    307   1.7     ad {
    308  1.11  rmind 	struct schedstate_percpu *spc;
    309   1.7     ad 	int s;
    310   1.7     ad 
    311  1.11  rmind 	spc = &ci->ci_schedstate;
    312   1.7     ad 	s = splsched();
    313   1.7     ad 	spc->spc_flags &= ~SPCF_OFFLINE;
    314   1.7     ad 	splx(s);
    315   1.7     ad }
    316   1.7     ad 
    317   1.3     ad int
    318  1.37  rmind cpu_setstate(struct cpu_info *ci, bool online)
    319   1.3     ad {
    320   1.3     ad 	struct schedstate_percpu *spc;
    321   1.3     ad 	CPU_INFO_ITERATOR cii;
    322   1.3     ad 	struct cpu_info *ci2;
    323   1.7     ad 	uint64_t where;
    324   1.7     ad 	xcfunc_t func;
    325   1.3     ad 	int nonline;
    326   1.3     ad 
    327   1.3     ad 	spc = &ci->ci_schedstate;
    328   1.3     ad 
    329   1.3     ad 	KASSERT(mutex_owned(&cpu_lock));
    330   1.3     ad 
    331   1.3     ad 	if (online) {
    332   1.3     ad 		if ((spc->spc_flags & SPCF_OFFLINE) == 0)
    333   1.3     ad 			return 0;
    334   1.7     ad 		func = (xcfunc_t)cpu_xc_online;
    335   1.9     ad 		ncpuonline++;
    336   1.3     ad 	} else {
    337   1.3     ad 		if ((spc->spc_flags & SPCF_OFFLINE) != 0)
    338   1.3     ad 			return 0;
    339   1.3     ad 		nonline = 0;
    340  1.33     ad 		/*
    341  1.33     ad 		 * Ensure that at least one CPU within the processor set
    342  1.33     ad 		 * stays online.  Revisit this later.
    343  1.33     ad 		 */
    344   1.3     ad 		for (CPU_INFO_FOREACH(cii, ci2)) {
    345  1.33     ad 			if ((ci2->ci_schedstate.spc_flags & SPCF_OFFLINE) != 0)
    346  1.33     ad 				continue;
    347  1.33     ad 			if (ci2->ci_schedstate.spc_psid != spc->spc_psid)
    348  1.33     ad 				continue;
    349  1.33     ad 			nonline++;
    350   1.3     ad 		}
    351   1.3     ad 		if (nonline == 1)
    352   1.3     ad 			return EBUSY;
    353   1.7     ad 		func = (xcfunc_t)cpu_xc_offline;
    354   1.9     ad 		ncpuonline--;
    355   1.3     ad 	}
    356   1.3     ad 
    357  1.11  rmind 	where = xc_unicast(0, func, ci, NULL, ci);
    358   1.7     ad 	xc_wait(where);
    359  1.11  rmind 	if (online) {
    360  1.11  rmind 		KASSERT((spc->spc_flags & SPCF_OFFLINE) == 0);
    361  1.37  rmind 	} else if ((spc->spc_flags & SPCF_OFFLINE) == 0) {
    362  1.37  rmind 		/* If was not set offline, then it is busy */
    363  1.37  rmind 		return EBUSY;
    364  1.11  rmind 	}
    365  1.37  rmind 
    366   1.7     ad 	spc->spc_lastmod = time_second;
    367   1.3     ad 	return 0;
    368   1.3     ad }
    369