Home | History | Annotate | Line # | Download | only in acpi
acpi_cpu_md.c revision 1.31
      1  1.31  jruoho /* $NetBSD: acpi_cpu_md.c,v 1.31 2010/08/23 16:20:44 jruoho Exp $ */
      2   1.1  jruoho 
      3   1.1  jruoho /*-
      4   1.1  jruoho  * Copyright (c) 2010 Jukka Ruohonen <jruohonen (at) iki.fi>
      5   1.1  jruoho  * All rights reserved.
      6   1.1  jruoho  *
      7   1.1  jruoho  * Redistribution and use in source and binary forms, with or without
      8   1.1  jruoho  * modification, are permitted provided that the following conditions
      9   1.1  jruoho  * are met:
     10   1.1  jruoho  *
     11   1.1  jruoho  * 1. Redistributions of source code must retain the above copyright
     12   1.1  jruoho  *    notice, this list of conditions and the following disclaimer.
     13   1.1  jruoho  * 2. Redistributions in binary form must reproduce the above copyright
     14   1.1  jruoho  *    notice, this list of conditions and the following disclaimer in the
     15   1.1  jruoho  *    documentation and/or other materials provided with the distribution.
     16   1.1  jruoho  *
     17   1.1  jruoho  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     18   1.1  jruoho  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     19   1.1  jruoho  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     20   1.1  jruoho  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     21   1.1  jruoho  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     22   1.1  jruoho  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     23   1.1  jruoho  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     24   1.1  jruoho  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     25   1.1  jruoho  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     26   1.1  jruoho  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     27   1.1  jruoho  * SUCH DAMAGE.
     28   1.1  jruoho  */
     29   1.1  jruoho #include <sys/cdefs.h>
     30  1.31  jruoho __KERNEL_RCSID(0, "$NetBSD: acpi_cpu_md.c,v 1.31 2010/08/23 16:20:44 jruoho Exp $");
     31   1.1  jruoho 
     32   1.1  jruoho #include <sys/param.h>
     33   1.1  jruoho #include <sys/bus.h>
     34   1.1  jruoho #include <sys/kcore.h>
     35   1.5  jruoho #include <sys/sysctl.h>
     36   1.4  jruoho #include <sys/xcall.h>
     37   1.1  jruoho 
     38   1.1  jruoho #include <x86/cpu.h>
     39   1.5  jruoho #include <x86/cpufunc.h>
     40   1.5  jruoho #include <x86/cputypes.h>
     41   1.1  jruoho #include <x86/cpuvar.h>
     42   1.5  jruoho #include <x86/cpu_msr.h>
     43   1.1  jruoho #include <x86/machdep.h>
     44   1.1  jruoho 
     45   1.1  jruoho #include <dev/acpi/acpica.h>
     46   1.1  jruoho #include <dev/acpi/acpi_cpu.h>
     47   1.1  jruoho 
     48  1.12  jruoho #include <dev/pci/pcivar.h>
     49  1.12  jruoho #include <dev/pci/pcidevs.h>
     50  1.12  jruoho 
     51  1.22  jruoho #define CPUID_INTEL_TSC		__BIT(8)
     52  1.22  jruoho 
     53  1.17  jruoho #define MSR_0FH_CONTROL		0xc0010041 /* Family 0Fh (and K7).  */
     54  1.17  jruoho #define MSR_0FH_STATUS		0xc0010042
     55  1.17  jruoho 
     56  1.17  jruoho #define MSR_10H_LIMIT		0xc0010061 /* Families 10h and 11h. */
     57  1.17  jruoho #define MSR_10H_CONTROL		0xc0010062
     58  1.17  jruoho #define MSR_10H_STATUS		0xc0010063
     59  1.17  jruoho #define MSR_10H_CONFIG		0xc0010064
     60  1.17  jruoho 
     61   1.5  jruoho static char	  native_idle_text[16];
     62   1.5  jruoho void		(*native_idle)(void) = NULL;
     63   1.1  jruoho 
     64  1.12  jruoho static int	 acpicpu_md_quirks_piix4(struct pci_attach_args *);
     65  1.19  jruoho static void	 acpicpu_md_pstate_status(void *, void *);
     66  1.19  jruoho static void	 acpicpu_md_tstate_status(void *, void *);
     67  1.19  jruoho static int	 acpicpu_md_pstate_sysctl_init(void);
     68   1.5  jruoho static int	 acpicpu_md_pstate_sysctl_get(SYSCTLFN_PROTO);
     69   1.5  jruoho static int	 acpicpu_md_pstate_sysctl_set(SYSCTLFN_PROTO);
     70   1.5  jruoho static int	 acpicpu_md_pstate_sysctl_all(SYSCTLFN_PROTO);
     71   1.5  jruoho 
     72   1.5  jruoho extern uint32_t cpus_running;
     73   1.5  jruoho extern struct acpicpu_softc **acpicpu_sc;
     74  1.19  jruoho static struct sysctllog *acpicpu_log = NULL;
     75   1.1  jruoho 
     76   1.1  jruoho uint32_t
     77   1.1  jruoho acpicpu_md_cap(void)
     78   1.1  jruoho {
     79   1.1  jruoho 	struct cpu_info *ci = curcpu();
     80   1.1  jruoho 	uint32_t val = 0;
     81   1.1  jruoho 
     82  1.17  jruoho 	if (cpu_vendor != CPUVENDOR_IDT &&
     83  1.17  jruoho 	    cpu_vendor != CPUVENDOR_INTEL)
     84   1.1  jruoho 		return val;
     85   1.1  jruoho 
     86   1.1  jruoho 	/*
     87   1.1  jruoho 	 * Basic SMP C-states (required for _CST).
     88   1.1  jruoho 	 */
     89   1.1  jruoho 	val |= ACPICPU_PDC_C_C1PT | ACPICPU_PDC_C_C2C3;
     90   1.1  jruoho 
     91   1.1  jruoho         /*
     92   1.1  jruoho 	 * If MONITOR/MWAIT is available, announce
     93   1.1  jruoho 	 * support for native instructions in all C-states.
     94   1.1  jruoho 	 */
     95   1.1  jruoho         if ((ci->ci_feat_val[1] & CPUID2_MONITOR) != 0)
     96   1.1  jruoho 		val |= ACPICPU_PDC_C_C1_FFH | ACPICPU_PDC_C_C2C3_FFH;
     97   1.1  jruoho 
     98   1.5  jruoho 	/*
     99  1.10  jruoho 	 * Set native P- and T-states, if available.
    100   1.5  jruoho 	 */
    101   1.5  jruoho         if ((ci->ci_feat_val[1] & CPUID2_EST) != 0)
    102   1.5  jruoho 		val |= ACPICPU_PDC_P_FFH;
    103   1.5  jruoho 
    104  1.10  jruoho 	if ((ci->ci_feat_val[0] & CPUID_ACPI) != 0)
    105  1.10  jruoho 		val |= ACPICPU_PDC_T_FFH;
    106  1.10  jruoho 
    107   1.1  jruoho 	return val;
    108   1.1  jruoho }
    109   1.1  jruoho 
    110   1.1  jruoho uint32_t
    111   1.1  jruoho acpicpu_md_quirks(void)
    112   1.1  jruoho {
    113   1.1  jruoho 	struct cpu_info *ci = curcpu();
    114  1.12  jruoho 	struct pci_attach_args pa;
    115  1.18  jruoho 	uint32_t family, val = 0;
    116  1.21  jruoho 	uint32_t regs[4];
    117   1.1  jruoho 
    118   1.1  jruoho 	if (acpicpu_md_cpus_running() == 1)
    119   1.1  jruoho 		val |= ACPICPU_FLAG_C_BM;
    120   1.1  jruoho 
    121   1.1  jruoho 	if ((ci->ci_feat_val[1] & CPUID2_MONITOR) != 0)
    122   1.5  jruoho 		val |= ACPICPU_FLAG_C_FFH;
    123   1.1  jruoho 
    124  1.25  jruoho 	val |= ACPICPU_FLAG_C_APIC | ACPICPU_FLAG_C_TSC;
    125  1.22  jruoho 
    126   1.1  jruoho 	switch (cpu_vendor) {
    127   1.1  jruoho 
    128  1.17  jruoho 	case CPUVENDOR_IDT:
    129  1.22  jruoho 
    130  1.22  jruoho 		if ((ci->ci_feat_val[1] & CPUID2_EST) != 0)
    131  1.22  jruoho 			val |= ACPICPU_FLAG_P_FFH;
    132  1.22  jruoho 
    133  1.22  jruoho 		if ((ci->ci_feat_val[0] & CPUID_ACPI) != 0)
    134  1.22  jruoho 			val |= ACPICPU_FLAG_T_FFH;
    135  1.22  jruoho 
    136  1.22  jruoho 		break;
    137  1.22  jruoho 
    138   1.1  jruoho 	case CPUVENDOR_INTEL:
    139  1.17  jruoho 
    140  1.22  jruoho 		val |= ACPICPU_FLAG_C_BM | ACPICPU_FLAG_C_ARB;
    141  1.22  jruoho 
    142   1.5  jruoho 		if ((ci->ci_feat_val[1] & CPUID2_EST) != 0)
    143   1.5  jruoho 			val |= ACPICPU_FLAG_P_FFH;
    144   1.5  jruoho 
    145  1.10  jruoho 		if ((ci->ci_feat_val[0] & CPUID_ACPI) != 0)
    146  1.10  jruoho 			val |= ACPICPU_FLAG_T_FFH;
    147  1.10  jruoho 
    148  1.22  jruoho 		/*
    149  1.25  jruoho 		 * Check whether MSR_APERF, MSR_MPERF, and Turbo
    150  1.25  jruoho 		 * Boost are available. Also see if we might have
    151  1.25  jruoho 		 * an invariant local APIC timer ("ARAT").
    152  1.23  jruoho 		 */
    153  1.23  jruoho 		if (cpuid_level >= 0x06) {
    154  1.23  jruoho 
    155  1.23  jruoho 			x86_cpuid(0x06, regs);
    156  1.23  jruoho 
    157  1.25  jruoho 			if ((regs[2] & __BIT(0)) != 0)		/* ECX.06[0] */
    158  1.23  jruoho 				val |= ACPICPU_FLAG_P_HW;
    159  1.23  jruoho 
    160  1.25  jruoho 			if ((regs[0] & __BIT(1)) != 0)		/* EAX.06[1] */
    161  1.24  jruoho 				val |= ACPICPU_FLAG_P_TURBO;
    162  1.25  jruoho 
    163  1.25  jruoho 			if ((regs[0] & __BIT(2)) != 0)		/* EAX.06[2] */
    164  1.25  jruoho 				val &= ~ACPICPU_FLAG_C_APIC;
    165  1.23  jruoho 		}
    166  1.23  jruoho 
    167  1.23  jruoho 		/*
    168  1.22  jruoho 		 * Detect whether TSC is invariant. If it is not,
    169  1.22  jruoho 		 * we keep the flag to note that TSC will not run
    170  1.22  jruoho 		 * at constant rate. Depending on the CPU, this may
    171  1.22  jruoho 		 * affect P- and T-state changes, but especially
    172  1.22  jruoho 		 * relevant are C-states; with variant TSC, states
    173  1.24  jruoho 		 * larger than C1 may completely stop the counter.
    174  1.22  jruoho 		 */
    175  1.22  jruoho 		x86_cpuid(0x80000000, regs);
    176  1.22  jruoho 
    177  1.22  jruoho 		if (regs[0] >= 0x80000007) {
    178  1.22  jruoho 
    179  1.22  jruoho 			x86_cpuid(0x80000007, regs);
    180  1.22  jruoho 
    181  1.22  jruoho 			if ((regs[3] & CPUID_INTEL_TSC) != 0)
    182  1.22  jruoho 				val &= ~ACPICPU_FLAG_C_TSC;
    183  1.22  jruoho 		}
    184  1.22  jruoho 
    185  1.17  jruoho 		break;
    186  1.12  jruoho 
    187  1.17  jruoho 	case CPUVENDOR_AMD:
    188  1.17  jruoho 
    189  1.18  jruoho 		family = CPUID2FAMILY(ci->ci_signature);
    190  1.18  jruoho 
    191  1.18  jruoho 		if (family == 0xf)
    192  1.18  jruoho 			family += CPUID2EXTFAMILY(ci->ci_signature);
    193  1.18  jruoho 
    194  1.18  jruoho 		switch (family) {
    195   1.1  jruoho 
    196  1.22  jruoho 		case 0x0f:
    197  1.17  jruoho 		case 0x10:
    198  1.17  jruoho 		case 0x11:
    199   1.1  jruoho 
    200  1.21  jruoho 			x86_cpuid(0x80000007, regs);
    201  1.21  jruoho 
    202  1.22  jruoho 			if ((regs[3] & CPUID_APM_TSC) != 0)
    203  1.22  jruoho 				val &= ~ACPICPU_FLAG_C_TSC;
    204  1.22  jruoho 
    205  1.21  jruoho 			if ((regs[3] & CPUID_APM_HWP) != 0)
    206  1.17  jruoho 				val |= ACPICPU_FLAG_P_FFH;
    207  1.21  jruoho 
    208  1.21  jruoho 			if ((regs[3] & CPUID_APM_CPB) != 0)
    209  1.21  jruoho 				val |= ACPICPU_FLAG_P_TURBO;
    210  1.17  jruoho 		}
    211   1.1  jruoho 
    212   1.1  jruoho 		break;
    213   1.1  jruoho 	}
    214   1.1  jruoho 
    215  1.12  jruoho 	/*
    216  1.12  jruoho 	 * There are several erratums for PIIX4.
    217  1.12  jruoho 	 */
    218  1.12  jruoho 	if (pci_find_device(&pa, acpicpu_md_quirks_piix4) != 0)
    219  1.12  jruoho 		val |= ACPICPU_FLAG_PIIX4;
    220  1.12  jruoho 
    221   1.1  jruoho 	return val;
    222   1.1  jruoho }
    223   1.1  jruoho 
    224  1.12  jruoho static int
    225  1.12  jruoho acpicpu_md_quirks_piix4(struct pci_attach_args *pa)
    226  1.12  jruoho {
    227  1.12  jruoho 
    228  1.12  jruoho 	/*
    229  1.12  jruoho 	 * XXX: The pci_find_device(9) function only
    230  1.12  jruoho 	 *	deals with attached devices. Change this
    231  1.12  jruoho 	 *	to use something like pci_device_foreach().
    232  1.12  jruoho 	 */
    233  1.12  jruoho 	if (PCI_VENDOR(pa->pa_id) != PCI_VENDOR_INTEL)
    234  1.12  jruoho 		return 0;
    235  1.12  jruoho 
    236  1.12  jruoho 	if (PCI_PRODUCT(pa->pa_id) == PCI_PRODUCT_INTEL_82371AB_ISA ||
    237  1.12  jruoho 	    PCI_PRODUCT(pa->pa_id) == PCI_PRODUCT_INTEL_82440MX_PMC)
    238  1.12  jruoho 		return 1;
    239  1.12  jruoho 
    240  1.12  jruoho 	return 0;
    241  1.12  jruoho }
    242  1.12  jruoho 
    243   1.1  jruoho uint32_t
    244   1.1  jruoho acpicpu_md_cpus_running(void)
    245   1.1  jruoho {
    246   1.1  jruoho 
    247   1.1  jruoho 	return popcount32(cpus_running);
    248   1.1  jruoho }
    249   1.1  jruoho 
    250   1.1  jruoho int
    251  1.31  jruoho acpicpu_md_idle_start(struct acpicpu_softc *sc)
    252   1.1  jruoho {
    253   1.1  jruoho 	const size_t size = sizeof(native_idle_text);
    254  1.31  jruoho 	struct acpicpu_cstate *cs;
    255  1.31  jruoho 	bool ipi = false;
    256  1.31  jruoho 	int i;
    257   1.1  jruoho 
    258   1.1  jruoho 	x86_cpu_idle_get(&native_idle, native_idle_text, size);
    259  1.31  jruoho 
    260  1.31  jruoho 	for (i = 0; i < ACPI_C_STATE_COUNT; i++) {
    261  1.31  jruoho 
    262  1.31  jruoho 		cs = &sc->sc_cstate[i];
    263  1.31  jruoho 
    264  1.31  jruoho 		if (cs->cs_method == ACPICPU_C_STATE_HALT) {
    265  1.31  jruoho 			ipi = true;
    266  1.31  jruoho 			break;
    267  1.31  jruoho 		}
    268  1.31  jruoho 	}
    269  1.31  jruoho 
    270  1.31  jruoho 	x86_cpu_idle_set(acpicpu_cstate_idle, "acpi", ipi);
    271   1.1  jruoho 
    272   1.1  jruoho 	return 0;
    273   1.1  jruoho }
    274   1.1  jruoho 
    275   1.1  jruoho int
    276   1.1  jruoho acpicpu_md_idle_stop(void)
    277   1.1  jruoho {
    278   1.4  jruoho 	uint64_t xc;
    279  1.31  jruoho 	bool ipi;
    280   1.1  jruoho 
    281  1.31  jruoho 	ipi = (native_idle != x86_cpu_idle_halt) ? false : true;
    282  1.31  jruoho 	x86_cpu_idle_set(native_idle, native_idle_text, ipi);
    283   1.1  jruoho 
    284   1.4  jruoho 	/*
    285   1.4  jruoho 	 * Run a cross-call to ensure that all CPUs are
    286   1.4  jruoho 	 * out from the ACPI idle-loop before detachment.
    287   1.4  jruoho 	 */
    288   1.4  jruoho 	xc = xc_broadcast(0, (xcfunc_t)nullop, NULL, NULL);
    289   1.4  jruoho 	xc_wait(xc);
    290   1.1  jruoho 
    291   1.1  jruoho 	return 0;
    292   1.1  jruoho }
    293   1.1  jruoho 
    294   1.3  jruoho /*
    295  1.31  jruoho  * Called with interrupts disabled.
    296  1.31  jruoho  * Caller should enable interrupts after return.
    297   1.3  jruoho  */
    298   1.1  jruoho void
    299   1.1  jruoho acpicpu_md_idle_enter(int method, int state)
    300   1.1  jruoho {
    301   1.3  jruoho 	struct cpu_info *ci = curcpu();
    302   1.1  jruoho 
    303   1.1  jruoho 	switch (method) {
    304   1.1  jruoho 
    305   1.1  jruoho 	case ACPICPU_C_STATE_FFH:
    306   1.3  jruoho 
    307   1.3  jruoho 		x86_enable_intr();
    308   1.3  jruoho 		x86_monitor(&ci->ci_want_resched, 0, 0);
    309   1.3  jruoho 
    310  1.31  jruoho 		if (__predict_false(ci->ci_want_resched != 0))
    311   1.3  jruoho 			return;
    312   1.3  jruoho 
    313   1.1  jruoho 		x86_mwait((state - 1) << 4, 0);
    314   1.1  jruoho 		break;
    315   1.1  jruoho 
    316   1.1  jruoho 	case ACPICPU_C_STATE_HALT:
    317   1.3  jruoho 
    318  1.31  jruoho 		if (__predict_false(ci->ci_want_resched != 0))
    319   1.3  jruoho 			return;
    320   1.3  jruoho 
    321   1.1  jruoho 		x86_stihlt();
    322   1.1  jruoho 		break;
    323   1.1  jruoho 	}
    324   1.1  jruoho }
    325   1.5  jruoho 
    326   1.5  jruoho int
    327   1.5  jruoho acpicpu_md_pstate_start(void)
    328   1.5  jruoho {
    329  1.20  jruoho 	const uint64_t est = __BIT(16);
    330  1.20  jruoho 	uint64_t val;
    331  1.20  jruoho 
    332  1.20  jruoho 	switch (cpu_vendor) {
    333  1.20  jruoho 
    334  1.20  jruoho 	case CPUVENDOR_IDT:
    335  1.20  jruoho 	case CPUVENDOR_INTEL:
    336  1.20  jruoho 
    337  1.20  jruoho 		val = rdmsr(MSR_MISC_ENABLE);
    338  1.20  jruoho 
    339  1.20  jruoho 		if ((val & est) == 0) {
    340  1.20  jruoho 
    341  1.20  jruoho 			val |= est;
    342  1.20  jruoho 
    343  1.20  jruoho 			wrmsr(MSR_MISC_ENABLE, val);
    344  1.20  jruoho 			val = rdmsr(MSR_MISC_ENABLE);
    345  1.20  jruoho 
    346  1.20  jruoho 			if ((val & est) == 0)
    347  1.20  jruoho 				return ENOTTY;
    348  1.20  jruoho 		}
    349  1.20  jruoho 	}
    350   1.9  jruoho 
    351  1.19  jruoho 	return acpicpu_md_pstate_sysctl_init();
    352   1.5  jruoho }
    353   1.5  jruoho 
    354   1.5  jruoho int
    355   1.5  jruoho acpicpu_md_pstate_stop(void)
    356   1.5  jruoho {
    357   1.5  jruoho 
    358  1.19  jruoho 	if (acpicpu_log != NULL)
    359  1.19  jruoho 		sysctl_teardown(&acpicpu_log);
    360   1.5  jruoho 
    361   1.5  jruoho 	return 0;
    362   1.5  jruoho }
    363   1.5  jruoho 
    364   1.5  jruoho int
    365  1.15  jruoho acpicpu_md_pstate_pss(struct acpicpu_softc *sc)
    366   1.5  jruoho {
    367  1.15  jruoho 	struct acpicpu_pstate *ps, msr;
    368  1.17  jruoho 	struct cpu_info *ci = curcpu();
    369  1.18  jruoho 	uint32_t family, i = 0;
    370  1.13  jruoho 
    371  1.15  jruoho 	(void)memset(&msr, 0, sizeof(struct acpicpu_pstate));
    372  1.13  jruoho 
    373   1.5  jruoho 	switch (cpu_vendor) {
    374   1.5  jruoho 
    375  1.17  jruoho 	case CPUVENDOR_IDT:
    376   1.5  jruoho 	case CPUVENDOR_INTEL:
    377  1.15  jruoho 		msr.ps_control_addr = MSR_PERF_CTL;
    378  1.15  jruoho 		msr.ps_control_mask = __BITS(0, 15);
    379  1.15  jruoho 
    380  1.15  jruoho 		msr.ps_status_addr  = MSR_PERF_STATUS;
    381  1.15  jruoho 		msr.ps_status_mask  = __BITS(0, 15);
    382  1.13  jruoho 		break;
    383  1.13  jruoho 
    384  1.13  jruoho 	case CPUVENDOR_AMD:
    385  1.13  jruoho 
    386  1.18  jruoho 		family = CPUID2FAMILY(ci->ci_signature);
    387  1.18  jruoho 
    388  1.18  jruoho 		if (family == 0xf)
    389  1.18  jruoho 			family += CPUID2EXTFAMILY(ci->ci_signature);
    390  1.18  jruoho 
    391  1.18  jruoho 		switch (family) {
    392  1.17  jruoho 
    393  1.17  jruoho 		case 0x10:
    394  1.17  jruoho 		case 0x11:
    395  1.17  jruoho 			msr.ps_control_addr = MSR_10H_CONTROL;
    396  1.17  jruoho 			msr.ps_control_mask = __BITS(0, 2);
    397  1.17  jruoho 
    398  1.17  jruoho 			msr.ps_status_addr  = MSR_10H_STATUS;
    399  1.17  jruoho 			msr.ps_status_mask  = __BITS(0, 2);
    400  1.17  jruoho 			break;
    401  1.17  jruoho 
    402  1.17  jruoho 		default:
    403  1.17  jruoho 
    404  1.17  jruoho 			if ((sc->sc_flags & ACPICPU_FLAG_P_XPSS) == 0)
    405  1.17  jruoho 				return EOPNOTSUPP;
    406  1.17  jruoho 		}
    407  1.13  jruoho 
    408  1.13  jruoho 		break;
    409  1.13  jruoho 
    410  1.13  jruoho 	default:
    411  1.13  jruoho 		return ENODEV;
    412  1.13  jruoho 	}
    413   1.5  jruoho 
    414  1.26  jruoho 	/*
    415  1.26  jruoho 	 * Fill the P-state structures with MSR addresses that are
    416  1.27  jruoho 	 * known to be correct. If we do not know the addresses,
    417  1.27  jruoho 	 * leave the values intact. If a vendor uses XPSS, we do
    418  1.27  jruoho 	 * not necessary need to do anything to support new CPUs.
    419  1.26  jruoho 	 */
    420  1.15  jruoho 	while (i < sc->sc_pstate_count) {
    421  1.15  jruoho 
    422  1.15  jruoho 		ps = &sc->sc_pstate[i];
    423  1.15  jruoho 
    424  1.27  jruoho 		if (msr.ps_status_addr != 0)
    425  1.15  jruoho 			ps->ps_status_addr = msr.ps_status_addr;
    426  1.15  jruoho 
    427  1.27  jruoho 		if (msr.ps_status_mask != 0)
    428  1.15  jruoho 			ps->ps_status_mask = msr.ps_status_mask;
    429  1.15  jruoho 
    430  1.27  jruoho 		if (msr.ps_control_addr != 0)
    431  1.15  jruoho 			ps->ps_control_addr = msr.ps_control_addr;
    432  1.15  jruoho 
    433  1.27  jruoho 		if (msr.ps_control_mask != 0)
    434  1.15  jruoho 			ps->ps_control_mask = msr.ps_control_mask;
    435  1.15  jruoho 
    436  1.15  jruoho 		i++;
    437  1.15  jruoho 	}
    438  1.15  jruoho 
    439  1.24  jruoho 	/*
    440  1.24  jruoho 	 * When the state is P0 and Turbo Boost has been
    441  1.24  jruoho 	 * detected, we need to skip the status check as
    442  1.24  jruoho 	 * BIOS may not report right comparison values for
    443  1.25  jruoho 	 * the IA32_PERF_STATUS register. Note that this
    444  1.25  jruoho 	 * issue is specific to Intel. For discussion, see:
    445  1.24  jruoho 	 *
    446  1.24  jruoho 	 *	Intel Corporation: Intel Turbo Boost Technology
    447  1.24  jruoho 	 *	in Intel Core(tm) Microarchitectures (Nehalem)
    448  1.24  jruoho 	 *	Based Processors. White Paper, November 2008.
    449  1.24  jruoho 	 */
    450  1.24  jruoho 	if (cpu_vendor != CPUVENDOR_INTEL)
    451  1.24  jruoho 		return 0;
    452  1.24  jruoho 
    453  1.24  jruoho 	if ((sc->sc_flags & ACPICPU_FLAG_P_TURBO) == 0)
    454  1.24  jruoho 		return 0;
    455  1.24  jruoho 
    456  1.24  jruoho 	if (sc->sc_pstate[1].ps_freq + 1 == sc->sc_pstate[0].ps_freq)
    457  1.24  jruoho 		sc->sc_pstate[0].ps_flags |= ACPICPU_FLAG_P_TURBO;
    458  1.24  jruoho 
    459  1.15  jruoho 	return 0;
    460  1.15  jruoho }
    461  1.15  jruoho 
    462  1.15  jruoho int
    463  1.15  jruoho acpicpu_md_pstate_get(struct acpicpu_softc *sc, uint32_t *freq)
    464  1.15  jruoho {
    465  1.15  jruoho 	struct acpicpu_pstate *ps = NULL;
    466  1.15  jruoho 	uint64_t val;
    467  1.15  jruoho 	uint32_t i;
    468  1.15  jruoho 
    469  1.15  jruoho 	for (i = 0; i < sc->sc_pstate_count; i++) {
    470  1.15  jruoho 
    471  1.15  jruoho 		ps = &sc->sc_pstate[i];
    472  1.15  jruoho 
    473  1.15  jruoho 		if (ps->ps_freq != 0)
    474  1.15  jruoho 			break;
    475  1.15  jruoho 	}
    476  1.15  jruoho 
    477  1.15  jruoho 	if (__predict_false(ps == NULL))
    478  1.17  jruoho 		return ENODEV;
    479  1.15  jruoho 
    480  1.28  jruoho 	if (__predict_false(ps->ps_status_addr == 0))
    481  1.13  jruoho 		return EINVAL;
    482   1.5  jruoho 
    483  1.13  jruoho 	val = rdmsr(ps->ps_status_addr);
    484   1.5  jruoho 
    485  1.28  jruoho 	if (__predict_true(ps->ps_status_mask != 0))
    486  1.13  jruoho 		val = val & ps->ps_status_mask;
    487   1.5  jruoho 
    488  1.13  jruoho 	for (i = 0; i < sc->sc_pstate_count; i++) {
    489   1.5  jruoho 
    490  1.13  jruoho 		ps = &sc->sc_pstate[i];
    491   1.5  jruoho 
    492  1.13  jruoho 		if (ps->ps_freq == 0)
    493  1.13  jruoho 			continue;
    494   1.5  jruoho 
    495  1.29  jruoho 		if (val == ps->ps_status) {
    496  1.13  jruoho 			*freq = ps->ps_freq;
    497  1.13  jruoho 			return 0;
    498  1.13  jruoho 		}
    499   1.5  jruoho 	}
    500   1.5  jruoho 
    501  1.13  jruoho 	return EIO;
    502   1.5  jruoho }
    503   1.5  jruoho 
    504   1.5  jruoho int
    505   1.5  jruoho acpicpu_md_pstate_set(struct acpicpu_pstate *ps)
    506   1.5  jruoho {
    507   1.5  jruoho 	struct msr_rw_info msr;
    508  1.14  jruoho 	uint64_t xc;
    509  1.14  jruoho 	int rv = 0;
    510   1.5  jruoho 
    511  1.13  jruoho 	msr.msr_read  = false;
    512  1.13  jruoho 	msr.msr_type  = ps->ps_control_addr;
    513  1.13  jruoho 	msr.msr_value = ps->ps_control;
    514  1.13  jruoho 
    515  1.24  jruoho 	if (__predict_true(ps->ps_control_mask != 0)) {
    516  1.13  jruoho 		msr.msr_mask = ps->ps_control_mask;
    517  1.13  jruoho 		msr.msr_read = true;
    518  1.13  jruoho 	}
    519  1.13  jruoho 
    520   1.5  jruoho 	xc = xc_broadcast(0, (xcfunc_t)x86_msr_xcall, &msr, NULL);
    521   1.5  jruoho 	xc_wait(xc);
    522   1.5  jruoho 
    523  1.29  jruoho 	if (__predict_false(ps->ps_status == 0))
    524  1.30  jruoho 		goto out;
    525  1.29  jruoho 
    526  1.24  jruoho 	if (__predict_false(ps->ps_status_addr == 0))
    527  1.30  jruoho 		goto out;
    528  1.24  jruoho 
    529  1.24  jruoho 	if ((ps->ps_flags & ACPICPU_FLAG_P_TURBO) != 0)
    530  1.30  jruoho 		goto out;
    531  1.13  jruoho 
    532  1.14  jruoho 	xc = xc_broadcast(0, (xcfunc_t)acpicpu_md_pstate_status, ps, &rv);
    533  1.14  jruoho 	xc_wait(xc);
    534  1.14  jruoho 
    535  1.14  jruoho 	return rv;
    536  1.30  jruoho 
    537  1.30  jruoho out:
    538  1.30  jruoho 	DELAY(ps->ps_latency);
    539  1.30  jruoho 
    540  1.30  jruoho 	return 0;
    541  1.14  jruoho }
    542  1.14  jruoho 
    543  1.14  jruoho static void
    544  1.14  jruoho acpicpu_md_pstate_status(void *arg1, void *arg2)
    545  1.14  jruoho {
    546  1.14  jruoho 	struct acpicpu_pstate *ps = arg1;
    547  1.14  jruoho 	uint64_t val;
    548  1.14  jruoho 	int i;
    549  1.14  jruoho 
    550   1.5  jruoho 	for (i = val = 0; i < ACPICPU_P_STATE_RETRY; i++) {
    551   1.5  jruoho 
    552  1.13  jruoho 		val = rdmsr(ps->ps_status_addr);
    553  1.13  jruoho 
    554  1.24  jruoho 		if (__predict_true(ps->ps_status_mask != 0))
    555  1.13  jruoho 			val = val & ps->ps_status_mask;
    556   1.5  jruoho 
    557  1.29  jruoho 		if (val == ps->ps_status)
    558  1.14  jruoho 			return;
    559   1.5  jruoho 
    560   1.5  jruoho 		DELAY(ps->ps_latency);
    561   1.5  jruoho 	}
    562   1.5  jruoho 
    563  1.14  jruoho 	*(uintptr_t *)arg2 = EAGAIN;
    564   1.5  jruoho }
    565  1.10  jruoho 
    566  1.10  jruoho int
    567  1.10  jruoho acpicpu_md_tstate_get(struct acpicpu_softc *sc, uint32_t *percent)
    568  1.10  jruoho {
    569  1.10  jruoho 	struct acpicpu_tstate *ts;
    570  1.14  jruoho 	uint64_t val;
    571  1.10  jruoho 	uint32_t i;
    572  1.10  jruoho 
    573  1.14  jruoho 	val = rdmsr(MSR_THERM_CONTROL);
    574  1.10  jruoho 
    575  1.10  jruoho 	for (i = 0; i < sc->sc_tstate_count; i++) {
    576  1.10  jruoho 
    577  1.10  jruoho 		ts = &sc->sc_tstate[i];
    578  1.10  jruoho 
    579  1.10  jruoho 		if (ts->ts_percent == 0)
    580  1.10  jruoho 			continue;
    581  1.10  jruoho 
    582  1.29  jruoho 		if (val == ts->ts_status) {
    583  1.10  jruoho 			*percent = ts->ts_percent;
    584  1.10  jruoho 			return 0;
    585  1.10  jruoho 		}
    586  1.10  jruoho 	}
    587  1.10  jruoho 
    588  1.10  jruoho 	return EIO;
    589  1.10  jruoho }
    590  1.10  jruoho 
    591  1.10  jruoho int
    592  1.10  jruoho acpicpu_md_tstate_set(struct acpicpu_tstate *ts)
    593  1.10  jruoho {
    594  1.10  jruoho 	struct msr_rw_info msr;
    595  1.14  jruoho 	uint64_t xc;
    596  1.14  jruoho 	int rv = 0;
    597  1.10  jruoho 
    598  1.14  jruoho 	msr.msr_read  = true;
    599  1.14  jruoho 	msr.msr_type  = MSR_THERM_CONTROL;
    600  1.14  jruoho 	msr.msr_value = ts->ts_control;
    601  1.14  jruoho 	msr.msr_mask = __BITS(1, 4);
    602  1.10  jruoho 
    603  1.10  jruoho 	xc = xc_broadcast(0, (xcfunc_t)x86_msr_xcall, &msr, NULL);
    604  1.10  jruoho 	xc_wait(xc);
    605  1.10  jruoho 
    606  1.30  jruoho 	if (ts->ts_status == 0) {
    607  1.30  jruoho 		DELAY(ts->ts_latency);
    608  1.10  jruoho 		return 0;
    609  1.30  jruoho 	}
    610  1.10  jruoho 
    611  1.14  jruoho 	xc = xc_broadcast(0, (xcfunc_t)acpicpu_md_tstate_status, ts, &rv);
    612  1.14  jruoho 	xc_wait(xc);
    613  1.14  jruoho 
    614  1.14  jruoho 	return rv;
    615  1.14  jruoho }
    616  1.14  jruoho 
    617  1.14  jruoho static void
    618  1.14  jruoho acpicpu_md_tstate_status(void *arg1, void *arg2)
    619  1.14  jruoho {
    620  1.14  jruoho 	struct acpicpu_tstate *ts = arg1;
    621  1.14  jruoho 	uint64_t val;
    622  1.14  jruoho 	int i;
    623  1.14  jruoho 
    624  1.10  jruoho 	for (i = val = 0; i < ACPICPU_T_STATE_RETRY; i++) {
    625  1.10  jruoho 
    626  1.14  jruoho 		val = rdmsr(MSR_THERM_CONTROL);
    627  1.10  jruoho 
    628  1.29  jruoho 		if (val == ts->ts_status)
    629  1.14  jruoho 			return;
    630  1.10  jruoho 
    631  1.10  jruoho 		DELAY(ts->ts_latency);
    632  1.10  jruoho 	}
    633  1.10  jruoho 
    634  1.14  jruoho 	*(uintptr_t *)arg2 = EAGAIN;
    635  1.10  jruoho }
    636  1.19  jruoho 
    637  1.19  jruoho /*
    638  1.19  jruoho  * A kludge for backwards compatibility.
    639  1.19  jruoho  */
    640  1.19  jruoho static int
    641  1.19  jruoho acpicpu_md_pstate_sysctl_init(void)
    642  1.19  jruoho {
    643  1.19  jruoho 	const struct sysctlnode	*fnode, *mnode, *rnode;
    644  1.19  jruoho 	const char *str;
    645  1.19  jruoho 	int rv;
    646  1.19  jruoho 
    647  1.19  jruoho 	switch (cpu_vendor) {
    648  1.19  jruoho 
    649  1.19  jruoho 	case CPUVENDOR_IDT:
    650  1.19  jruoho 	case CPUVENDOR_INTEL:
    651  1.19  jruoho 		str = "est";
    652  1.19  jruoho 		break;
    653  1.19  jruoho 
    654  1.19  jruoho 	case CPUVENDOR_AMD:
    655  1.19  jruoho 		str = "powernow";
    656  1.19  jruoho 		break;
    657  1.19  jruoho 
    658  1.19  jruoho 	default:
    659  1.19  jruoho 		return ENODEV;
    660  1.19  jruoho 	}
    661  1.19  jruoho 
    662  1.19  jruoho 
    663  1.19  jruoho 	rv = sysctl_createv(&acpicpu_log, 0, NULL, &rnode,
    664  1.19  jruoho 	    CTLFLAG_PERMANENT, CTLTYPE_NODE, "machdep", NULL,
    665  1.19  jruoho 	    NULL, 0, NULL, 0, CTL_MACHDEP, CTL_EOL);
    666  1.19  jruoho 
    667  1.19  jruoho 	if (rv != 0)
    668  1.19  jruoho 		goto fail;
    669  1.19  jruoho 
    670  1.19  jruoho 	rv = sysctl_createv(&acpicpu_log, 0, &rnode, &mnode,
    671  1.19  jruoho 	    0, CTLTYPE_NODE, str, NULL,
    672  1.19  jruoho 	    NULL, 0, NULL, 0, CTL_CREATE, CTL_EOL);
    673  1.19  jruoho 
    674  1.19  jruoho 	if (rv != 0)
    675  1.19  jruoho 		goto fail;
    676  1.19  jruoho 
    677  1.19  jruoho 	rv = sysctl_createv(&acpicpu_log, 0, &mnode, &fnode,
    678  1.19  jruoho 	    0, CTLTYPE_NODE, "frequency", NULL,
    679  1.19  jruoho 	    NULL, 0, NULL, 0, CTL_CREATE, CTL_EOL);
    680  1.19  jruoho 
    681  1.19  jruoho 	if (rv != 0)
    682  1.19  jruoho 		goto fail;
    683  1.19  jruoho 
    684  1.19  jruoho 	rv = sysctl_createv(&acpicpu_log, 0, &fnode, &rnode,
    685  1.19  jruoho 	    CTLFLAG_READWRITE, CTLTYPE_INT, "target", NULL,
    686  1.19  jruoho 	    acpicpu_md_pstate_sysctl_set, 0, NULL, 0, CTL_CREATE, CTL_EOL);
    687  1.19  jruoho 
    688  1.19  jruoho 	if (rv != 0)
    689  1.19  jruoho 		goto fail;
    690  1.19  jruoho 
    691  1.19  jruoho 	rv = sysctl_createv(&acpicpu_log, 0, &fnode, &rnode,
    692  1.19  jruoho 	    CTLFLAG_READONLY, CTLTYPE_INT, "current", NULL,
    693  1.19  jruoho 	    acpicpu_md_pstate_sysctl_get, 0, NULL, 0, CTL_CREATE, CTL_EOL);
    694  1.19  jruoho 
    695  1.19  jruoho 	if (rv != 0)
    696  1.19  jruoho 		goto fail;
    697  1.19  jruoho 
    698  1.19  jruoho 	rv = sysctl_createv(&acpicpu_log, 0, &fnode, &rnode,
    699  1.19  jruoho 	    CTLFLAG_READONLY, CTLTYPE_STRING, "available", NULL,
    700  1.19  jruoho 	    acpicpu_md_pstate_sysctl_all, 0, NULL, 0, CTL_CREATE, CTL_EOL);
    701  1.19  jruoho 
    702  1.19  jruoho 	if (rv != 0)
    703  1.19  jruoho 		goto fail;
    704  1.19  jruoho 
    705  1.19  jruoho 	return 0;
    706  1.19  jruoho 
    707  1.19  jruoho fail:
    708  1.19  jruoho 	if (acpicpu_log != NULL) {
    709  1.19  jruoho 		sysctl_teardown(&acpicpu_log);
    710  1.19  jruoho 		acpicpu_log = NULL;
    711  1.19  jruoho 	}
    712  1.19  jruoho 
    713  1.19  jruoho 	return rv;
    714  1.19  jruoho }
    715  1.19  jruoho 
    716  1.19  jruoho static int
    717  1.19  jruoho acpicpu_md_pstate_sysctl_get(SYSCTLFN_ARGS)
    718  1.19  jruoho {
    719  1.19  jruoho 	struct cpu_info *ci = curcpu();
    720  1.19  jruoho 	struct acpicpu_softc *sc;
    721  1.19  jruoho 	struct sysctlnode node;
    722  1.19  jruoho 	uint32_t freq;
    723  1.19  jruoho 	int err;
    724  1.19  jruoho 
    725  1.19  jruoho 	sc = acpicpu_sc[ci->ci_acpiid];
    726  1.19  jruoho 
    727  1.19  jruoho 	if (sc == NULL)
    728  1.19  jruoho 		return ENXIO;
    729  1.19  jruoho 
    730  1.19  jruoho 	err = acpicpu_pstate_get(sc, &freq);
    731  1.19  jruoho 
    732  1.19  jruoho 	if (err != 0)
    733  1.19  jruoho 		return err;
    734  1.19  jruoho 
    735  1.19  jruoho 	node = *rnode;
    736  1.19  jruoho 	node.sysctl_data = &freq;
    737  1.19  jruoho 
    738  1.19  jruoho 	err = sysctl_lookup(SYSCTLFN_CALL(&node));
    739  1.19  jruoho 
    740  1.19  jruoho 	if (err != 0 || newp == NULL)
    741  1.19  jruoho 		return err;
    742  1.19  jruoho 
    743  1.19  jruoho 	return 0;
    744  1.19  jruoho }
    745  1.19  jruoho 
    746  1.19  jruoho static int
    747  1.19  jruoho acpicpu_md_pstate_sysctl_set(SYSCTLFN_ARGS)
    748  1.19  jruoho {
    749  1.19  jruoho 	struct cpu_info *ci = curcpu();
    750  1.19  jruoho 	struct acpicpu_softc *sc;
    751  1.19  jruoho 	struct sysctlnode node;
    752  1.19  jruoho 	uint32_t freq;
    753  1.19  jruoho 	int err;
    754  1.19  jruoho 
    755  1.19  jruoho 	sc = acpicpu_sc[ci->ci_acpiid];
    756  1.19  jruoho 
    757  1.19  jruoho 	if (sc == NULL)
    758  1.19  jruoho 		return ENXIO;
    759  1.19  jruoho 
    760  1.19  jruoho 	err = acpicpu_pstate_get(sc, &freq);
    761  1.19  jruoho 
    762  1.19  jruoho 	if (err != 0)
    763  1.19  jruoho 		return err;
    764  1.19  jruoho 
    765  1.19  jruoho 	node = *rnode;
    766  1.19  jruoho 	node.sysctl_data = &freq;
    767  1.19  jruoho 
    768  1.19  jruoho 	err = sysctl_lookup(SYSCTLFN_CALL(&node));
    769  1.19  jruoho 
    770  1.19  jruoho 	if (err != 0 || newp == NULL)
    771  1.19  jruoho 		return err;
    772  1.19  jruoho 
    773  1.19  jruoho 	err = acpicpu_pstate_set(sc, freq);
    774  1.19  jruoho 
    775  1.19  jruoho 	if (err != 0)
    776  1.19  jruoho 		return err;
    777  1.19  jruoho 
    778  1.19  jruoho 	return 0;
    779  1.19  jruoho }
    780  1.19  jruoho 
    781  1.19  jruoho static int
    782  1.19  jruoho acpicpu_md_pstate_sysctl_all(SYSCTLFN_ARGS)
    783  1.19  jruoho {
    784  1.19  jruoho 	struct cpu_info *ci = curcpu();
    785  1.19  jruoho 	struct acpicpu_softc *sc;
    786  1.19  jruoho 	struct sysctlnode node;
    787  1.19  jruoho 	char buf[1024];
    788  1.19  jruoho 	size_t len;
    789  1.19  jruoho 	uint32_t i;
    790  1.19  jruoho 	int err;
    791  1.19  jruoho 
    792  1.19  jruoho 	sc = acpicpu_sc[ci->ci_acpiid];
    793  1.19  jruoho 
    794  1.19  jruoho 	if (sc == NULL)
    795  1.19  jruoho 		return ENXIO;
    796  1.19  jruoho 
    797  1.19  jruoho 	(void)memset(&buf, 0, sizeof(buf));
    798  1.19  jruoho 
    799  1.19  jruoho 	mutex_enter(&sc->sc_mtx);
    800  1.19  jruoho 
    801  1.19  jruoho 	for (len = 0, i = sc->sc_pstate_max; i < sc->sc_pstate_count; i++) {
    802  1.19  jruoho 
    803  1.19  jruoho 		if (sc->sc_pstate[i].ps_freq == 0)
    804  1.19  jruoho 			continue;
    805  1.19  jruoho 
    806  1.19  jruoho 		len += snprintf(buf + len, sizeof(buf) - len, "%u%s",
    807  1.19  jruoho 		    sc->sc_pstate[i].ps_freq,
    808  1.19  jruoho 		    i < (sc->sc_pstate_count - 1) ? " " : "");
    809  1.19  jruoho 	}
    810  1.19  jruoho 
    811  1.19  jruoho 	mutex_exit(&sc->sc_mtx);
    812  1.19  jruoho 
    813  1.19  jruoho 	node = *rnode;
    814  1.19  jruoho 	node.sysctl_data = buf;
    815  1.19  jruoho 
    816  1.19  jruoho 	err = sysctl_lookup(SYSCTLFN_CALL(&node));
    817  1.19  jruoho 
    818  1.19  jruoho 	if (err != 0 || newp == NULL)
    819  1.19  jruoho 		return err;
    820  1.19  jruoho 
    821  1.19  jruoho 	return 0;
    822  1.19  jruoho }
    823  1.19  jruoho 
    824