Home | History | Annotate | Line # | Download | only in include
cpufunc.h revision 1.16
      1  1.16      fvdl /*	$NetBSD: cpufunc.h,v 1.16 2007/05/11 14:01:46 fvdl Exp $	*/
      2   1.1      fvdl 
      3   1.1      fvdl /*-
      4   1.1      fvdl  * Copyright (c) 1998 The NetBSD Foundation, Inc.
      5   1.1      fvdl  * All rights reserved.
      6   1.1      fvdl  *
      7   1.1      fvdl  * This code is derived from software contributed to The NetBSD Foundation
      8   1.1      fvdl  * by Charles M. Hannum.
      9   1.1      fvdl  *
     10   1.1      fvdl  * Redistribution and use in source and binary forms, with or without
     11   1.1      fvdl  * modification, are permitted provided that the following conditions
     12   1.1      fvdl  * are met:
     13   1.1      fvdl  * 1. Redistributions of source code must retain the above copyright
     14   1.1      fvdl  *    notice, this list of conditions and the following disclaimer.
     15   1.1      fvdl  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1      fvdl  *    notice, this list of conditions and the following disclaimer in the
     17   1.1      fvdl  *    documentation and/or other materials provided with the distribution.
     18   1.1      fvdl  * 3. All advertising materials mentioning features or use of this software
     19   1.1      fvdl  *    must display the following acknowledgement:
     20   1.1      fvdl  *        This product includes software developed by the NetBSD
     21   1.1      fvdl  *        Foundation, Inc. and its contributors.
     22   1.1      fvdl  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23   1.1      fvdl  *    contributors may be used to endorse or promote products derived
     24   1.1      fvdl  *    from this software without specific prior written permission.
     25   1.1      fvdl  *
     26   1.1      fvdl  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27   1.1      fvdl  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28   1.1      fvdl  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29   1.1      fvdl  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30   1.1      fvdl  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31   1.1      fvdl  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32   1.1      fvdl  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33   1.1      fvdl  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34   1.1      fvdl  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35   1.1      fvdl  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36   1.1      fvdl  * POSSIBILITY OF SUCH DAMAGE.
     37   1.1      fvdl  */
     38   1.1      fvdl 
     39   1.1      fvdl #ifndef _AMD64_CPUFUNC_H_
     40   1.1      fvdl #define	_AMD64_CPUFUNC_H_
     41   1.1      fvdl 
     42   1.1      fvdl /*
     43   1.1      fvdl  * Functions to provide access to amd64-specific instructions.
     44   1.1      fvdl  */
     45   1.1      fvdl 
     46   1.1      fvdl #include <sys/cdefs.h>
     47   1.1      fvdl #include <sys/types.h>
     48   1.1      fvdl 
     49   1.8       dsl #include <machine/segments.h>
     50   1.1      fvdl #include <machine/specialreg.h>
     51   1.1      fvdl 
     52  1.13        ad #ifdef _KERNEL
     53  1.12        ad void	x86_pause(void);
     54  1.13        ad #else
     55  1.13        ad static __inline void
     56  1.13        ad x86_pause(void)
     57  1.13        ad {
     58  1.13        ad 	__asm volatile("pause");
     59  1.13        ad }
     60  1.13        ad #endif
     61   1.3      fvdl 
     62   1.9        ad /*
     63   1.9        ad  * XXX if lfence isn't available...
     64   1.9        ad  *
     65   1.9        ad  * memory clobber to avoid compiler reordering.
     66   1.9        ad  */
     67   1.7     perry static __inline void
     68   1.4      yamt x86_lfence(void)
     69   1.4      yamt {
     70   1.4      yamt 
     71   1.6     perry 	__asm volatile("lfence" : : : "memory");
     72   1.4      yamt }
     73   1.4      yamt 
/*
 * x86_sfence: store fence.  The "memory" clobber also makes the
 * statement a compiler-level barrier.
 */
static __inline void
x86_sfence(void)
{

	__asm volatile(
	    "sfence"
	    : /* no outputs */
	    : /* no inputs */
	    : "memory");
}
     80   1.9        ad 
/*
 * x86_mfence: full memory fence.  The "memory" clobber also makes the
 * statement a compiler-level barrier.
 */
static __inline void
x86_mfence(void)
{

	__asm volatile(
	    "mfence"
	    : /* no outputs */
	    : /* no inputs */
	    : "memory");
}
     87   1.9        ad 
     88   1.1      fvdl #ifdef _KERNEL
     89   1.1      fvdl 
/* Kernel-only routines; their definitions are not part of this header. */
void	x86_flush(void);
void	x86_patch(void);

/* CPU feature bits; tested against CPUID_* flags (see tlbflushg()). */
extern int cpu_feature;

     94   1.2      fvdl 
/*
 * invlpg: invalidate the TLB entry for the page containing `addr'.
 * The "memory" clobber makes the statement a compiler barrier as well.
 */
static __inline void
invlpg(u_int64_t addr)
{

	__asm volatile(
	    "invlpg (%0)"
	    : /* no outputs */
	    : "r" (addr)
	    : "memory");
}
    100  1.16      fvdl 
    101  1.16      fvdl static __inline void
    102  1.16      fvdl lgs(u_short sel)
    103  1.16      fvdl {
    104  1.16      fvdl 	__asm volatile("cli");
    105  1.16      fvdl 	__asm volatile("swapgs");
    106  1.16      fvdl 	__asm volatile("movw %0, %%gs" : : "r" (sel));
    107  1.16      fvdl 	__asm volatile("mfence");
    108  1.16      fvdl 	__asm volatile("swapgs");
    109  1.16      fvdl 	__asm volatile("sti");
    110  1.16      fvdl }
    111   1.1      fvdl 
/*
 * lidt: execute "lidt" with the descriptor `region' points to as its
 * memory operand.
 */
static __inline void
lidt(struct region_descriptor *region)
{

	__asm volatile(
	    "lidt %0"
	    : /* no outputs */
	    : "m" (*region));
}
    117   1.1      fvdl 
    118   1.7     perry static __inline void
    119   1.1      fvdl lldt(u_short sel)
    120   1.1      fvdl {
    121   1.6     perry 	__asm volatile("lldt %0" : : "r" (sel));
    122   1.1      fvdl }
    123   1.1      fvdl 
    124   1.7     perry static __inline void
    125   1.1      fvdl ltr(u_short sel)
    126   1.1      fvdl {
    127   1.6     perry 	__asm volatile("ltr %0" : : "r" (sel));
    128   1.1      fvdl }
    129   1.1      fvdl 
    130   1.7     perry static __inline void
    131   1.1      fvdl lcr8(u_int val)
    132   1.1      fvdl {
    133   1.1      fvdl 	u_int64_t val64 = val;
    134   1.6     perry 	__asm volatile("movq %0,%%cr8" : : "r" (val64));
    135   1.1      fvdl }
    136   1.1      fvdl 
    137   1.1      fvdl /*
    138   1.1      fvdl  * Upper 32 bits are reserved anyway, so just keep this 32bits.
    139   1.1      fvdl  */
    140   1.7     perry static __inline void
    141   1.1      fvdl lcr0(u_int val)
    142   1.1      fvdl {
    143   1.1      fvdl 	u_int64_t val64 = val;
    144   1.6     perry 	__asm volatile("movq %0,%%cr0" : : "r" (val64));
    145   1.1      fvdl }
    146   1.1      fvdl 
    147   1.7     perry static __inline u_int
    148   1.1      fvdl rcr0(void)
    149   1.1      fvdl {
    150   1.1      fvdl 	u_int64_t val64;
    151   1.1      fvdl 	u_int val;
    152   1.6     perry 	__asm volatile("movq %%cr0,%0" : "=r" (val64));
    153   1.1      fvdl 	val = val64;
    154   1.1      fvdl 	return val;
    155   1.1      fvdl }
    156   1.1      fvdl 
/*
 * rcr2: return the full 64-bit contents of %cr2.
 */
static __inline u_int64_t
rcr2(void)
{
	u_int64_t cr2;

	__asm volatile(
	    "movq %%cr2,%0"
	    : "=r" (cr2));

	return cr2;
}
    164   1.1      fvdl 
/*
 * lcr3: write `val' to %cr3.
 *
 * The "memory" clobber makes the statement a compiler barrier, so
 * memory accesses issued before the call (e.g. page-table updates)
 * cannot be moved after the register write, and accesses issued after
 * it cannot be hoisted in front of it.
 */
static __inline void
lcr3(u_int64_t val)
{

	__asm volatile(
	    "movq %0,%%cr3"
	    : /* no outputs */
	    : "r" (val)
	    : "memory");
}
    170   1.1      fvdl 
/*
 * rcr3: return the full 64-bit contents of %cr3.
 */
static __inline u_int64_t
rcr3(void)
{
	u_int64_t cr3;

	__asm volatile(
	    "movq %%cr3,%0"
	    : "=r" (cr3));

	return cr3;
}
    178   1.1      fvdl 
    179   1.1      fvdl /*
    180   1.1      fvdl  * Same as for cr0. Don't touch upper 32 bits.
    181   1.1      fvdl  */
    182   1.7     perry static __inline void
    183   1.1      fvdl lcr4(u_int val)
    184   1.1      fvdl {
    185   1.1      fvdl 	u_int64_t val64 = val;
    186   1.1      fvdl 
    187   1.6     perry 	__asm volatile("movq %0,%%cr4" : : "r" (val64));
    188   1.1      fvdl }
    189   1.1      fvdl 
    190   1.7     perry static __inline u_int
    191   1.1      fvdl rcr4(void)
    192   1.1      fvdl {
    193   1.1      fvdl 	u_int val;
    194   1.1      fvdl 	u_int64_t val64;
    195   1.6     perry 	__asm volatile("movq %%cr4,%0" : "=r" (val64));
    196   1.1      fvdl 	val = val64;
    197   1.1      fvdl 	return val;
    198   1.1      fvdl }
    199   1.1      fvdl 
/*
 * tlbflush: flush the TLB by reloading %cr3 with its current value.
 * (Entries from PTEs with the G bit set need tlbflushg().)
 *
 * The write carries a "memory" clobber so that it acts as a compiler
 * barrier: memory accesses made before the flush (such as page-table
 * stores) cannot be moved after it, nor later accesses in front of it.
 */
static __inline void
tlbflush(void)
{
	u_int64_t cr3;

	__asm volatile("movq %%cr3,%0" : "=r" (cr3));
	__asm volatile("movq %0,%%cr3" : : "r" (cr3) : "memory");
}
    207   1.1      fvdl 
    208   1.7     perry static __inline void
    209   1.1      fvdl tlbflushg(void)
    210   1.1      fvdl {
    211   1.1      fvdl 	/*
    212   1.1      fvdl 	 * Big hammer: flush all TLB entries, including ones from PTE's
    213   1.1      fvdl 	 * with the G bit set.  This should only be necessary if TLB
    214   1.1      fvdl 	 * shootdown falls far behind.
    215   1.1      fvdl 	 *
    216   1.1      fvdl 	 * Intel Architecture Software Developer's Manual, Volume 3,
    217   1.1      fvdl 	 *	System Programming, section 9.10, "Invalidating the
    218   1.1      fvdl 	 * Translation Lookaside Buffers (TLBS)":
    219   1.1      fvdl 	 * "The following operations invalidate all TLB entries, irrespective
    220   1.1      fvdl 	 * of the setting of the G flag:
    221   1.1      fvdl 	 * ...
    222   1.1      fvdl 	 * "(P6 family processors only): Writing to control register CR4 to
    223   1.1      fvdl 	 * modify the PSE, PGE, or PAE flag."
    224   1.1      fvdl 	 *
    225   1.1      fvdl 	 * (the alternatives not quoted above are not an option here.)
    226   1.1      fvdl 	 *
    227   1.1      fvdl 	 * If PGE is not in use, we reload CR3 for the benefit of
    228   1.1      fvdl 	 * pre-P6-family processors.
    229   1.1      fvdl 	 */
    230   1.1      fvdl 
    231   1.1      fvdl 	if (cpu_feature & CPUID_PGE) {
    232   1.1      fvdl 		u_int cr4 = rcr4();
    233   1.1      fvdl 		lcr4(cr4 & ~CR4_PGE);
    234   1.1      fvdl 		lcr4(cr4);
    235   1.1      fvdl 	} else
    236   1.1      fvdl 		tlbflush();
    237   1.1      fvdl }
    238   1.1      fvdl 
#ifdef notyet
/* Not enabled yet; the type of `func' is still to be settled (XXX). */
void	setidt(int idx, /*XXX*/ void *func, int typ, int dpl);
#endif
    242   1.1      fvdl 
    243   1.1      fvdl 
    244   1.1      fvdl /* XXXX ought to be in psl.h with spl() functions */
    245   1.1      fvdl 
/*
 * disable_intr: mask interrupts on the current CPU ("cli").
 *
 * The "memory" clobber makes the statement a compiler barrier, so
 * memory accesses that belong to the interrupt-masked region cannot be
 * hoisted in front of the cli.
 */
static __inline void
disable_intr(void)
{

	__asm volatile(
	    "cli"
	    : /* no outputs */
	    : /* no inputs */
	    : "memory");
}
    251   1.1      fvdl 
/*
 * enable_intr: unmask interrupts on the current CPU ("sti").
 *
 * The "memory" clobber makes the statement a compiler barrier, so
 * memory accesses that belong to the interrupt-masked region cannot be
 * sunk past the sti.
 */
static __inline void
enable_intr(void)
{

	__asm volatile(
	    "sti"
	    : /* no outputs */
	    : /* no inputs */
	    : "memory");
}
    257   1.1      fvdl 
    258   1.7     perry static __inline u_long
    259   1.1      fvdl read_rflags(void)
    260   1.1      fvdl {
    261   1.1      fvdl 	u_long	ef;
    262   1.1      fvdl 
    263   1.6     perry 	__asm volatile("pushfq; popq %0" : "=r" (ef));
    264   1.1      fvdl 	return (ef);
    265   1.1      fvdl }
    266   1.1      fvdl 
    267   1.7     perry static __inline void
    268   1.1      fvdl write_rflags(u_long ef)
    269   1.1      fvdl {
    270   1.6     perry 	__asm volatile("pushq %0; popfq" : : "r" (ef));
    271   1.1      fvdl }
    272   1.1      fvdl 
    273  1.10        ad 
    274   1.7     perry static __inline u_int64_t
    275   1.1      fvdl rdmsr(u_int msr)
    276   1.1      fvdl {
    277   1.1      fvdl 	uint32_t hi, lo;
    278   1.6     perry 	__asm volatile("rdmsr" : "=d" (hi), "=a" (lo) : "c" (msr));
    279   1.1      fvdl 	return (((uint64_t)hi << 32) | (uint64_t) lo);
    280   1.1      fvdl }
    281   1.1      fvdl 
    282   1.7     perry static __inline void
    283   1.1      fvdl wrmsr(u_int msr, u_int64_t newval)
    284   1.1      fvdl {
    285   1.6     perry 	__asm volatile("wrmsr" :
    286   1.1      fvdl 	    : "a" (newval & 0xffffffff), "d" (newval >> 32), "c" (msr));
    287   1.1      fvdl }
    288   1.1      fvdl 
/*
 * A number of undocumented AMD64 MSRs can only be accessed when a
 * 'passcode' is supplied along with the request; rdmsr_locked() and
 * wrmsr_locked() take it as their `code' argument.
 *
 * See LinuxBIOSv2: src/cpu/amd/model_fxx/model_fxx_init.c
 */

#define	OPTERON_MSR_PASSCODE	0x9c5a203a
    296  1.10        ad 
    297  1.10        ad static __inline u_int64_t
    298  1.10        ad rdmsr_locked(u_int msr, u_int code)
    299  1.10        ad {
    300  1.10        ad 	uint32_t hi, lo;
    301  1.10        ad 	__asm volatile("rdmsr"
    302  1.10        ad 	    : "=d" (hi), "=a" (lo)
    303  1.10        ad 	    : "c" (msr), "D" (code));
    304  1.10        ad 	return (((uint64_t)hi << 32) | (uint64_t) lo);
    305  1.10        ad }
    306  1.10        ad 
    307  1.10        ad static __inline void
    308  1.10        ad wrmsr_locked(u_int msr, u_int code, u_int64_t newval)
    309  1.10        ad {
    310  1.10        ad 	__asm volatile("wrmsr"
    311  1.10        ad 	    :
    312  1.10        ad 	    : "a" (newval & 0xffffffff), "d" (newval >> 32), "c" (msr),
    313  1.10        ad 	      "D" (code));
    314  1.10        ad }
    315  1.10        ad 
/*
 * wbinvd: execute the "wbinvd" instruction (write back and invalidate
 * the caches).
 */
static __inline void
wbinvd(void)
{

	__asm volatile(
	    "wbinvd"
	    );
}
    321   1.1      fvdl 
/*
 * rdtsc: return the current value of the time-stamp counter.
 *
 * The instruction delivers the counter in %edx (high half) and %eax
 * (low half); both are combined into one 64-bit result.
 */
static __inline u_int64_t
rdtsc(void)
{
	uint32_t low, high;

	__asm volatile(
	    "rdtsc"
	    : "=d" (high), "=a" (low));

	return ((uint64_t)high << 32) | (uint64_t)low;
}
    330   1.1      fvdl 
    331   1.7     perry static __inline u_int64_t
    332   1.1      fvdl rdpmc(u_int pmc)
    333   1.1      fvdl {
    334   1.1      fvdl 	uint32_t hi, lo;
    335   1.1      fvdl 
    336   1.6     perry 	__asm volatile("rdpmc" : "=d" (hi), "=a" (lo) : "c" (pmc));
    337   1.1      fvdl 	return (((uint64_t)hi << 32) | (uint64_t) lo);
    338   1.1      fvdl }
    339   1.1      fvdl 
/*
 * breakpoint: break into DDB/KGDB by raising the breakpoint trap
 * ("int $3").
 */
static __inline void
breakpoint(void)
{

	__asm volatile(
	    "int $3"
	    );
}
    346   1.1      fvdl 
/* PSL-named aliases for the RFLAGS accessors. */
#define	read_psl()	read_rflags()
#define	write_psl(x)	write_rflags(x)
    349   1.1      fvdl 
    350   1.1      fvdl #endif /* _KERNEL */
    351   1.1      fvdl 
    352   1.1      fvdl #endif /* !_AMD64_CPUFUNC_H_ */
    353