Home | History | Annotate | Line # | Download | only in include
ctlreg.h revision 1.24
      1 /*	$NetBSD: ctlreg.h,v 1.24 2000/12/04 20:14:05 fvdl Exp $ */
      2 
      3 /*
      4  * Copyright (c) 1996-1999 Eduardo Horvath
      5  *
      6  * Redistribution and use in source and binary forms, with or without
      7  * modification, are permitted provided that the following conditions
      8  * are met:
      9  * 1. Redistributions of source code must retain the above copyright
     10  *    notice, this list of conditions and the following disclaimer.
     11  *
     12  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR  ``AS IS'' AND
     13  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     14  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     15  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR  BE LIABLE
     16  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     17  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     18  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     19  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     20  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     21  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     22  * SUCH DAMAGE.
     23  *
     24  */
     25 
     26 /*
     27  * Sun 4u control registers. (includes address space definitions
     28  * and some registers in control space).
     29  */
     30 
     31 /*
     32  * The Alternate address spaces.
     33  *
     34  * 0x00-0x7f are privileged
     35  * 0x80-0xff can be used by users
     36  */
     37 
/*
 * Address Space Identifier (ASI) values.
 *
 * For every big-endian/little-endian pair defined below, the little-endian
 * ASI is the big-endian one with ASI_LITTLE OR-ed in
 * (e.g. ASI_NUCLEUS | ASI_LITTLE == ASI_NUCLEUS_LITTLE).
 */
#define ASI_LITTLE	0x08		/* This bit should make an ASI little endian */

#define ASI_NUCLEUS			0x04	/* [4u] kernel address space */
#define ASI_NUCLEUS_LITTLE		0x0c	/* [4u] kernel address space, little endian */

#define ASI_AS_IF_USER_PRIMARY		0x10	/* [4u] primary user address space */
#define ASI_AS_IF_USER_SECONDARY	0x11	/* [4u] secondary user address space */

#define ASI_PHYS_CACHED			0x14	/* [4u] MMU bypass to main memory */
#define ASI_PHYS_NON_CACHED		0x15	/* [4u] MMU bypass to I/O location */

#define ASI_AS_IF_USER_PRIMARY_LITTLE	0x18	/* [4u] primary user address space, little endian  */
#define ASI_AS_IF_USER_SECONDARY_LITTLE	0x19	/* [4u] secondary user address space, little endian  */
/* Historical misspelling, kept so existing users of the old name still build. */
#define ASI_AS_IF_USER_SECONDARY_LITTIE	ASI_AS_IF_USER_SECONDARY_LITTLE

#define ASI_PHYS_CACHED_LITTLE		0x1c	/* [4u] MMU bypass to main memory, little endian */
#define ASI_PHYS_NON_CACHED_LITTLE	0x1d	/* [4u] MMU bypass to I/O location, little endian */

#define ASI_NUCLEUS_QUAD_LDD		0x24	/* [4u] use w/LDDA to load 128-bit item */
#define ASI_NUCLEUS_QUAD_LDD_LITTLE	0x2c	/* [4u] use w/LDDA to load 128-bit item, little endian */

#define ASI_FLUSH_D_PAGE_PRIMARY	0x38	/* [4u] flush D-cache page using primary context */
#define ASI_FLUSH_D_PAGE_SECONDARY	0x39	/* [4u] flush D-cache page using secondary context */
#define ASI_FLUSH_D_CTX_PRIMARY		0x3a	/* [4u] flush D-cache context using primary context */
#define ASI_FLUSH_D_CTX_SECONDARY	0x3b	/* [4u] flush D-cache context using secondary context */

#define ASI_LSU_CONTROL_REGISTER	0x45	/* [4u] load/store unit control register */

#define ASI_DCACHE_DATA			0x46	/* [4u] diagnostic access to D-cache data RAM */
#define ASI_DCACHE_TAG			0x47	/* [4u] diagnostic access to D-cache tag RAM */

#define ASI_INTR_DISPATCH_STATUS	0x48	/* [4u] interrupt dispatch status register */
#define ASI_INTR_RECEIVE		0x49	/* [4u] interrupt receive status register */
#define ASI_MID_REG			0x4a	/* [4u] hardware config and MID */
#define ASI_ERROR_EN_REG		0x4b	/* [4u] asynchronous error enables */
#define ASI_AFSR			0x4c	/* [4u] asynchronous fault status register */
#define ASI_AFAR			0x4d	/* [4u] asynchronous fault address register */

#define ASI_ICACHE_DATA			0x66	/* [4u] diagnostic access to I-cache data RAM */
#define ASI_ICACHE_TAG			0x67	/* [4u] diagnostic access to I-cache tag RAM */
#define ASI_FLUSH_I_PAGE_PRIMARY	0x68	/* [4u] flush I-cache page using primary context */
#define ASI_FLUSH_I_PAGE_SECONDARY	0x69	/* [4u] flush I-cache page using secondary context */
#define ASI_FLUSH_I_CTX_PRIMARY		0x6a	/* [4u] flush I-cache context using primary context */
#define ASI_FLUSH_I_CTX_SECONDARY	0x6b	/* [4u] flush I-cache context using secondary context */

#define ASI_BLOCK_AS_IF_USER_PRIMARY	0x70	/* [4u] primary user address space, block loads/stores */
#define ASI_BLOCK_AS_IF_USER_SECONDARY	0x71	/* [4u] secondary user address space, block loads/stores */

#define ASI_ECACHE_DIAG			0x76	/* [4u] diag access to E-cache tag and data */
#define ASI_DATAPATH_ERR_REG_WRITE	0x77	/* [4u] ASI is reused */

#define ASI_BLOCK_AS_IF_USER_PRIMARY_LITTLE	0x78	/* [4u] primary user address space, block loads/stores, little endian */
#define ASI_BLOCK_AS_IF_USER_SECONDARY_LITTLE	0x79	/* [4u] secondary user address space, block loads/stores, little endian */

#define ASI_INTERRUPT_RECEIVE_DATA	0x7f	/* [4u] interrupt receive data registers {0,1,2} */
#define ASI_DATAPATH_ERR_REG_READ	0x7f	/* [4u] read access to datapath error registers (ASI reused) */

#define ASI_PRIMARY			0x80	/* [4u] primary address space */
#define ASI_SECONDARY			0x81	/* [4u] secondary address space */
#define ASI_PRIMARY_NO_FAULT		0x82	/* [4u] primary address space, no fault */
#define ASI_SECONDARY_NO_FAULT		0x83	/* [4u] secondary address space, no fault */

#define ASI_PRIMARY_LITTLE		0x88	/* [4u] primary address space, little endian */
#define ASI_SECONDARY_LITTLE		0x89	/* [4u] secondary address space, little endian */
#define ASI_PRIMARY_NO_FAULT_LITTLE	0x8a	/* [4u] primary address space, no fault, little endian */
#define ASI_SECONDARY_NO_FAULT_LITTLE	0x8b	/* [4u] secondary address space, no fault, little endian */

#define ASI_PST8_PRIMARY		0xc0	/* [VIS] Eight 8-bit partial store, primary */
#define ASI_PST8_SECONDARY		0xc1	/* [VIS] Eight 8-bit partial store, secondary */
#define ASI_PST16_PRIMARY		0xc2	/* [VIS] Four 16-bit partial store, primary */
#define ASI_PST16_SECONDARY		0xc3	/* [VIS] Four 16-bit partial store, secondary */
#define ASI_PST32_PRIMARY		0xc4	/* [VIS] Two 32-bit partial store, primary */
#define ASI_PST32_SECONDARY		0xc5	/* [VIS] Two 32-bit partial store, secondary */

#define ASI_PST8_PRIMARY_LITTLE		0xc8	/* [VIS] Eight 8-bit partial store, primary, little endian */
#define ASI_PST8_SECONDARY_LITTLE	0xc9	/* [VIS] Eight 8-bit partial store, secondary, little endian */
#define ASI_PST16_PRIMARY_LITTLE	0xca	/* [VIS] Four 16-bit partial store, primary, little endian */
#define ASI_PST16_SECONDARY_LITTLE	0xcb	/* [VIS] Four 16-bit partial store, secondary, little endian */
#define ASI_PST32_PRIMARY_LITTLE	0xcc	/* [VIS] Two 32-bit partial store, primary, little endian */
#define ASI_PST32_SECONDARY_LITTLE	0xcd	/* [VIS] Two 32-bit partial store, secondary, little endian */

#define ASI_FL8_PRIMARY			0xd0	/* [VIS] One 8-bit load/store floating, primary */
#define ASI_FL8_SECONDARY		0xd1	/* [VIS] One 8-bit load/store floating, secondary */
#define ASI_FL16_PRIMARY		0xd2	/* [VIS] One 16-bit load/store floating, primary */
#define ASI_FL16_SECONDARY		0xd3	/* [VIS] One 16-bit load/store floating, secondary */

#define ASI_FL8_PRIMARY_LITTLE		0xd8	/* [VIS] One 8-bit load/store floating, primary, little endian */
#define ASI_FL8_SECONDARY_LITTLE	0xd9	/* [VIS] One 8-bit load/store floating, secondary, little endian */
#define ASI_FL16_PRIMARY_LITTLE		0xda	/* [VIS] One 16-bit load/store floating, primary, little endian */
#define ASI_FL16_SECONDARY_LITTLE	0xdb	/* [VIS] One 16-bit load/store floating, secondary, little endian */

#define ASI_BLOCK_COMMIT_PRIMARY	0xe0	/* [4u] block store with commit, primary */
#define ASI_BLOCK_COMMIT_SECONDARY	0xe1	/* [4u] block store with commit, secondary */
#define ASI_BLOCK_PRIMARY		0xf0	/* [4u] block load/store, primary */
#define ASI_BLOCK_SECONDARY		0xf1	/* [4u] block load/store, secondary */
#define ASI_BLOCK_PRIMARY_LITTLE	0xf8	/* [4u] block load/store, primary, little endian */
#define ASI_BLOCK_SECONDARY_LITTLE	0xf9	/* [4u] block load/store, secondary, little endian */


/*
 * These are the shorter names used by Solaris
 */

#define ASI_N		ASI_NUCLEUS
#define ASI_NL		ASI_NUCLEUS_LITTLE
#define ASI_AIUP	ASI_AS_IF_USER_PRIMARY
#define ASI_AIUS	ASI_AS_IF_USER_SECONDARY
#define ASI_AIUPL	ASI_AS_IF_USER_PRIMARY_LITTLE
#define ASI_AIUSL	ASI_AS_IF_USER_SECONDARY_LITTLE
#define ASI_P		ASI_PRIMARY
#define ASI_S		ASI_SECONDARY
#define ASI_PNF		ASI_PRIMARY_NO_FAULT
#define ASI_SNF		ASI_SECONDARY_NO_FAULT
#define ASI_PL		ASI_PRIMARY_LITTLE
#define ASI_SL		ASI_SECONDARY_LITTLE
#define ASI_PNFL	ASI_PRIMARY_NO_FAULT_LITTLE
#define ASI_SNFL	ASI_SECONDARY_NO_FAULT_LITTLE
#define ASI_BLK_AIUP	ASI_BLOCK_AS_IF_USER_PRIMARY
#define ASI_BLK_AIUPL	ASI_BLOCK_AS_IF_USER_PRIMARY_LITTLE
#define ASI_BLK_AIUS	ASI_BLOCK_AS_IF_USER_SECONDARY
#define ASI_BLK_AIUSL	ASI_BLOCK_AS_IF_USER_SECONDARY_LITTLE
#define ASI_BLK_COMMIT_P		ASI_BLOCK_COMMIT_PRIMARY
#define ASI_BLK_COMMIT_PRIMARY		ASI_BLOCK_COMMIT_PRIMARY
#define ASI_BLK_COMMIT_S		ASI_BLOCK_COMMIT_SECONDARY
#define ASI_BLK_COMMIT_SECONDARY	ASI_BLOCK_COMMIT_SECONDARY
#define ASI_BLK_P			ASI_BLOCK_PRIMARY
#define ASI_BLK_PL			ASI_BLOCK_PRIMARY_LITTLE
#define ASI_BLK_S			ASI_BLOCK_SECONDARY
#define ASI_BLK_SL			ASI_BLOCK_SECONDARY_LITTLE

/*
 * PHYS_ASI(x) is true exactly for the four MMU-bypass ASIs
 * (0x14, 0x15, 0x1c, 0x1d); LITTLE_ASI(x) is non-zero when the
 * little-endian bit is set in x.
 */
#define PHYS_ASI(x)	(((x) | 0x09) == 0x1d)
#define LITTLE_ASI(x)	((x) & ASI_LITTLE)
    169 
    170 /*
    171  * The following are 4u control registers
    172  */
    173 
    174 
/*
 * Get the CPU's UPAID: UPA_CR_MID() extracts the 5-bit field at bits 21:17
 * of its argument; CPU_UPAID applies it to the value read with ldxa() from
 * offset 0 of ASI_MID_REG.
 */
#define	UPA_CR_MID(x)	(((x)>>17)&0x1f)
#define	CPU_UPAID	UPA_CR_MID(ldxa(0, ASI_MID_REG))

/*
 * [4u] MMU and Cache Control Register (MCCR)
 * use ASI = 0x45
 */
#define ASI_MCCR	ASI_LSU_CONTROL_REGISTER
#define MCCR		0x00

/* MCCR Bits and their meanings */
#define MCCR_DMMU_EN	0x08
#define MCCR_IMMU_EN	0x04
#define MCCR_DCACHE_EN	0x02
#define MCCR_ICACHE_EN	0x01


/*
 * MMU control registers
 */

/* Choose an MMU */
#define ASI_DMMU		0x58
#define ASI_IMMU		0x50

/* Other assorted MMU ASIs */
#define ASI_IMMU_8KPTR		0x51
#define ASI_IMMU_64KPTR		0x52
#define ASI_IMMU_DATA_IN	0x54
#define ASI_IMMU_TLB_DATA	0x55
#define ASI_IMMU_TLB_TAG	0x56
#define ASI_DMMU_8KPTR		0x59
#define ASI_DMMU_64KPTR		0x5a
#define ASI_DMMU_DATA_IN	0x5c
#define ASI_DMMU_TLB_DATA	0x5d
#define ASI_DMMU_TLB_TAG	0x5e

/*
 * The following are the control registers
 * They work on both MMUs unless noted.
 *
 * Register contents are defined later on individual registers.
 */
#define TSB_TAG_TARGET		0x0
#define TLB_DATA_IN		0x0
#define CTX_PRIMARY		0x08	/* primary context -- DMMU only */
#define CTX_SECONDARY		0x10	/* secondary context -- DMMU only */
#define SFSR			0x18
#define SFAR			0x20	/* fault address -- DMMU only */
#define TSB			0x28
#define TLB_TAG_ACCESS		0x30
#define VIRTUAL_WATCHPOINT	0x38
#define PHYSICAL_WATCHPOINT	0x40

/*
 * Tag Target bits.
 *
 * The context lives at bit 48 and up; the VA field holds a virtual address
 * shifted right by 22, i.e. at most 64 - 22 = 42 significant bits, so the
 * VA mask covers bits 41:0.  (The mask used to be written with 18 hex
 * digits, which does not fit in any 64-bit type.)
 *
 * TAG_TARGET_VA() masks before shifting so that the context bits are
 * dropped explicitly rather than by shifting them off the top.
 */
#define TAG_TARGET_VA_MASK	0x000003ffffffffffLL
#define TAG_TARGET_VA(x)	(((x)&TAG_TARGET_VA_MASK)<<22)
#define TAG_TARGET_CONTEXT(x)	((x)>>48)
#define TAG_TARGET(c,v)		((((uint64_t)(c))<<48)|(((uint64_t)(v))&TAG_TARGET_VA_MASK))
    235 
    236 /* SFSR bits for both D_SFSR and I_SFSR */
/* SFSR bits for both D_SFSR and I_SFSR */
#define SFSR_ASI(x)		((x)>>16)
#define SFSR_FT_VA_OOR_2	0x02000 /* IMMU: jumpl or return to unsupported VA */
#define SFSR_FT_VA_OOR_1	0x01000 /* fault at unsupported VA */
#define SFSR_FT_NFO		0x00800	/* DMMU: Access to page marked NFO */
#define SFSR_ILL_ASI		0x00400	/* DMMU: Illegal (unsupported) ASI */
#define SFSR_FT_IO_ATOMIC	0x00200	/* DMMU: Atomic access to noncacheable page */
#define SFSR_FT_ILL_NF		0x00100	/* DMMU: NF load or flush to page marked E (has side effects) */
#define SFSR_FT_PRIV		0x00080	/* Privilege violation */
#define SFSR_FT_E		0x00040	/* DMMU: value of E bit associated address */
#define SFSR_CTXT(x)		(((x)>>4)&0x3)
#define SFSR_CTXT_IS_PRIM(x)	(SFSR_CTXT(x)==0x00)
#define SFSR_CTXT_IS_SECOND(x)	(SFSR_CTXT(x)==0x01)
#define SFSR_CTXT_IS_NUCLEUS(x)	(SFSR_CTXT(x)==0x02)
#define SFSR_PRIV		0x00008	/* value of PSTATE.PRIV for faulting access */
#define SFSR_W			0x00004 /* DMMU: attempted write */
#define SFSR_OW			0x00002 /* Overwrite; prev fault was still valid */
#define SFSR_FV			0x00001	/* Fault is valid */
/* All fault-type bits (0x00080 through 0x02000) OR-ed together. */
#define SFSR_FT	(SFSR_FT_VA_OOR_2|SFSR_FT_VA_OOR_1|SFSR_FT_NFO|SFSR_ILL_ASI|SFSR_FT_IO_ATOMIC|SFSR_FT_ILL_NF|SFSR_FT_PRIV)

#if 0
/* Old bits */
#define SFSR_BITS "\40\16VAT\15VAD\14NFO\13ASI\12A\11NF\10PRIV\7E\6NUCLEUS\5SECONDCTX\4PRIV\3W\2OW\1FV"
#else
/*
 * New bits.
 *
 * In the "\177"-prefixed format bit positions are 0-origin (AFSR_BITS
 * below is written that way: "b\40ME" names bit 32, ASFR_ME), whereas the
 * old format above is 1-origin.  Each position here is therefore one less
 * than in the old string, so that every name lines up with its SFSR_*
 * mask (e.g. FV is bit 0, SFSR_FV == 0x1).
 */
#define SFSR_BITS "\177\20" \
	"f\20\30ASI\0" "b\15VAT\0" "b\14VAD\0" "b\13NFO\0" "b\12ASI\0" "b\11A\0" "b\10NF\0" "b\7PRIV\0" \
	 "b\6E\0" "b\5NUCLEUS\0" "b\4SECONDCTX\0" "b\3PRIV\0" "b\2W\0" "b\1OW\0" "b\0FV\0"
#endif

/* AFSR bits (the ASFR_ spelling of the prefix is historical) */
#define ASFR_ME			0x100000000LL
#define ASFR_PRIV		0x080000000LL
#define ASFR_ISAP		0x040000000LL
#define ASFR_ETP		0x020000000LL
#define ASFR_IVUE		0x010000000LL
#define ASFR_TO			0x008000000LL
#define ASFR_BERR		0x004000000LL
#define ASFR_LDP		0x002000000LL
#define ASFR_CP			0x001000000LL
#define ASFR_WP			0x000800000LL
#define ASFR_EDP		0x000400000LL
#define ASFR_UE			0x000200000LL
#define ASFR_CE			0x000100000LL
#define ASFR_ETS		0x0000f0000LL
#define ASFR_P_SYND		0x00000ffffLL
#define ASFT_P_SYND		ASFR_P_SYND	/* old misspelled name, kept for compatibility */

#define AFSR_BITS "\177\20" \
        "b\40ME\0"      "b\37PRIV\0"    "b\36ISAP\0"    "b\35ETP\0" \
        "b\34IVUE\0"    "b\33TO\0"      "b\32BERR\0"    "b\31LDP\0" \
        "b\30CP\0"      "b\27WP\0"      "b\26EDP\0"     "b\25UE\0" \
        "b\24CE\0"      "f\20\4ETS\0"   "f\0\20P_SYND\0"
    288 
    289 /*
    290  * Here's the spitfire TSB control register bits.
    291  *
    292  * Each TSB entry is 16-bytes wide.  The TSB must be size aligned
    293  */
#define TSB_SIZE_512		0x0	/* 8kB, etc. */
#define TSB_SIZE_1K		0x01
#define TSB_SIZE_2K		0x02
#define TSB_SIZE_4K		0x03
#define	TSB_SIZE_8K		0x04
#define TSB_SIZE_16K		0x05
#define TSB_SIZE_32K		0x06
#define TSB_SIZE_64K		0x07
#define TSB_SPLIT		0x1000
/*
 * The 64-bit masks carry an explicit ULL suffix: this header is also built
 * by a 32-bit compiler (the non-__arch64__ paths), where an unsuffixed
 * constant of this size does not fit in `long'.
 */
#define TSB_BASE		0xffffffffffffe000ULL

/*  TLB Tag Access bits */
#define TLB_TAG_ACCESS_VA	0xffffffffffffe000ULL
#define TLB_TAG_ACCESS_CTX	0x0000000000001fff

/*
 * TLB demap registers.  TTEs are defined in v9pte.h
 *
 * Use the address space to select between IMMU and DMMU.
 * The address of the register selects which context register
 * to read the ASI from.
 *
 * The data stored in the register is interpreted as the VA to
 * use.  The DEMAP_CTX_<> registers ignore the address and demap the
 * entire ASI.
 *
 */
#define ASI_IMMU_DEMAP			0x57	/* [4u] IMMU TLB demap */
#define ASI_DMMU_DEMAP			0x5f	/* [4u] DMMU TLB demap */

#define DEMAP_PAGE_NUCLEUS		((0x02)<<4)	/* Demap page from kernel AS */
#define DEMAP_PAGE_PRIMARY		((0x00)<<4)	/* Demap a page from primary CTXT */
#define DEMAP_PAGE_SECONDARY		((0x01)<<4)	/* Demap page from secondary CTXT (DMMU only) */
#define DEMAP_CTX_NUCLEUS		((0x06)<<4)	/* Demap all of kernel CTXT */
#define DEMAP_CTX_PRIMARY		((0x04)<<4)	/* Demap all of primary CTXT */
#define DEMAP_CTX_SECONDARY		((0x05)<<4)	/* Demap all of secondary CTXT */
    330 
    331 /*
    332  * Interrupt registers.  This really gets hairy.
    333  */
    334 
/* IRSR -- Interrupt Receive Status Register */
#define ASI_IRSR	0x49
#define IRSR		0x00
#define IRSR_BUSY	0x020
#define IRSR_MID(x)	((x)&0x1f)	/* low five bits: module ID */

/* IRDR -- Interrupt Receive Data Registers */
#define ASI_IRDR	0x7f
#define IRDR_0H		0x40
#define IRDR_0L		0x48	/* unimplemented */
#define IRDR_1H		0x50
#define IRDR_1L		0x58	/* unimplemented */
#define IRDR_2H		0x60
#define IRDR_2L		0x68	/* unimplemented */
#define IRDR_3H		0x70	/* unimplemented */
#define IRDR_3L		0x78	/* unimplemented */

/* SOFTINT ASRs */
#define SET_SOFTINT	%asr20	/* Sets these bits */
#define CLEAR_SOFTINT	%asr21	/* Clears these bits */
#define SOFTINT		%asr22	/* Reads the register */
#define TICK_CMPR	%asr23

#define	TICK_INT	0x01	/* level-14 clock tick */
#define SOFTINT1	(0x1<<1)
#define SOFTINT2	(0x1<<2)
#define SOFTINT3	(0x1<<3)
#define SOFTINT4	(0x1<<4)
#define SOFTINT5	(0x1<<5)
#define SOFTINT6	(0x1<<6)
#define SOFTINT7	(0x1<<7)
#define SOFTINT8	(0x1<<8)
#define SOFTINT9	(0x1<<9)
#define SOFTINT10	(0x1<<10)
#define SOFTINT11	(0x1<<11)
#define SOFTINT12	(0x1<<12)
#define SOFTINT13	(0x1<<13)
#define SOFTINT14	(0x1<<14)
#define SOFTINT15	(0x1<<15)

/* Interrupt Dispatch -- usually reserved for cross-calls */
#define ASR_IDSR	0x48 /* Interrupt dispatch status reg */
#define ASI_IDSR	ASR_IDSR /* same value under the ASI_ prefix, like ASI_IRSR/ASI_IRDR */
#define IDSR		0x00
#define IDSR_NACK	0x02
#define IDSR_BUSY	0x01

#define ASI_INTERRUPT_DISPATCH		0x77	/* [4u] spitfire interrupt dispatch regs */
/*
 * Store anything to this address to dispatch crosscall to CPU (x).
 * The target CPU number goes in the bits from 14 up and the low bits are
 * the fixed register offset 0x70.  The two must be OR-ed together: masking
 * the shifted value with 0x70, as this macro once did, always gives 0.
 */
#define IDCR(x)		(((x)<<14)|0x70)
#define IDDR_0H		0x40			/* Store data to send in these regs */
#define IDDR_0L		0x48	/* unimplemented */
#define IDDR_1H		0x50
#define IDDR_1L		0x58	/* unimplemented */
#define IDDR_2H		0x60
#define IDDR_2L		0x68	/* unimplemented */
#define IDDR_3H		0x70	/* unimplemented */
#define IDDR_3L		0x78	/* unimplemented */

/*
 * Error registers
 */

/* Since we won't try to fix async errs, we don't care about the bits in the regs */
#define ASI_AFAR	0x4d	/* Asynchronous fault address register */
#define AFAR		0x00
#define ASI_AFSR	0x4c	/* Asynchronous fault status register */
#define AFSR		0x00

#define ASI_P_EER	0x4b	/* Error enable register */
#define P_EER		0x00
#define P_EER_ISAPEN	0x04	/* Enable fatal on ISAP */
#define P_EER_NCEEN	0x02	/* Enable trap on uncorrectable errs */
#define P_EER_CEEN	0x01	/* Enable trap on correctable errs */

#define ASI_DATAPATH_READ	0x7f /* Read the regs */
#define ASI_DATAPATH_WRITE	0x77 /* Write to the regs */
#define P_DPER_0	0x00	/* Datapath err reg 0 */
#define P_DPER_1	0x18	/* Datapath err reg 1 */
#define P_DCR_0		0x20	/* Datapath control reg 0 */
#define P_DCR_1		0x38	/* Datapath control reg 1 */
    414 
    415 
    416 /* From sparc64/asm.h which I think I'll deprecate since it makes bus.h a pain. */
    417 
    418 #ifndef _LOCORE
    419 /*
    420  * GCC __asm constructs for doing assembly stuff.
    421  */
    422 
    423 /*
    424  * ``Routines'' to load and store from/to alternate address space.
    425  * The location can be a variable, the asi value (address space indicator)
    426  * must be a constant.
    427  *
    428  * N.B.: You can put as many special functions here as you like, since
    429  * they cost no kernel space or time if they are not used.
    430  *
    431  * These were static inline functions, but gcc screws up the constraints
    432  * on the address space identifiers (the "n"umeric value part) because
    433  * it inlines too late, so we have to use the funny valued-macro syntax.
    434  */
    435 
    436 /*
    437  * Apparently the definition of bypass ASIs is that they all use the
    438  * D$ so we need to flush the D$ to make sure we don't get data pollution.
    439  */
    440 
    441 static __inline__ u_char lduba __P((paddr_t loc, int asi));
    442 static __inline__ u_short lduha __P((paddr_t loc, int asi));
    443 static __inline__ u_int lda __P((paddr_t loc, int asi));
    444 static __inline__ int ldswa __P((paddr_t loc, int asi));
    445 static __inline__ u_int64_t ldxa __P((paddr_t loc, int asi));
    446 static __inline__ u_int64_t ldda __P((paddr_t loc, int asi));
    447 
    448 static __inline__ void stba __P((paddr_t loc, int asi, u_char value));
    449 static __inline__ void stha __P((paddr_t loc, int asi, u_short value));
    450 static __inline__ void sta __P((paddr_t loc, int asi, u_int value));
    451 static __inline__ void stxa __P((paddr_t loc, int asi, u_int64_t value));
    452 static __inline__ void stda __P((paddr_t loc, int asi, u_int64_t value));
    453 
    454 #if 0
    455 static __inline__ unsigned int casa __P((paddr_t loc, int asi,
    456 	unsigned int value, unsigned int oldvalue));
    457 static __inline__ u_int64_t casxa __P((paddr_t loc, int asi,
    458 	u_int64_t value, u_int64_t oldvalue));
    459 #endif
    460 
    461 #ifdef __arch64__
    462 static __inline__ u_char
    463 lduba(paddr_t loc, int asi)
    464 {
    465 	register unsigned int _lduba_v;
    466 
    467 	if (PHYS_ASI(asi)) {
    468 		__asm __volatile("wr %3,%%g0,%%asi; "
    469 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
    470 " lduba [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
    471 " stxa %%g0,[%1] %4; membar #Sync" :
    472 				 "=&r" (_lduba_v), "=r" (loc):
    473 				 "r" ((unsigned long)(loc)),
    474 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    475 	} else {
    476 		__asm __volatile("wr %2,%%g0,%%asi; lduba [%1]%%asi,%0" :
    477 				 "=r" (_lduba_v) :
    478 				 "r" ((unsigned long)(loc)), "r" (asi));
    479 	}
    480 	return (_lduba_v);
    481 }
    482 #else
    483 static __inline__ u_char
    484 lduba(paddr_t loc, int asi)
    485 {
    486 	register unsigned int _lduba_v, _loc_hi, _pstate;
    487 
    488 	_loc_hi = (((u_int64_t)loc)>>32);
    489 	if (PHYS_ASI(asi)) {
    490 		__asm __volatile("wr %4,%%g0,%%asi; "
    491 " andn %2,0x1f,%0; stxa %%g0,[%0] %5; rdpr %%pstate,%1; "
    492 " sllx %3,32,%0; or %0,%2,%0; wrpr %1,8,%%pstate; "
    493 " membar #Sync; lduba [%0]%%asi,%0; wrpr %1,0,%%pstate; "
    494 " andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" :
    495 				 "=&r" (_lduba_v),  "=&r" (_pstate) :
    496 				 "r" ((unsigned long)(loc)), "r" (_loc_hi),
    497 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    498 	} else {
    499 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
    500 " or %0,%1,%0; lduba [%0]%%asi,%0" : "=&r" (_lduba_v) :
    501 				 "r" ((unsigned long)(loc)),
    502 				 "r" (_loc_hi), "r" (asi));
    503 	}
    504 	return (_lduba_v);
    505 }
    506 #endif
    507 
    508 #ifdef __arch64__
    509 /* load half-word from alternate address space */
    510 static __inline__ u_short
    511 lduha(paddr_t loc, int asi)
    512 {
    513 	register unsigned int _lduha_v;
    514 
    515 	if (PHYS_ASI(asi)) {
    516 		__asm __volatile("wr %3,%%g0,%%asi; "
    517 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
    518 " lduha [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
    519 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lduha_v), "=r" (loc) :
    520 				 "r" ((unsigned long)(loc)),
    521 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    522 	} else {
    523 		__asm __volatile("wr %2,%%g0,%%asi; lduha [%1]%%asi,%0" :
    524 				 "=r" (_lduha_v) :
    525 				 "r" ((unsigned long)(loc)), "r" (asi));
    526 	}
    527 	return (_lduha_v);
    528 }
    529 #else
    530 /* load half-word from alternate address space */
    531 static __inline__ u_short
    532 lduha(paddr_t loc, int asi) {
    533 	register unsigned int _lduha_v, _loc_hi, _pstate;
    534 
    535 	_loc_hi = (((u_int64_t)loc)>>32);
    536 
    537 	if (PHYS_ASI(asi)) {
    538 		__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1; "
    539 " andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; sllx %3,32,%0; "
    540 " or %0,%2,%0; membar #Sync; lduha [%0]%%asi,%0; wrpr %1,0,%%pstate; "
    541 " andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" :
    542 				 "=&r" (_lduha_v), "=&r" (_pstate) :
    543 				 "r" ((unsigned long)(loc)), "r" (_loc_hi),
    544 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    545 	} else {
    546 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
    547 " or %0,%1,%0; lduha [%0]%%asi,%0" : "=&r" (_lduha_v) :
    548 				 "r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi));
    549 	}
    550 	return (_lduha_v);
    551 }
    552 #endif
    553 
    554 
    555 #ifdef __arch64__
    556 /* load unsigned int from alternate address space */
    557 static __inline__ u_int
    558 lda(paddr_t loc, int asi)
    559 {
    560 	register unsigned int _lda_v;
    561 
    562 	if (PHYS_ASI(asi)) {
    563 		__asm __volatile("wr %3,%%g0,%%asi; "
    564 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
    565 " lda [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
    566 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) :
    567 				 "r" ((unsigned long)(loc)),
    568 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    569 	} else {
    570 		__asm __volatile("wr %2,%%g0,%%asi; lda [%1]%%asi,%0" :
    571 				 "=r" (_lda_v) :
    572 				 "r" ((unsigned long)(loc)), "r" (asi));
    573 	}
    574 	return (_lda_v);
    575 }
    576 
    577 /* load signed int from alternate address space */
    578 static __inline__ int
    579 ldswa(paddr_t loc, int asi)
    580 {
    581 	register int _lda_v;
    582 
    583 	if (PHYS_ASI(asi)) {
    584 		__asm __volatile("wr %3,%%g0,%%asi; "
    585 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
    586 " ldswa [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
    587 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) :
    588 				 "r" ((unsigned long)(loc)),
    589 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    590 	} else {
    591 		__asm __volatile("wr %2,%%g0,%%asi; ldswa [%1]%%asi,%0" :
    592 				 "=r" (_lda_v) :
    593 				 "r" ((unsigned long)(loc)), "r" (asi));
    594 	}
    595 	return (_lda_v);
    596 }
    597 #else	/* __arch64__ */
    598 /* load unsigned int from alternate address space */
    599 static __inline__ u_int
    600 lda(paddr_t loc, int asi)
    601 {
    602 	register unsigned int _lda_v, _loc_hi, _pstate;
    603 
    604 	_loc_hi = (((u_int64_t)loc)>>32);
    605 	if (PHYS_ASI(asi)) {
    606 		__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;"
    607 " andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; "
    608 " sllx %3,32,%0; or %0,%2,%0; membar #Sync;lda [%0]%%asi,%0; "
    609 " wrpr %1,0,%%pstate; andn %2,0x1f,%1; membar #Sync; "
    610 " stxa %%g0,[%1] %5; membar #Sync" : "=&r" (_lda_v), "=&r" (_pstate) :
    611 				 "r" ((unsigned long)(loc)), "r" (_loc_hi),
    612 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    613 	} else {
    614 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
    615 " or %0,%1,%0; lda [%0]%%asi,%0" : "=&r" (_lda_v) :
    616 				 "r" ((unsigned long)(loc)),
    617 				 "r" (_loc_hi), "r" (asi));
    618 	}
    619 	return (_lda_v);
    620 }
    621 
    622 /* load signed int from alternate address space */
    623 static __inline__ int
    624 ldswa(paddr_t loc, int asi)
    625 {
    626 	register int _lda_v, _loc_hi, _pstate;
    627 
    628 	_loc_hi = (((u_int64_t)loc)>>32);
    629 	if (PHYS_ASI(asi)) {
    630 		__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;"
    631 " andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; sllx %3,32,%0;"
    632 " or %0,%2,%0; membar #Sync; ldswa [%0]%%asi,%0; wrpr %1,0,%%pstate; "
    633 " andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" :
    634 				 "=&r" (_lda_v), "=&r" (_pstate) :
    635 				 "r" ((unsigned long)(loc)), "r" (_loc_hi),
    636 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    637 	} else {
    638 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
    639 " or %0,%1,%0; ldswa [%0]%%asi,%0" : "=&r" (_lda_v) :
    640 				 "r" ((unsigned long)(loc)),
    641 				 "r" (_loc_hi), "r" (asi));
    642 	}
    643 	return (_lda_v);
    644 }
    645 #endif /* __arch64__ */
    646 
    647 #ifdef	__arch64__
    648 /* load 64-bit int from alternate address space -- these should never be used */
    649 static __inline__ u_int64_t
    650 ldda(paddr_t loc, int asi)
    651 {
    652 	register long long _lda_v;
    653 
    654 	if (PHYS_ASI(asi)) {
    655 		__asm __volatile("wr %3,%%g0,%%asi; "
    656 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
    657 " ldda [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
    658 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=&r" (loc) :
    659 				 "r" ((unsigned long)(loc)),
    660 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    661 	} else {
    662 		__asm __volatile("wr %2,%%g0,%%asi; ldda [%1]%%asi,%0" :
    663 				 "=r" (_lda_v) :
    664 				 "r" ((unsigned long)(loc)), "r" (asi));
    665 	}
    666 	return (_lda_v);
    667 }
    668 #else
    669 /* load 64-bit int from alternate address space */
    670 static __inline__ u_int64_t
    671 ldda(paddr_t loc, int asi)
    672 {
    673 	register long long _lda_v, _loc_hi, _pstate;
    674 
    675 	_loc_hi = (((u_int64_t)loc)>>32);
    676 	if (PHYS_ASI(asi)) {
    677 		__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;"
    678 " andn %2,0x1f,%0; rdpr %%pstate,%1; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate;"
    679 " sllx %3,32,%0; or %0,%2,%0; membar #Sync; ldda [%0]%%asi,%0; wrpr %1,0,%%pstate; "
    680 " andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" :
    681 				 "=&r" (_lda_v), "=&r" (_pstate) :
    682 				 "r" ((unsigned long)(loc)), "r" (_loc_hi),
    683 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    684 	} else {
    685 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
    686 " or %0,%1,%0; ldda [%0]%%asi,%0" : "=&r" (_lda_v) :
    687 				 "r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi));
    688 	}
    689 	return (_lda_v);
    690 }
    691 #endif
    692 
    693 
    694 #ifdef __arch64__
    695 /* ldxa (64-bit compiler): native 64-bit load from address loc in alternate address space asi; returns the loaded value */
    696 static __inline__ u_int64_t
    697 ldxa(paddr_t loc, int asi)
    698 {
    699 	register unsigned long _lda_v;	/* receives the loaded value */
    700 
    701 	if (PHYS_ASI(asi)) {	/* this path brackets the load with ASI_DCACHE_TAG stores */
    702 		__asm __volatile("wr %3,%%g0,%%asi; "	/* %asi = asi */
    703 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "	/* store zero to ASI_DCACHE_TAG at loc & ~0x1f */
    704 " ldxa [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "	/* the load itself, then recompute the aligned address into %1 */
    705 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) :	/* second tag store; loc doubles as the %1 scratch output */
    706 				 "r" ((unsigned long)(loc)),
    707 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    708 	} else {
    709 		__asm __volatile("wr %2,%%g0,%%asi; ldxa [%1]%%asi,%0" :	/* plain alternate-space load */
    710 				 "=r" (_lda_v) :
    711 				 "r" ((unsigned long)(loc)), "r" (asi));
    712 	}
    713 	return (_lda_v);
    714 }
    715 #else
    716 /* ldxa (32-bit compiler): native 64-bit load from alternate address space; the result is split into two 32-bit halves inside the asm and recombined in C */
    717 static __inline__ u_int64_t
    718 ldxa(paddr_t loc, int asi)
    719 {
    720 	register unsigned long _ldxa_lo, _ldxa_hi, _loc_hi;	/* result halves and high word of loc */
    721 
    722 	_loc_hi = (((u_int64_t)loc)>>32);	/* upper 32 bits of the address */
    723 	if (PHYS_ASI(asi)) {
    724 		__asm __volatile("wr %4,%%g0,%%asi; "	/* %asi = asi */
    725 " andn %2,0x1f,%0; rdpr %%pstate,%1; stxa %%g0,[%0] %5; "	/* save %pstate in %1; store zero to ASI_DCACHE_TAG at loc & ~0x1f */
    726 " sllx %3,32,%0; wrpr %1,8,%%pstate; or %0,%2,%0; membar #Sync; ldxa [%0]%%asi,%0; "	/* build 64-bit address, write %pstate with 0x8 applied (presumably the address-mask bit -- confirm), load */
    727 " wrpr %1,0,%%pstate; andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync; "	/* write saved %pstate back; second tag store */
    728 " srlx %0,32,%1; srl %0,0,%0" :	/* %1 = high 32 bits, %0 = low 32 bits of the loaded value */
    729 				 "=&r" (_ldxa_lo), "=&r" (_ldxa_hi) :
    730 				 "r" ((unsigned long)(loc)), "r" (_loc_hi),
    731 				 "r" (asi), "n" (ASI_DCACHE_TAG));
    732 	} else {
    733 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "	/* %asi = asi; start building the address */
    734 " or %0,%2,%0; ldxa [%0]%%asi,%0; srlx %0,32,%1; srl %0,0,%0;" :	/* load, then split into high (%1) and low (%0) halves */
    735 				 "=&r" (_ldxa_lo), "=&r" (_ldxa_hi) :
    736 				 "r" ((unsigned long)(loc)), "r" (_loc_hi),
    737 				 "r" (asi));
    738 	}
    739 	return ((((int64_t)_ldxa_hi)<<32)|_ldxa_lo);	/* recombine the halves */
    740 }
    741 #endif
    742 
    743 /* store byte to alternate address space */
    744 #ifdef __arch64__
    745 static __inline__ void
    746 stba(paddr_t loc, int asi, u_char value)
    747 {
    748 	if (PHYS_ASI(asi)) {
    749 		__asm __volatile("wr %3,%%g0,%%asi; stba %1,[%2]%%asi;"
    750 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :
    751 			"=&r" (loc) :
    752 			"r" ((int)(value)), "r" ((unsigned long)(loc)),
    753 			"r" (asi), "n" (ASI_DCACHE_TAG));
    754 	} else {
    755 		__asm __volatile("wr %2,%%g0,%%asi; stba %0,[%1]%%asi" : :
    756 			"r" ((int)(value)), "r" ((unsigned long)(loc)),
    757 			"r" (asi));
    758 	}
    759 }
    760 #else
    761 static __inline__ void
    762 stba(paddr_t loc, int asi, u_char value)
    763 {
    764 	register int _loc_hi, _pstate;
    765 
    766 	_loc_hi = (((u_int64_t)loc)>>32);
    767 	if (PHYS_ASI(asi)) {
    768 		__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;"
    769 " or %3,%0,%0; wrpr %1,8,%%pstate; stba %2,[%0]%%asi; wrpr %1,0,%%pstate; "
    770 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %6; membar #Sync" :
    771 				 "=&r" (_loc_hi), "=&r" (_pstate) :
    772 				 "r" ((int)(value)), "r" ((unsigned long)(loc)),
    773 				 "r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG));
    774 	} else {
    775 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "
    776 " or %2,%0,%0; stba %1,[%0]%%asi" : "=&r" (_loc_hi) :
    777 				 "r" ((int)(value)), "r" ((unsigned long)(loc)),
    778 				 "r" (_loc_hi), "r" (asi));
    779 	}
    780 }
    781 #endif
    782 
    783 /* store half-word to alternate address space */
    784 #ifdef __arch64__
    785 static __inline__ void	/* stha (64-bit compiler): store the half-word value at address loc in alternate address space asi */
    786 stha(paddr_t loc, int asi, u_short value)
    787 {
    788 	if (PHYS_ASI(asi)) {	/* this path follows the store with an ASI_DCACHE_TAG store */
    789 		__asm __volatile("wr %3,%%g0,%%asi; stha %1,[%2]%%asi;"	/* %asi = asi; the half-word store itself */
    790 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :	/* store zero to ASI_DCACHE_TAG at loc & ~0x1f */
    791 			"=&r" (loc) :	/* loc doubles as the %0 scratch output */
    792 			"r" ((int)(value)), "r" ((unsigned long)(loc)),
    793 			"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
    794 	} else {
    795 		__asm __volatile("wr %2,%%g0,%%asi; stha %0,[%1]%%asi" : :	/* plain alternate-space store */
    796 			"r" ((int)(value)), "r" ((unsigned long)(loc)),
    797 			"r" (asi) : "memory");
    798 	}
    799 }
    800 #else
    801 static __inline__ void	/* stha (32-bit compiler): store the half-word value at the 64-bit address loc in alternate address space asi */
    802 stha(paddr_t loc, int asi, u_short value)
    803 {
    804 	register int _loc_hi, _pstate;	/* high word of loc (also address scratch), saved %pstate */
    805 
    806 	_loc_hi = (((u_int64_t)loc)>>32);	/* upper 32 bits of the address */
    807 	if (PHYS_ASI(asi)) {
    808 		__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;"	/* %asi = asi; start building the address; save %pstate */
    809 " or %3,%0,%0; wrpr %1,8,%%pstate; stha %2,[%0]%%asi; wrpr %1,0,%%pstate; "	/* store with 0x8 applied to %pstate (presumably the address-mask bit -- confirm), then write the saved value back */
    810 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %6; membar #Sync" :	/* store zero to ASI_DCACHE_TAG at address & ~0x1f */
    811 			"=&r" (_loc_hi), "=&r" (_pstate) :
    812 			"r" ((int)(value)), "r" ((unsigned long)(loc)),
    813 			"r" (_loc_hi), "r" (asi),
    814 			"n" (ASI_DCACHE_TAG) : "memory");
    815 	} else {
    816 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "	/* %asi = asi; start building the address */
    817 " or %2,%0,%0; stha %1,[%0]%%asi" : "=&r" (_loc_hi) :	/* address = (_loc_hi << 32) | low word; store */
    818 				 "r" ((int)(value)), "r" ((unsigned long)(loc)),
    819 				 "r" (_loc_hi), "r" (asi) : "memory");
    820 	}
    821 }
    822 #endif
    823 
    824 
    825 /* store int to alternate address space */
    826 #ifdef __arch64__
    827 static __inline__ void	/* sta (64-bit compiler): store the 32-bit value at address loc in alternate address space asi */
    828 sta(paddr_t loc, int asi, u_int value)
    829 {
    830 	if (PHYS_ASI(asi)) {	/* this path follows the store with an ASI_DCACHE_TAG store */
    831 		__asm __volatile("wr %3,%%g0,%%asi; sta %1,[%2]%%asi;"	/* %asi = asi; the word store itself */
    832 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :	/* store zero to ASI_DCACHE_TAG at loc & ~0x1f */
    833 			"=&r" (loc) :	/* loc doubles as the %0 scratch output */
    834 			"r" ((int)(value)), "r" ((unsigned long)(loc)),
    835 			"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
    836 	} else {
    837 		__asm __volatile("wr %2,%%g0,%%asi; sta %0,[%1]%%asi" : :	/* plain alternate-space store */
    838 			"r" ((int)(value)), "r" ((unsigned long)(loc)),
    839 			"r" (asi) : "memory");
    840 	}
    841 }
    842 #else
    843 static __inline__ void	/* sta (32-bit compiler): store the 32-bit value at the 64-bit address loc in alternate address space asi */
    844 sta(paddr_t loc, int asi, u_int value)
    845 {
    846 	register int _loc_hi, _pstate;	/* high word of loc (also address scratch), saved %pstate */
    847 
    848 	_loc_hi = (((u_int64_t)loc)>>32);	/* upper 32 bits of the address */
    849 	if (PHYS_ASI(asi)) {
    850 		__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;"	/* %asi = asi; start building the address; save %pstate */
    851 " or %3,%0,%0; wrpr %1,8,%%pstate; sta %2,[%0]%%asi; wrpr %1,0,%%pstate; "	/* store with 0x8 applied to %pstate (presumably the address-mask bit -- confirm), then write the saved value back */
    852 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %6; membar #Sync" :	/* store zero to ASI_DCACHE_TAG at address & ~0x1f */
    853 			"=&r" (_loc_hi), "=&r" (_pstate) :
    854 			"r" ((int)(value)), "r" ((unsigned long)(loc)),
    855 			"r" (_loc_hi), "r" (asi),
    856 			"n" (ASI_DCACHE_TAG) : "memory");
    857 	} else {
    858 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "	/* %asi = asi; start building the address */
    859 " or %2,%0,%0; sta %1,[%0]%%asi" : "=&r" (_loc_hi) :	/* address = (_loc_hi << 32) | low word; store */
    860 				 "r" ((int)(value)), "r" ((unsigned long)(loc)),
    861 				 "r" (_loc_hi), "r" (asi) : "memory");
    862 	}
    863 }
    864 #endif
    865 
    866 /* store 64-bit int to alternate address space */
    867 #ifdef __arch64__
    868 static __inline__ void	/* stda (64-bit compiler): store the 64-bit value at address loc in alternate address space asi using the stda instruction */
    869 stda(paddr_t loc, int asi, u_int64_t value)
    870 {
    871 	if (PHYS_ASI(asi)) {	/* this path follows the store with an ASI_DCACHE_TAG store */
    872 		__asm __volatile("wr %3,%%g0,%%asi; stda %1,[%2]%%asi;"	/* %asi = asi; the store itself */
    873 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :	/* store zero to ASI_DCACHE_TAG at loc & ~0x1f */
    874 			"=&r" (loc) :	/* loc doubles as the %0 scratch output */
    875 			"r" ((long long)(value)), "r" ((unsigned long)(loc)),
    876 			"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
    877 	} else {
    878 		__asm __volatile("wr %2,%%g0,%%asi; stda %0,[%1]%%asi" : :	/* plain alternate-space store */
    879 			"r" ((long long)(value)), "r" ((unsigned long)(loc)),
    880 			"r" (asi) : "memory");
    881 	}
    882 }
    883 #else
    884 static __inline__ void	/* stda (32-bit compiler): store the 64-bit value at the 64-bit address loc in alternate address space asi using the stda instruction */
    885 stda(paddr_t loc, int asi, u_int64_t value)
    886 {
    887 	register int _loc_hi, _pstate;	/* high word of loc (also address scratch), saved %pstate */
    888 
    889 	_loc_hi = (((u_int64_t)loc)>>32);	/* upper 32 bits of the address */
    890 	if (PHYS_ASI(asi)) {
    891 		__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1; "	/* %asi = asi; start building the address; save %pstate */
    892 " or %3,%0,%0; wrpr %1,8,%%pstate; stda %2,[%0]%%asi; wrpr %1,0,%%pstate;"	/* store with 0x8 applied to %pstate (presumably the address-mask bit -- confirm), then write the saved value back */
    893 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %6; membar #Sync" :	/* store zero to ASI_DCACHE_TAG at address & ~0x1f */
    894 			"=&r" (_loc_hi), "=&r" (_pstate) :
    895 			"r" ((long long)(value)), "r" ((unsigned long)(loc)),
    896 			"r" (_loc_hi), "r" (asi),
    897 			"n" (ASI_DCACHE_TAG) : "memory");
    898 	} else {
    899 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "	/* %asi = asi; start building the address */
    900 " or %2,%0,%0; stda %1,[%0]%%asi" :	/* address = (_loc_hi << 32) | low word; store */
    901 			"=&r" (_loc_hi) :
    902 			"r" ((long long)(value)), "r" ((unsigned long)(loc)),
    903 			"r" (_loc_hi), "r" (asi) : "memory");
    904 	}
    905 }
    906 #endif
    907 
    908 #ifdef __arch64__
    909 /* stxa (64-bit compiler): native 64-bit store of value to address loc in alternate address space asi */
    910 static __inline__ void
    911 stxa(paddr_t loc, int asi, u_int64_t value)
    912 {
    913 	if (PHYS_ASI(asi)) {	/* this path follows the store with an ASI_DCACHE_TAG store */
    914 		__asm __volatile("wr %3,%%g0,%%asi; stxa %1,[%2]%%asi;"	/* %asi = asi; the 64-bit store itself */
    915 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :	/* store zero to ASI_DCACHE_TAG at loc & ~0x1f */
    916 			"=&r" (asi) :	/* NOTE(review): asi, not loc as in the sibling stores, is the %0 scratch output here */
    917 			"r" ((unsigned long)(value)),
    918 			"r" ((unsigned long)(loc)),
    919 			"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
    920 	} else {
    921 		__asm __volatile("wr %2,%%g0,%%asi; stxa %0,[%1]%%asi" : :	/* plain alternate-space store */
    922 			"r" ((unsigned long)(value)),
    923 			"r" ((unsigned long)(loc)), "r" (asi) : "memory");
    924 	}
    925 }
    926 #else
    927 /* native store 64-bit int to alternate address space w/32-bit compiler*/
    928 static __inline__ void
    929 stxa(paddr_t loc, int asi, u_int64_t value)
    930 {
    931 	int _stxa_lo, _stxa_hi, _loc_hi;
    932 
    933 	_stxa_lo = value;
    934 	_stxa_hi = ((u_int64_t)value)>>32;
    935 	_loc_hi = (((u_int64_t)(u_long)loc)>>32);
    936 
    937 	if (PHYS_ASI(asi)) {
    938 		__asm __volatile("wr %7,%%g0,%%asi; sllx %4,32,%1; sllx %6,32,%0; "
    939 " or %1,%3,%1; rdpr %%pstate,%2; or %0,%5,%0; wrpr %2,8,%%pstate; "
    940 " stxa %1,[%0]%%asi; wrpr %2,0,%%pstate; "
    941 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %8; membar #Sync" :
    942 				 "=&r" (_loc_hi), "=&r" (_stxa_hi),
    943 				 "=&r" ((int)(_stxa_lo)) :
    944 				 "r" ((int)(_stxa_lo)), "r" ((int)(_stxa_hi)),
    945 				 "r" ((unsigned long)(loc)), "r" (_loc_hi),
    946 				 "r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
    947 	} else {
    948 		__asm __volatile("wr %6,%%g0,%%asi; sllx %3,32,%1; sllx %5,32,%0; "
    949 " or %1,%2,%1; or %0,%4,%0; stxa %1,[%0]%%asi" :
    950 				 "=&r" (_loc_hi), "=&r" (_stxa_hi) :
    951 				 "r" ((int)(_stxa_lo)), "r" ((int)(_stxa_hi)),
    952 				 "r" ((unsigned long)(loc)), "r" (_loc_hi),
    953 				 "r" (asi) : "memory");
    954 	}
    955 }
    956 #endif
    957 
    958 #if 0
    959 #ifdef __arch64__
    960 /* casxa (64-bit compiler, disabled by the enclosing #if 0): 64-bit compare-and-swap at address loc in alternate address space asi; returns the register operand value after the casxa */
    961 static __inline__ u_int64_t
    962 casxa(paddr_t loc, int asi, u_int64_t value, u_int64_t oldvalue)
    963 {
    964 	if (PHYS_ASI(asi)) {	/* this path follows the casxa with an ASI_DCACHE_TAG store */
    965 		__asm __volatile("wr %4,%%g0,%%asi; casxa [%3]%%asi,%2,%1;"	/* %asi = asi; casxa with comparand oldvalue (%2) and swap register value (%1) */
    966 " andn %3,0x1f,%0; membar #Sync; stxa %%g0,[%0] %5; membar #Sync" :	/* store zero to ASI_DCACHE_TAG at loc & ~0x1f */
    967 			"=&r" (loc), "+r" (value) :	/* loc doubles as the %0 scratch output */
    968 			"r" ((unsigned long)(oldvalue)),
    969 			"r" ((unsigned long)(loc)),
    970 			"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
    971 	} else {
    972 		__asm __volatile("wr %3,%%g0,%%asi; casxa [%1]%%asi,%2,%0" :	/* plain alternate-space compare-and-swap */
    973 			"+r" (value) :
    974 			"r" ((unsigned long)(loc)), "r" (oldvalue), "r" (asi) :
    975 			"memory");
    976 	}
    977 	return (value);
    978 }
    979 #else
    980 /* casxa (32-bit compiler, disabled by the enclosing #if 0): 64-bit compare-and-swap in alternate address space; NOTE(review): this variant does not compile as written, see the notes below */
    981 static __inline__ u_int64_t
    982 casxa(paddr_t loc, int asi, u_int64_t value, u_int64_t oldvalue)
    983 {
    984 	int _casxa_lo, _casxa_hi, _loc_hi, _oval_hi;	/* 32-bit halves of value, high word of loc, high word of oldvalue */
    985 
    986 	_casxa_lo = value;
    987 	_casxa_hi = ((u_int64_t)value)>>32;
    988 	_oval_hi = ((u_int64_t)oldvalue)>>32;
    989 	_loc_hi = (((u_int64_t)(u_long)loc)>>32);	/* NOTE(review): the (u_long) cast truncates loc before the shift under a 32-bit compiler */
    990 
    991 	if (PHYS_ASI(asi)) {
    992 		__asm __volatile("wr %7,%%g0,%%asi; sllx %1,32,%1; sllx %5,32,%0; "	/* %asi = asi; shift high words into place */
    993 " sllx %3,32,%3; or %1,%2,%1; rdpr %%pstate,%2; or %0,%4,%0; or %3,%6,%3; "	/* rebuild value (%1), address (%0) and comparand (%3); save %pstate in %2 */
    994 " wrpr %2,8,%%pstate; casxa [%0]%%asi,%3,%1; wrpr %2,0,%%pstate; "	/* casxa with 0x8 applied to %pstate, then write the saved value back */
    995 " andn %0,0x1f,%3;  membar #Sync; stxa %%g0,[%3] %8; membar #Sync; "	/* store zero to ASI_DCACHE_TAG at address & ~0x1f */
    996 " sll %1,0,%2; srax %1,32,%1 " :	/* split the result back into low (%2) and high (%1) halves */
    997 			"=&r" (_loc_hi), "+r" (_casxa_hi),
    998 			"+r" (_casxa_lo), "+r" (_oval_hi) :
    999 			"r" ((unsigned long)(loc)), "r" (_loc_hi),
   1000 			"r" ((unsigned int)(oval))	/* NOTE(review): oval is not declared in this function, and the comma before the next operand is missing */
   1001 			"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
   1002 	} else {
   1003 		__asm __volatile("wr %7,%%g0,%%asi; sllx %1,32,%1; sllx %5,32,%0; "
   1004 " or %1,%2,%1; sllx %3,32,%2; or %0,%4,%0; or %2,%4,%2; "
   1005 " casxa [%0]%%asi,%2,%1; sll %1,0,%2; srax %o1,32,%o1 " :	/* NOTE(review): %o1 is a literal register name here, not an operand reference */
   1006 			"=&r" (_loc_hi), "+r" (_casxa_hi), "+r" (_casxa_lo) :
   1007 			"r" ((int)(_oval_hi)), "r" ((int)(oval)),
   1008 			"r" ((unsigned long)(loc)), "r" (_loc_hi),
   1009 			"r" (asi) : "memory");
   1010 	}
   1011 }	/* NOTE(review): no return statement although the function is declared to return u_int64_t */
   1012 #endif
   1013 #endif /* 0 */
   1014 
   1015 #if 0
   1016 #ifdef __arch64__
   1017 /* load byte from alternate address space */
   1018 #define	lduba(loc, asi) ({ \
   1019 	register unsigned int _lduba_v; \
   1020 	if (PHYS_ASI(asi)) { \
   1021 		__asm __volatile("wr %3,%%g0,%%asi; " \
   1022 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
   1023 " lduba [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
   1024 " stxa %%g0,[%1] %4; membar #Sync" : \
   1025 		"=&r" (_lduba_v), "=r" (loc): \
   1026 		"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1027 	} else { \
   1028 		__asm __volatile("wr %2,%%g0,%%asi; lduba [%1]%%asi,%0" : \
   1029 		"=r" (_lduba_v) : \
   1030 		"r" ((unsigned long)(loc)), "r" (asi)); \
   1031 	} \
   1032 	_lduba_v; \
   1033 })
   1034 #else
   1035 /* load byte from alternate address space */
   1036 #define	lduba(loc, asi) ({ \
   1037 	register unsigned int _lduba_v, _loc_hi, _pstate; \
   1038 	_loc_hi = (((u_int64_t)loc)>>32); \
   1039 	if (PHYS_ASI(asi)) { \
   1040 		__asm __volatile("wr %4,%%g0,%%asi; " \
   1041 " andn %2,0x1f,%0; stxa %%g0,[%0] %5; rdpr %%pstate,%1; " \
   1042 " sllx %3,32,%0; or %0,%2,%0; wrpr %1,8,%%pstate; " \
   1043 " membar #Sync; lduba [%0]%%asi,%0; wrpr %1,0,%%pstate; " \
   1044 " andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" : \
   1045 		"=&r" (_lduba_v),  "=&r" (_pstate) : \
   1046 		"r" ((unsigned long)(loc)), "r" (_loc_hi), \
   1047 		"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1048 	} else { \
   1049 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
   1050 " or %0,%1,%0; lduba [%0]%%asi,%0" : "=&r" (_lduba_v) : \
   1051 		"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
   1052 	} \
   1053 	_lduba_v; \
   1054 })
   1055 #endif
   1056 
   1057 #ifdef __arch64__
   1058 /* load half-word from alternate address space */
   1059 #define	lduha(loc, asi) ({ \
   1060 	register unsigned int _lduha_v; \
   1061 	if (PHYS_ASI(asi)) { \
   1062 		__asm __volatile("wr %3,%%g0,%%asi; " \
   1063 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
   1064 " lduha [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
   1065 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lduha_v), "=r" (loc) : \
   1066 		"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1067 	} else { \
   1068 		__asm __volatile("wr %2,%%g0,%%asi; lduha [%1]%%asi,%0" : "=r" (_lduha_v) : \
   1069 		"r" ((unsigned long)(loc)), "r" (asi)); \
   1070 	} \
   1071 	_lduha_v; \
   1072 })
   1073 #else
   1074 /* load half-word from alternate address space */
   1075 #define	lduha(loc, asi) ({ \
   1076 	register unsigned int _lduha_v, _loc_hi, _pstate; \
   1077 	_loc_hi = (((u_int64_t)loc)>>32); \
   1078 	if (PHYS_ASI(asi)) { \
   1079 		__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1; " \
   1080 " andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; sllx %3,32,%0; " \
   1081 " or %0,%2,%0; membar #Sync; lduha [%0]%%asi,%0; wrpr %1,0,%%pstate; " \
   1082 " andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" : \
   1083 		"=&r" (_lduha_v), "=&r" (_pstate) : \
   1084 		"r" ((unsigned long)(loc)), "r" (_loc_hi), \
   1085 		"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1086 	} else { \
   1087 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
   1088 " or %0,%1,%0; lduha [%0]%%asi,%0" : "=&r" (_lduha_v) : \
   1089 		"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
   1090 	} \
   1091 	_lduha_v; \
   1092 })
   1093 #endif
   1094 
   1095 #ifdef __arch64__
   1096 /* load unsigned int from alternate address space */
   1097 #define	lda(loc, asi) ({ \
   1098 	register unsigned int _lda_v; \
   1099 	if (PHYS_ASI(asi)) { \
   1100 		__asm __volatile("wr %3,%%g0,%%asi; " \
   1101 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
   1102 " lda [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
   1103 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) : \
   1104 		"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1105 	} else { \
   1106 		__asm __volatile("wr %2,%%g0,%%asi; lda [%1]%%asi,%0" : "=r" (_lda_v) : \
   1107 		"r" ((unsigned long)(loc)), "r" (asi)); \
   1108 	} \
   1109 	_lda_v; \
   1110 })
   1111 
   1112 /* load signed int from alternate address space */
   1113 #define	ldswa(loc, asi) ({ \
   1114 	register int _lda_v; \
   1115 	if (PHYS_ASI(asi)) { \
   1116 		__asm __volatile("wr %3,%%g0,%%asi; " \
   1117 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
   1118 " ldswa [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
   1119 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) : \
   1120 		"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1121 	} else { \
   1122 		__asm __volatile("wr %2,%%g0,%%asi; ldswa [%1]%%asi,%0" : "=r" (_lda_v) : \
   1123 		"r" ((unsigned long)(loc)), "r" (asi)); \
   1124 	} \
   1125 	_lda_v; \
   1126 })
   1127 #else	/* __arch64__ */
   1128 /* load unsigned int from alternate address space */
   1129 #define	lda(loc, asi) ({ \
   1130 	register unsigned int _lda_v, _loc_hi, _pstate; \
   1131 	_loc_hi = (((u_int64_t)loc)>>32); \
   1132 	if (PHYS_ASI(asi)) { \
   1133 		__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;" \
   1134 " andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; " \
   1135 " sllx %3,32,%0; or %0,%2,%0; membar #Sync;lda [%0]%%asi,%0; " \
   1136 " wrpr %1,0,%%pstate; andn %2,0x1f,%1; membar #Sync; " \
   1137 " stxa %%g0,[%1] %5; membar #Sync" : "=&r" (_lda_v), "=&r" (_pstate) : \
   1138 		"r" ((unsigned long)(loc)), "r" (_loc_hi), \
   1139 		"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1140 	} else { \
   1141 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
   1142 " or %0,%1,%0; lda [%0]%%asi,%0" : "=&r" (_lda_v) : \
   1143 		"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
   1144 	} \
   1145 	_lda_v; \
   1146 })
   1147 
   1148 /* load signed int from alternate address space */
   1149 #define	ldswa(loc, asi) ({ \
   1150 	register int _lda_v, _loc_hi, _pstate; \
   1151 	_loc_hi = (((u_int64_t)loc)>>32); \
   1152 	if (PHYS_ASI(asi)) { \
   1153 		__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;" \
   1154 " andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; sllx %3,32,%0;" \
   1155 " or %0,%2,%0; membar #Sync; ldswa [%0]%%asi,%0; wrpr %1,0,%%pstate; " \
   1156 " andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" : \
   1157 		"=&r" (_lda_v), "=&r" (_pstate) : \
   1158 		"r" ((unsigned long)(loc)), "r" (_loc_hi), \
   1159 		"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1160 	} else { \
   1161 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
   1162 " or %0,%1,%0; ldswa [%0]%%asi,%0" : "=&r" (_lda_v) : \
   1163 		"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
   1164 	} \
   1165 	_lda_v; \
   1166 })
   1167 #endif /* __arch64__ */
   1168 
   1169 #ifdef	__arch64__
   1170 /* load 64-bit int from alternate address space -- these should never be used */
   1171 #define	ldda(loc, asi) ({ \
   1172 	register long long _lda_v; \
   1173 	if (PHYS_ASI(asi)) { \
   1174 		__asm __volatile("wr %3,%%g0,%%asi; " \
   1175 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
   1176 " ldda [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
   1177 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=&r" (loc) : \
   1178 		"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1179 	} else { \
   1180 		__asm __volatile("wr %2,%%g0,%%asi; ldda [%1]%%asi,%0" : "=r" (_lda_v) : \
   1181 		"r" ((unsigned long)(loc)), "r" (asi)); \
   1182 	} \
   1183 	_lda_v; \
   1184 })
   1185 #else
   1186 /* load 64-bit int from alternate address space */
   1187 #define	ldda(loc, asi) ({ \
   1188 	register long long _lda_v, _loc_hi, _pstate; \
   1189 	_loc_hi = (((u_int64_t)loc)>>32); \
   1190 	if (PHYS_ASI(asi)) { \
   1191 		__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;" \
   1192 " andn %2,0x1f,%0; rdpr %%pstate,%1; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate;" \
   1193 " sllx %3,32,%0; or %0,%2,%0; membar #Sync; ldda [%0]%%asi,%0; wrpr %1,0,%%pstate; " \
   1194 " andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" : \
   1195 		 "=&r" (_lda_v), "=&r" (_pstate) : \
   1196 		"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1197 	} else { \
   1198 		__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
   1199 " or %0,%1,%0; ldda [%0]%%asi,%0" : "=&r" (_lda_v) : \
   1200 			"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
   1201 	} \
   1202 	_lda_v; \
   1203 })
   1204 #endif
   1205 
   1206 #ifdef __arch64__
   1207 /* native load 64-bit int from alternate address space w/64-bit compiler*/
   1208 #define	ldxa(loc, asi) ({ \
   1209 	register unsigned long _lda_v; \
   1210 	if (PHYS_ASI(asi)) { \
   1211 		__asm __volatile("wr %3,%%g0,%%asi; "\
   1212 " andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
   1213 " ldxa [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
   1214 " stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) : \
   1215 		"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1216 	} else { \
   1217 		__asm __volatile("wr %2,%%g0,%%asi; ldxa [%1]%%asi,%0" : "=r" (_lda_v) : \
   1218 		"r" ((unsigned long)(loc)), "r" (asi)); \
   1219 	} \
   1220 	_lda_v; \
   1221 })
   1222 #else
   1223 /* native load 64-bit int from alternate address space w/32-bit compiler*/
   1224 #define	ldxa(loc, asi) ({ \
   1225 	register unsigned long _ldxa_lo, _ldxa_hi, _loc_hi; \
   1226 	_loc_hi = (((u_int64_t)loc)>>32); \
   1227 	if (PHYS_ASI(asi)) { \
   1228 		__asm __volatile("wr %4,%%g0,%%asi; " \
   1229 " andn %2,0x1f,%0; rdpr %%pstate,%1; stxa %%g0,[%0] %5; " \
   1230 " sllx %3,32,%0; wrpr %1,8,%%pstate; or %0,%2,%0; membar #Sync; ldxa [%0]%%asi,%0; " \
   1231 " wrpr %1,0,%%pstate; andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync; " \
   1232 " srlx %0,32,%1; srl %0,0,%0" : \
   1233 		"=&r" (_ldxa_lo), "=&r" (_ldxa_hi) : \
   1234 		"r" ((unsigned long)(loc)), "r" (_loc_hi), \
   1235 		"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1236 	} else { \
   1237 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
   1238 " or %0,%2,%0; ldxa [%0]%%asi,%0; srlx %0,32,%1; srl %0,0,%0;" : \
   1239 		"=&r" (_ldxa_lo), "=&r" (_ldxa_hi) : \
   1240 		"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
   1241 	} \
   1242 	((((int64_t)_ldxa_hi)<<32)|_ldxa_lo); \
   1243 })
   1244 #endif
   1245 
   1246 
   1247 /* store byte to alternate address space */
   1248 #ifdef __arch64__
   1249 #define	stba(loc, asi, value) ({ \
   1250 	if (PHYS_ASI(asi)) { \
   1251 		__asm __volatile("wr %3,%%g0,%%asi; stba %1,[%2]%%asi;" \
   1252 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
   1253 			"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1254 			"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1255 	} else { \
   1256 		__asm __volatile("wr %2,%%g0,%%asi; stba %0,[%1]%%asi" : : \
   1257 		"r" ((int)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
   1258 	} \
   1259 })
   1260 #else
   1261 #define	stba(loc, asi, value) ({ \
   1262 	register int _loc_hi, _pstate; \
   1263 	_loc_hi = (((u_int64_t)loc)>>32); \
   1264 	if (PHYS_ASI(asi)) { \
   1265 		__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;" \
   1266 " or %3,%0,%0; wrpr %1,8,%%pstate; stba %2,[%0]%%asi; wrpr %1,0,%%pstate; " \
   1267 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %6; membar #Sync" : \
   1268 		"=&r" (_loc_hi), "=&r" (_pstate) : \
   1269 		"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1270 		"r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1271 	} else { \
   1272 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
   1273 " or %2,%0,%0; stba %1,[%0]%%asi" : "=&r" (_loc_hi) : \
   1274 		"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1275 		"r" (_loc_hi), "r" (asi)); \
   1276 	} \
   1277 })
   1278 #endif
   1279 
   1280 /* store half-word to alternate address space */
   1281 #ifdef __arch64__
   1282 #define	stha(loc, asi, value) ({ \
   1283 	if (PHYS_ASI(asi)) { \
   1284 		__asm __volatile("wr %3,%%g0,%%asi; stha %1,[%2]%%asi;" \
   1285 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
   1286 			"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1287 			"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1288 	} else { \
   1289 	__asm __volatile("wr %2,%%g0,%%asi; stha %0,[%1]%%asi" : : \
   1290 	    "r" ((int)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
   1291 	} \
   1292 })
   1293 #else
   1294 #define	stha(loc, asi, value) ({ \
   1295 	register int _loc_hi, _pstate; \
   1296 	_loc_hi = (((u_int64_t)loc)>>32); \
   1297 	if (PHYS_ASI(asi)) { \
   1298 		__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;" \
   1299 " or %3,%0,%0; wrpr %1,8,%%pstate; stha %2,[%0]%%asi; wrpr %1,0,%%pstate; " \
   1300 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %6; membar #Sync" : \
   1301 		"=&r" (_loc_hi), "=&r" (_pstate) : \
   1302 		"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1303 		"r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1304 	} else { \
   1305 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
   1306 " or %2,%0,%0; stha %1,[%0]%%asi" : "=&r" (_loc_hi) : \
   1307 	    "r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1308 		"r" (_loc_hi), "r" (asi)); \
   1309 	} \
   1310 })
   1311 #endif
   1312 
   1313 /* store int to alternate address space */
   1314 #ifdef __arch64__
   1315 #define	sta(loc, asi, value) ({ \
   1316 	if (PHYS_ASI(asi)) { \
   1317 		__asm __volatile("wr %3,%%g0,%%asi; sta %1,[%2]%%asi;" \
   1318 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
   1319 			"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1320 			"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1321 	} else { \
   1322 	__asm __volatile("wr %2,%%g0,%%asi; sta %0,[%1]%%asi" : : \
   1323 	    "r" ((int)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
   1324 	} \
   1325 })
   1326 #else
   1327 #define	sta(loc, asi, value) ({ \
   1328 	register int _loc_hi, _pstate; \
   1329 	_loc_hi = (((u_int64_t)loc)>>32); \
   1330 	if (PHYS_ASI(asi)) { \
   1331 		__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;" \
   1332 " or %3,%0,%0; wrpr %1,8,%%pstate; sta %2,[%0]%%asi; wrpr %1,0,%%pstate; " \
   1333 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %6; membar #Sync" : \
   1334 		"=&r" (_loc_hi), "=&r" (_pstate) : \
   1335 		"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1336 		"r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1337 	} else { \
   1338 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
   1339 " or %2,%0,%0; sta %1,[%0]%%asi" : "=&r" (_loc_hi) : \
   1340 		"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1341 		"r" (_loc_hi), "r" (asi)); \
   1342 	} \
   1343 })
   1344 #endif
   1345 
   1346 /* store 64-bit int to alternate address space */
   1347 #ifdef __arch64__
   1348 #define	stda(loc, asi, value) ({ \
   1349 	if (PHYS_ASI(asi)) { \
   1350 		__asm __volatile("wr %3,%%g0,%%asi; stda %1,[%2]%%asi;" \
   1351 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
   1352 			"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1353 			"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1354 	} else { \
   1355 	__asm __volatile("wr %2,%%g0,%%asi; stda %0,[%1]%%asi" : : \
   1356 	    "r" ((long long)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
   1357 	} \
   1358 })
   1359 #else
   1360 #define	stda(loc, asi, value) ({ \
   1361 	register int _loc_hi, _pstate; \
   1362 	_loc_hi = (((u_int64_t)loc)>>32); \
   1363 	if (PHYS_ASI(asi)) { \
   1364 	__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1; " \
   1365 " or %3,%0,%0; wrpr %1,8,%%pstate; stda %2,[%0]%%asi; wrpr %1,0,%%pstate;" \
   1366 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %6; membar #Sync" : \
   1367 		"=&r" (_loc_hi), "=&r" (_pstate) : \
   1368 		"r" ((long long)(value)), "r" ((unsigned long)(loc)), \
   1369 		"r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
   1370 	} else { \
   1371 		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
   1372 " or %2,%0,%0; stda %1,[%0]%%asi" : "=&r" (_loc_hi) : \
   1373 		"r" ((long long)(value)), "r" ((unsigned long)(loc)), \
   1374 		"r" (_loc_hi), "r" (asi)); \
   1375 	} \
   1376 })
   1377 #endif
   1378 
   1379 #ifdef __arch64__
   1380 /* native store 64-bit int to alternate address space w/64-bit compiler*/
   1381 #define	stxa(loc, asi, value) ({ \
   1382 	if (PHYS_ASI(asi)) { \
   1383 		__asm __volatile("wr %3,%%g0,%%asi; stxa %1,[%2]%%asi;" \
   1384 " andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
   1385 			"r" ((int)(value)), "r" ((unsigned long)(loc)), \
   1386 			"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1387 	} else { \
   1388 	__asm __volatile("wr %2,%%g0,%%asi; stxa %0,[%1]%%asi" : : \
   1389 	    "r" ((unsigned long)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
   1390 })
   1391 #else
   1392 /* native store 64-bit int to alternate address space w/32-bit compiler*/
   1393 #define	stxa(loc, asi, value) ({ \
   1394 	int _stxa_lo, _stxa_hi, _loc_hi; \
   1395 	_stxa_lo = value; _stxa_hi = ((u_int64_t)value)>>32; \
   1396 	_loc_hi = (((u_int64_t)(u_long)loc)>>32); \
   1397 	if (PHYS_ASI(asi)) { \
   1398 		__asm __volatile("wr %7,%%g0,%%asi; sllx %4,32,%1; sllx %6,32,%0; " \
   1399 " or %1,%3,%1; rdpr %%pstate,%2; or %0,%5,%0; wrpr %2,8,%%pstate; " \
   1400 " stxa %1,[%0]%%asi; wrpr %2,0,%%pstate; "  \
   1401 " andn %0,0x1f,%1;  membar #Sync; stxa %%g0,[%1] %8; membar #Sync": \
   1402 		"=&r" (_loc_hi), "=&r" (_stxa_hi), "=&r" ((int)(_stxa_lo)): \
   1403 		"r" ((int)(_stxa_lo)), "r" ((int)(_stxa_hi)), \
   1404 		"r" ((unsigned long)(loc)), "r" (_loc_hi), \
   1405 		"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1406 	} else { \
   1407 	__asm __volatile("wr %6,%%g0,%%asi; sllx %3,32,%1; sllx %5,32,%0; " \
   1408 " or %1,%2,%1; or %0,%4,%0; stxa %1,[%0]%%asi" : \
   1409 	    "=&r" (_loc_hi), "=&r" (_stxa_hi) : \
   1410 	    "r" ((int)(_stxa_lo)), "r" ((int)(_stxa_hi)), \
   1411 	    "r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
   1412 	} \
   1413 })
   1414 #endif
   1415 
   1416 
   1417 #ifdef __arch64__
   1418 /* native 64-bit compare-and-swap in alternate address space w/64-bit compiler*/
   1419 #define	casxa(loc, asi, value, ovalue) ({ \
   1420 	if (PHYS_ASI(asi)) { \
   1421 		__asm __volatile("wr %5,%%g0,%%asi; casxa [%4]%%asi,%3, %1;" \
   1422 " andn %4,0x1f,%0; membar #Sync; stxa %%g0,[%0] %5; membar #Sync" : \
   1423 			"=&r" (loc), "=&r" (value) : \
   1424 			"r" ((unsigned long)(value)),  "r" ((unsigned long)(ovalue)), \
   1425 			"r" ((unsigned long)(loc)), \
   1426 			"r" (asi), "n" (ASI_DCACHE_TAG)); \
   1427 	} else { \
   1428 	__asm __volatile("wr %4,%%g0,%%asi; casxa [%3]%%asi,%2,%1" : \
   1429 	    "=&r" (value) : \
   1430 	    "r" ((unsigned long)(value)), "r" ((unsigned long)(ovalue), \
   1431 	    "r" ((unsigned long)(loc)), "r" (asi)); \
   1432 })
   1433 #else
/*
 * 64-bit compare-and-swap in an alternate address space, 32-bit compiler.
 *
 *	loc	address of the doubleword to operate on
 *	asi	address space identifier (written to %asi)
 *	value	new value; must be a modifiable lvalue
 *	ovalue	value the doubleword is expected to hold
 *
 * The doubleword at loc is compared with ovalue and, if they match,
 * replaced by value.  Whether or not the swap happened, the previous
 * memory contents are written back into value; that value is also the
 * result of the macro expression.
 *
 * As in the 32-bit stxa(), every 64-bit quantity is passed to the asm as
 * two 32-bit halves and assembled into one register (sllx/or) inside the
 * same asm statement that uses it.  Low halves are zero-extended with
 * "srl reg,0,reg" first so stray upper register bits cannot leak into
 * the high word.  The old memory value is split back into halves before
 * the asm ends.
 *
 * When PHYS_ASI(asi) is true the casxa is bracketed by the same %pstate
 * toggle (bit 0x8) that stxa() uses and is followed by a store of %g0
 * through ASI_DCACHE_TAG to the 32-byte-aligned address.
 *
 * NOTE(review): this needs a compiler that accepts more than 10 asm
 * operands (read-write "+" operands count twice), and it has not been
 * exercised on hardware -- verify before relying on it.
 *
 * loc, value and ovalue are evaluated once (value is additionally
 * assigned to); asi is expanded more than once.
 */
#define	casxa(loc, asi, value, ovalue) ({ \
	u_int64_t _casxa_new = (u_int64_t)(value); \
	u_int64_t _casxa_exp = (u_int64_t)(ovalue); \
	unsigned long _casxa_loc = (unsigned long)(loc); \
	unsigned int _casxa_lo, _casxa_hi, _oval_lo, _oval_hi, _loc_hi; \
	unsigned int _casxa_ps; \
	_casxa_lo = _casxa_new; _casxa_hi = _casxa_new>>32; \
	_oval_lo = _casxa_exp; _oval_hi = _casxa_exp>>32; \
	_loc_hi = (((u_int64_t)_casxa_loc)>>32); \
	if (PHYS_ASI(asi)) { \
		/* %0 = new/old value, %2 = expected, %4 = address, %6 = saved %pstate */ \
		__asm __volatile("wr %7,%%g0,%%asi; " \
" sllx %0,32,%0; srl %1,0,%1; or %0,%1,%0; " \
" sllx %2,32,%2; srl %3,0,%3; or %2,%3,%2; " \
" sllx %4,32,%4; srl %5,0,%5; or %4,%5,%4; " \
" rdpr %%pstate,%6; wrpr %6,8,%%pstate; " \
" casxa [%4]%%asi,%2,%0; wrpr %6,0,%%pstate; " \
" srl %0,0,%1; srlx %0,32,%0; " \
" andn %4,0x1f,%4; membar #Sync; stxa %%g0,[%4] %8; membar #Sync" : \
		"+&r" (_casxa_hi), "+&r" (_casxa_lo), \
		"+&r" (_oval_hi), "+&r" (_oval_lo), \
		"+&r" (_loc_hi), "+&r" (_casxa_loc), \
		"=&r" (_casxa_ps) : \
		"r" (asi), "n" (ASI_DCACHE_TAG) : "memory"); \
	} else { \
		/* %0 = new/old value, %2 = expected, %4 = address */ \
		__asm __volatile("wr %6,%%g0,%%asi; " \
" sllx %0,32,%0; srl %1,0,%1; or %0,%1,%0; " \
" sllx %2,32,%2; srl %3,0,%3; or %2,%3,%2; " \
" sllx %4,32,%4; srl %5,0,%5; or %4,%5,%4; " \
" casxa [%4]%%asi,%2,%0; " \
" srl %0,0,%1; srlx %0,32,%0" : \
		"+&r" (_casxa_hi), "+&r" (_casxa_lo), \
		"+&r" (_oval_hi), "+&r" (_oval_lo), \
		"+&r" (_loc_hi), "+&r" (_casxa_loc) : \
		"r" (asi) : "memory"); \
	} \
	(value) = (__typeof__(value)) \
	    ((((u_int64_t)_casxa_hi)<<32)|((u_int64_t)_casxa_lo)); \
})
   1459 #endif
   1460 #endif
   1461 
   1462 
/*
 * Execute a SPARC "flush" instruction on the address loc.
 * loc is converted to unsigned long and passed in a register.
 */
#define flush(loc) ({ \
	unsigned long _flush_addr = (unsigned long)(loc); \
	__asm __volatile("flush %0" : : "r" (_flush_addr)); \
})
   1468 
/*
 * Flush a D$ line.
 *
 * The real implementation (a store of zero through ASI_DCACHE_TAG to the
 * 32-byte-aligned address, followed by membar_sync()) is compiled out.
 * flushline() is currently a no-op that does not evaluate its argument.
 *
 * The no-op expands to ((void)0) rather than to nothing, so that
 * "flushline(x)" stays a valid expression and "if (c) flushline(x);"
 * does not leave an empty if-body behind.
 */
#if 0
#define flushline(loc) ({ \
	stxa(((paddr_t)(loc))&(~0x1f), (ASI_DCACHE_TAG), 0); \
        membar_sync(); \
})
#else
#define flushline(loc)	((void)0)
#endif
   1478 
/* The following two enable or disable the dcache in the LSU control register */

/*
 * dcenable: read the register at address 0 of ASI_MCCR, OR in
 * MCCR_DCACHE_EN, write it back and issue membar #Sync.
 * The temporary is a true output operand ("=r"); it is written by the
 * ldxa before anything reads it.
 */
#define dcenable() ({ \
	int _dcen_tmp; \
	__asm __volatile("ldxa [%%g0] %1,%0; or %0,%2,%0; stxa %0,[%%g0] %1; membar #Sync" \
		: "=r" (_dcen_tmp) : "n" (ASI_MCCR), "n" (MCCR_DCACHE_EN)); \
})
/*
 * dcdisable: read the register at address 0 of ASI_MCCR, clear
 * MCCR_DCACHE_EN (andn), write it back and issue membar #Sync.
 * The temporary is a true output operand ("=r"); it is written by the
 * ldxa before anything reads it.
 */
#define dcdisable() ({ \
	int _dcdis_tmp; \
	__asm __volatile("ldxa [%%g0] %1,%0; andn %0,%2,%0; stxa %0,[%%g0] %1; membar #Sync" \
		: "=r" (_dcdis_tmp) : "n" (ASI_MCCR), "n" (MCCR_DCACHE_EN)); \
})
   1490 
/*
 * SPARC V9 memory barrier instructions.
 *
 * Each macro issues a single membar.  The "memory" clobber additionally
 * makes the statement a compiler barrier, so the compiler will not move
 * ordinary loads/stores across it or keep memory values cached in
 * registers over it; without it only the CPU would be constrained.
 */
/* Make all stores complete before next store */
#define membar_storestore() \
	__asm __volatile("membar #StoreStore" : : : "memory")
/* Make all loads complete before next store */
#define membar_loadstore() \
	__asm __volatile("membar #LoadStore" : : : "memory")
/* Make all stores complete before next load */
#define membar_storeload() \
	__asm __volatile("membar #StoreLoad" : : : "memory")
/* Make all loads complete before next load */
#define membar_loadload() \
	__asm __volatile("membar #LoadLoad" : : : "memory")
/* Complete all outstanding memory operations and exceptions */
#define membar_sync() \
	__asm __volatile("membar #Sync" : : : "memory")
/* Complete all outstanding memory operations */
#define membar_memissue() \
	__asm __volatile("membar #MemIssue" : : : "memory")
/* Complete all outstanding stores before any new loads */
#define membar_lookaside() \
	__asm __volatile("membar #Lookaside" : : : "memory")
   1508 
   1509 #ifdef __arch64__
/*
 * Read the 64-bit %tick register (64-bit compiler).
 * The value of the macro expression is the register contents as a u_long.
 */
#define	tick() ({ \
	register u_long _tick_now; \
	__asm __volatile("rdpr %%tick, %0" \
		: "=r" (_tick_now) \
		: ); \
	_tick_now; \
})
   1516 #else
/*
 * Read the 64-bit %tick register on a 32-bit system.
 *
 * %tick is read into one register and split inside the same asm
 * statement: "srl %0,0,%1" copies the zero-extended low 32 bits into the
 * second operand, then "srlx %0,32,%0" leaves the high 32 bits in the
 * first.  Both halves are unsigned so that widening the low half to
 * 64 bits cannot sign-extend into the high word.
 *
 * The value of the macro expression is the recombined u_int64_t.
 */
#define	tick() ({ \
	register unsigned int _tick_hi = 0, _tick_lo = 0; \
	__asm __volatile("rdpr %%tick, %0; srl %0,0,%1; srlx %0,32,%0 " \
		: "=r" (_tick_hi), "=r" (_tick_lo) : ); \
	(((u_int64_t)_tick_hi)<<32)|((u_int64_t)_tick_lo); \
})
   1524 #endif
   1525 
   1526 extern void next_tick __P((long));
   1527 #endif
   1528