NetBSD/sys/arch/sparc64/include/ctlreg.h

1526 lines
55 KiB
C

/* $NetBSD: ctlreg.h,v 1.23 2000/08/31 19:08:47 eeh Exp $ */
/*
* Copyright (c) 1996-1999 Eduardo Horvath
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
*/
/*
* Sun 4u control registers. (includes address space definitions
* and some registers in control space).
*/
/*
* The Alternate address spaces.
*
* 0x00-0x7f are privileged
* 0x80-0xff can be used by users
*/
/*
 * Address space identifier (ASI) values.  [4u] marks UltraSPARC (sun4u)
 * specific ASIs, [VIS] marks the ones used by the VIS partial-store and
 * short floating-point load/store instructions.
 */
#define ASI_LITTLE 0x08 /* This bit should make an ASI little endian */
#define ASI_NUCLEUS 0x04 /* [4u] kernel address space */
#define ASI_NUCLEUS_LITTLE 0x0c /* [4u] kernel address space, little endian */
#define ASI_AS_IF_USER_PRIMARY 0x10 /* [4u] primary user address space */
#define ASI_AS_IF_USER_SECONDARY 0x11 /* [4u] secondary user address space */
#define ASI_PHYS_CACHED 0x14 /* [4u] MMU bypass to main memory */
#define ASI_PHYS_NON_CACHED 0x15 /* [4u] MMU bypass to I/O location */
#define ASI_AS_IF_USER_PRIMARY_LITTLE 0x18 /* [4u] primary user address space, little endian */
#define ASI_AS_IF_USER_SECONDARY_LITTLE 0x19 /* [4u] secondary user address space, little endian */
/* Historical misspelling of the name above; kept so existing users still build. */
#define ASI_AS_IF_USER_SECONDARY_LITTIE ASI_AS_IF_USER_SECONDARY_LITTLE
#define ASI_PHYS_CACHED_LITTLE 0x1c /* [4u] MMU bypass to main memory, little endian */
#define ASI_PHYS_NON_CACHED_LITTLE 0x1d /* [4u] MMU bypass to I/O location, little endian */
#define ASI_NUCLEUS_QUAD_LDD 0x24 /* [4u] use w/LDDA to load 128-bit item */
#define ASI_NUCLEUS_QUAD_LDD_LITTLE 0x2c /* [4u] use w/LDDA to load 128-bit item, little endian */
#define ASI_FLUSH_D_PAGE_PRIMARY 0x38 /* [4u] flush D-cache page using primary context */
#define ASI_FLUSH_D_PAGE_SECONDARY 0x39 /* [4u] flush D-cache page using secondary context */
#define ASI_FLUSH_D_CTX_PRIMARY 0x3a /* [4u] flush D-cache context using primary context */
#define ASI_FLUSH_D_CTX_SECONDARY 0x3b /* [4u] flush D-cache context using secondary context */
#define ASI_LSU_CONTROL_REGISTER 0x45 /* [4u] load/store unit control register */
#define ASI_DCACHE_DATA 0x46 /* [4u] diagnostic access to D-cache data RAM */
#define ASI_DCACHE_TAG 0x47 /* [4u] diagnostic access to D-cache tag RAM */
#define ASI_INTR_DISPATCH_STATUS 0x48 /* [4u] interrupt dispatch status register */
#define ASI_INTR_RECEIVE 0x49 /* [4u] interrupt receive status register */
#define ASI_MID_REG 0x4a /* [4u] hardware config and MID */
#define ASI_ERROR_EN_REG 0x4b /* [4u] asynchronous error enables */
#define ASI_AFSR 0x4c /* [4u] asynchronous fault status register */
#define ASI_AFAR 0x4d /* [4u] asynchronous fault address register */
#define ASI_ICACHE_DATA 0x66 /* [4u] diagnostic access to I-cache data RAM */
#define ASI_ICACHE_TAG 0x67 /* [4u] diagnostic access to I-cache tag RAM */
#define ASI_FLUSH_I_PAGE_PRIMARY 0x68 /* [4u] flush I-cache page using primary context */
#define ASI_FLUSH_I_PAGE_SECONDARY 0x69 /* [4u] flush I-cache page using secondary context */
#define ASI_FLUSH_I_CTX_PRIMARY 0x6a /* [4u] flush I-cache context using primary context */
#define ASI_FLUSH_I_CTX_SECONDARY 0x6b /* [4u] flush I-cache context using secondary context */
#define ASI_BLOCK_AS_IF_USER_PRIMARY 0x70 /* [4u] primary user address space, block loads/stores */
#define ASI_BLOCK_AS_IF_USER_SECONDARY 0x71 /* [4u] secondary user address space, block loads/stores */
#define ASI_ECACHE_DIAG 0x76 /* [4u] diag access to E-cache tag and data */
#define ASI_DATAPATH_ERR_REG_WRITE 0x77 /* [4u] ASI is reused */
#define ASI_BLOCK_AS_IF_USER_PRIMARY_LITTLE 0x78 /* [4u] primary user address space, block loads/stores, little endian */
#define ASI_BLOCK_AS_IF_USER_SECONDARY_LITTLE 0x79 /* [4u] secondary user address space, block loads/stores, little endian */
#define ASI_INTERRUPT_RECEIVE_DATA 0x7f /* [4u] interrupt receive data registers {0,1,2} */
#define ASI_DATAPATH_ERR_REG_READ 0x7f /* [4u] read access to datapath error registers (ASI reused) */
#define ASI_PRIMARY 0x80 /* [4u] primary address space */
#define ASI_SECONDARY 0x81 /* [4u] secondary address space */
#define ASI_PRIMARY_NO_FAULT 0x82 /* [4u] primary address space, no fault */
#define ASI_SECONDARY_NO_FAULT 0x83 /* [4u] secondary address space, no fault */
#define ASI_PRIMARY_LITTLE 0x88 /* [4u] primary address space, little endian */
#define ASI_SECONDARY_LITTLE 0x89 /* [4u] secondary address space, little endian */
#define ASI_PRIMARY_NO_FAULT_LITTLE 0x8a /* [4u] primary address space, no fault, little endian */
#define ASI_SECONDARY_NO_FAULT_LITTLE 0x8b /* [4u] secondary address space, no fault, little endian */
#define ASI_PST8_PRIMARY 0xc0 /* [VIS] Eight 8-bit partial store, primary */
#define ASI_PST8_SECONDARY 0xc1 /* [VIS] Eight 8-bit partial store, secondary */
#define ASI_PST16_PRIMARY 0xc2 /* [VIS] Four 16-bit partial store, primary */
#define ASI_PST16_SECONDARY 0xc3 /* [VIS] Four 16-bit partial store, secondary */
#define ASI_PST32_PRIMARY 0xc4 /* [VIS] Two 32-bit partial store, primary */
#define ASI_PST32_SECONDARY 0xc5 /* [VIS] Two 32-bit partial store, secondary */
#define ASI_PST8_PRIMARY_LITTLE 0xc8 /* [VIS] Eight 8-bit partial store, primary, little endian */
#define ASI_PST8_SECONDARY_LITTLE 0xc9 /* [VIS] Eight 8-bit partial store, secondary, little endian */
#define ASI_PST16_PRIMARY_LITTLE 0xca /* [VIS] Four 16-bit partial store, primary, little endian */
#define ASI_PST16_SECONDARY_LITTLE 0xcb /* [VIS] Four 16-bit partial store, secondary, little endian */
#define ASI_PST32_PRIMARY_LITTLE 0xcc /* [VIS] Two 32-bit partial store, primary, little endian */
#define ASI_PST32_SECONDARY_LITTLE 0xcd /* [VIS] Two 32-bit partial store, secondary, little endian */
#define ASI_FL8_PRIMARY 0xd0 /* [VIS] One 8-bit load/store floating, primary */
#define ASI_FL8_SECONDARY 0xd1 /* [VIS] One 8-bit load/store floating, secondary */
#define ASI_FL16_PRIMARY 0xd2 /* [VIS] One 16-bit load/store floating, primary */
#define ASI_FL16_SECONDARY 0xd3 /* [VIS] One 16-bit load/store floating, secondary */
#define ASI_FL8_PRIMARY_LITTLE 0xd8 /* [VIS] One 8-bit load/store floating, primary, little endian */
#define ASI_FL8_SECONDARY_LITTLE 0xd9 /* [VIS] One 8-bit load/store floating, secondary, little endian */
#define ASI_FL16_PRIMARY_LITTLE 0xda /* [VIS] One 16-bit load/store floating, primary, little endian */
#define ASI_FL16_SECONDARY_LITTLE 0xdb /* [VIS] One 16-bit load/store floating, secondary, little endian */
#define ASI_BLOCK_COMMIT_PRIMARY 0xe0 /* [4u] block store with commit, primary */
#define ASI_BLOCK_COMMIT_SECONDARY 0xe1 /* [4u] block store with commit, secondary */
#define ASI_BLOCK_PRIMARY 0xf0 /* [4u] block load/store, primary */
#define ASI_BLOCK_SECONDARY 0xf1 /* [4u] block load/store, secondary */
#define ASI_BLOCK_PRIMARY_LITTLE 0xf8 /* [4u] block load/store, primary, little endian */
#define ASI_BLOCK_SECONDARY_LITTLE 0xf9 /* [4u] block load/store, secondary, little endian */
/*
 * These are the shorter names used by Solaris.
 * Every entry is a plain alias that expands to one of the long ASI_*
 * names; no new values are introduced here.
 */
#define ASI_N ASI_NUCLEUS
#define ASI_NL ASI_NUCLEUS_LITTLE
#define ASI_AIUP ASI_AS_IF_USER_PRIMARY
#define ASI_AIUS ASI_AS_IF_USER_SECONDARY
#define ASI_AIUPL ASI_AS_IF_USER_PRIMARY_LITTLE
#define ASI_AIUSL ASI_AS_IF_USER_SECONDARY_LITTLE
#define ASI_P ASI_PRIMARY
#define ASI_S ASI_SECONDARY
#define ASI_PNF ASI_PRIMARY_NO_FAULT
#define ASI_SNF ASI_SECONDARY_NO_FAULT
#define ASI_PL ASI_PRIMARY_LITTLE
#define ASI_SL ASI_SECONDARY_LITTLE
#define ASI_PNFL ASI_PRIMARY_NO_FAULT_LITTLE
#define ASI_SNFL ASI_SECONDARY_NO_FAULT_LITTLE
#define ASI_BLK_AIUP ASI_BLOCK_AS_IF_USER_PRIMARY
#define ASI_BLK_AIUPL ASI_BLOCK_AS_IF_USER_PRIMARY_LITTLE
#define ASI_BLK_AIUS ASI_BLOCK_AS_IF_USER_SECONDARY
#define ASI_BLK_AIUSL ASI_BLOCK_AS_IF_USER_SECONDARY_LITTLE
/* The block-commit ASIs have both an abbreviated (_P/_S) and a spelled-out alias. */
#define ASI_BLK_COMMIT_P ASI_BLOCK_COMMIT_PRIMARY
#define ASI_BLK_COMMIT_PRIMARY ASI_BLOCK_COMMIT_PRIMARY
#define ASI_BLK_COMMIT_S ASI_BLOCK_COMMIT_SECONDARY
#define ASI_BLK_COMMIT_SECONDARY ASI_BLOCK_COMMIT_SECONDARY
#define ASI_BLK_P ASI_BLOCK_PRIMARY
#define ASI_BLK_PL ASI_BLOCK_PRIMARY_LITTLE
#define ASI_BLK_S ASI_BLOCK_SECONDARY
#define ASI_BLK_SL ASI_BLOCK_SECONDARY_LITTLE
/*
 * PHYS_ASI(x) is true exactly for the four MMU-bypass ASIs
 * (0x14, 0x15, 0x1c and 0x1d): OR-ing in 0x08 (the little-endian bit)
 * and 0x01 (cached vs. non-cached) folds all four onto 0x1d.
 * LITTLE_ASI(x) is non-zero when the ASI_LITTLE bit is set in x.
 */
#define PHYS_ASI(x) (((x) | 0x09) == 0x1d)
#define LITTLE_ASI(x) ((x) & ASI_LITTLE)
/*
 * The following are 4u control registers
 */
/*
 * Get the CPU's UPAID.
 * UPA_CR_MID(x) extracts the 5-bit field held in bits 21:17 of x.
 * CPU_UPAID applies it to the value read with ldxa() from address 0
 * of ASI_MID_REG.
 */
#define UPA_CR_MID(x) (((x)>>17)&0x1f)
#define CPU_UPAID UPA_CR_MID(ldxa(0, ASI_MID_REG))
/*
 * [4u] MMU and Cache Control Register (MCCR)
 * use ASI = 0x45 (ASI_LSU_CONTROL_REGISTER)
 */
#define ASI_MCCR ASI_LSU_CONTROL_REGISTER
#define MCCR 0x00 /* presumably the address used together with ASI_MCCR -- confirm against callers */
/* MCCR Bits and their meanings (one enable bit per unit, going by the names) */
#define MCCR_DMMU_EN 0x08
#define MCCR_IMMU_EN 0x04
#define MCCR_DCACHE_EN 0x02
#define MCCR_ICACHE_EN 0x01
/*
 * MMU control registers
 */
/* Choose an MMU: the base ASI for the data MMU or the instruction MMU */
#define ASI_DMMU 0x58
#define ASI_IMMU 0x50
/*
 * Other assorted MMU ASIs.
 * Each DMMU ASI is its IMMU counterpart plus 0x08.
 */
#define ASI_IMMU_8KPTR 0x51
#define ASI_IMMU_64KPTR 0x52
#define ASI_IMMU_DATA_IN 0x54
#define ASI_IMMU_TLB_DATA 0x55
#define ASI_IMMU_TLB_TAG 0x56
#define ASI_DMMU_8KPTR 0x59
#define ASI_DMMU_64KPTR 0x5a
#define ASI_DMMU_DATA_IN 0x5c
#define ASI_DMMU_TLB_DATA 0x5d
#define ASI_DMMU_TLB_TAG 0x5e
/*
 * The following are the control registers
 * They work on both MMUs unless noted.
 *
 * Register contents are defined later on individual registers.
 *
 * NOTE(review): TSB_TAG_TARGET and TLB_DATA_IN share the value 0x0;
 * presumably they are used with different ASIs (ASI_xMMU vs.
 * ASI_xMMU_DATA_IN) -- confirm against callers.
 */
#define TSB_TAG_TARGET 0x0
#define TLB_DATA_IN 0x0
#define CTX_PRIMARY 0x08 /* primary context -- DMMU only */
#define CTX_SECONDARY 0x10 /* secondary context -- DMMU only */
#define SFSR 0x18
#define SFAR 0x20 /* fault address -- DMMU only */
#define TSB 0x28
#define TLB_TAG_ACCESS 0x30
#define VIRTUAL_WATCHPOINT 0x38
#define PHYSICAL_WATCHPOINT 0x40
/*
 * Tag Target bits.
 *
 * The context lives in the bits from 48 upwards and the virtual address
 * tag (VA<63:22>) in the low 42 bits.  The mask used to be wider than
 * that 42-bit field, so TAG_TARGET() could let a stray high bit of `v'
 * leak into the context field.
 *
 * TAG_TARGET_VA(x)      -- VA (bits 63:22) encoded in tag target x
 * TAG_TARGET_CONTEXT(x) -- context encoded in tag target x
 * TAG_TARGET(c,v)       -- build a tag target from context c and VA tag v
 *                          (v is VA >> 22)
 */
#define TAG_TARGET_VA_MASK 0x000003ffffffffffLL
#define TAG_TARGET_VA(x) (((x)&TAG_TARGET_VA_MASK)<<22)
#define TAG_TARGET_CONTEXT(x) ((x)>>48)
#define TAG_TARGET(c,v) ((((uint64_t)(c))<<48)|(((uint64_t)(v))&TAG_TARGET_VA_MASK))
/*
 * SFSR bits for both D_SFSR and I_SFSR.
 *
 * SFSR_ASI(x) yields everything from bit 16 upwards, SFSR_CTXT(x) the
 * two-bit context field in bits 5:4 (0 = primary, 1 = secondary,
 * 2 = nucleus).  SFSR_FT is the union of the fault-type bits.
 */
#define SFSR_ASI(x) ((x)>>16)
#define SFSR_FT_VA_OOR_2 0x02000 /* IMMU: jumpl or return to unsupported VA */
#define SFSR_FT_VA_OOR_1 0x01000 /* fault at unsupported VA */
#define SFSR_FT_NFO 0x00800 /* DMMU: Access to page marked NFO */
#define SFSR_ILL_ASI 0x00400 /* DMMU: Illegal (unsupported) ASI */
#define SFSR_FT_IO_ATOMIC 0x00200 /* DMMU: Atomic access to noncacheable page */
#define SFSR_FT_ILL_NF 0x00100 /* DMMU: NF load or flush to page marked E (has side effects) */
#define SFSR_FT_PRIV 0x00080 /* Privilege violation */
#define SFSR_FT_E 0x00040 /* DMMU: value of E bit associated address */
#define SFSR_CTXT(x) (((x)>>4)&0x3)
#define SFSR_CTXT_IS_PRIM(x) (SFSR_CTXT(x)==0x00)
#define SFSR_CTXT_IS_SECOND(x) (SFSR_CTXT(x)==0x01)
#define SFSR_CTXT_IS_NUCLEUS(x) (SFSR_CTXT(x)==0x02)
#define SFSR_PRIV 0x00008 /* value of PSTATE.PRIV for faulting access */
#define SFSR_W 0x00004 /* DMMU: attempted write */
#define SFSR_OW 0x00002 /* Overwrite; prev fault was still valid */
#define SFSR_FV 0x00001 /* Fault is valid */
#define SFSR_FT (SFSR_FT_VA_OOR_2|SFSR_FT_VA_OOR_1|SFSR_FT_NFO|SFSR_ILL_ASI|SFSR_FT_IO_ATOMIC|SFSR_FT_ILL_NF|SFSR_FT_PRIV)
#if 0
/* Old bits (old-style format string: bit numbers are 1-origin) */
#define SFSR_BITS "\40\16VAT\15VAD\14NFO\13ASI\12A\11NF\10PRIV\7E\6NUCLEUS\5SECONDCTX\4PRIV\3W\2OW\1FV"
#else
/*
 * New bits.  In the new-style ("\177\20") format the number after 'b'
 * is a 0-origin bit position, as AFSR_BITS in this file already assumes,
 * so each entry is the bit index of the matching SFSR_* mask above
 * (FV = bit 0 ... VAT = bit 13).  The previous string carried over the
 * 1-origin numbers of the old format and decoded every flag one bit off.
 */
#define SFSR_BITS "\177\20" \
"f\20\30ASI\0" "b\15VAT\0" "b\14VAD\0" "b\13NFO\0" "b\12ASI\0" "b\11A\0" "b\10NF\0" "b\7PRIV\0" \
"b\6E\0" "b\5NUCLEUS\0" "b\4SECONDCTX\0" "b\3PRIV\0" "b\2W\0" "b\1OW\0" "b\0FV\0"
#endif
/*
 * AFSR (asynchronous fault status register) bits.
 *
 * NOTE(review): the masks are spelled ASFR_* (and ASFT_P_SYND) while the
 * format string and the ASI use AFSR; the names are left untouched so
 * that existing users keep building.
 *
 * AFSR_BITS is a new-style ("\177\20") bit-description string: each
 * "b\N" entry names the 0-origin bit N and each "f\N\W" entry names a
 * W-bit field starting at bit N, matching the masks below.
 */
#define ASFR_ME 0x100000000LL
#define ASFR_PRIV 0x080000000LL
#define ASFR_ISAP 0x040000000LL
#define ASFR_ETP 0x020000000LL
#define ASFR_IVUE 0x010000000LL
#define ASFR_TO 0x008000000LL
#define ASFR_BERR 0x004000000LL
#define ASFR_LDP 0x002000000LL
#define ASFR_CP 0x001000000LL
#define ASFR_WP 0x000800000LL
#define ASFR_EDP 0x000400000LL
#define ASFR_UE 0x000200000LL
#define ASFR_CE 0x000100000LL
#define ASFR_ETS 0x0000f0000LL
#define ASFT_P_SYND 0x00000ffffLL
#define AFSR_BITS "\177\20" \
"b\40ME\0" "b\37PRIV\0" "b\36ISAP\0" "b\35ETP\0" \
"b\34IVUE\0" "b\33TO\0" "b\32BERR\0" "b\31LDP\0" \
"b\30CP\0" "b\27WP\0" "b\26EDP\0" "b\25UE\0" \
"b\24CE\0" "f\20\4ETS\0" "f\0\20P_SYND\0"
/*
 * Here's the spitfire TSB control register bits.
 *
 * Each TSB entry is 16-bytes wide. The TSB must be size aligned.
 *
 * The TSB_SIZE_* values are the size code: code n stands for
 * 512 << n entries (so code 0 is 512 entries * 16 bytes = 8kB).
 */
#define TSB_SIZE_512 0x0 /* 8kB, etc. */
#define TSB_SIZE_1K 0x01
#define TSB_SIZE_2K 0x02
#define TSB_SIZE_4K 0x03
#define TSB_SIZE_8K 0x04
#define TSB_SIZE_16K 0x05
#define TSB_SIZE_32K 0x06
#define TSB_SIZE_64K 0x07
#define TSB_SPLIT 0x1000
#define TSB_BASE 0xffffffffffffe000 /* mask: everything above the low 13 bits */
/* TLB Tag Access bits: VA in the bits above the low 13, context in the low 13 bits */
#define TLB_TAG_ACCESS_VA 0xffffffffffffe000
#define TLB_TAG_ACCESS_CTX 0x0000000000001fff
/*
 * TLB demap registers. TTEs are defined in v9pte.h
 *
 * Use the address space to select between IMMU and DMMU.
 * The address of the register selects which context register
 * to read the ASI from.
 *
 * The data stored in the register is interpreted as the VA to
 * use. The DEMAP_CTX_<> registers ignore the address and demap the
 * entire ASI.
 *
 * The DEMAP_* values are a selector code shifted into bits 6:4;
 * the CTX variants are the PAGE variants with bit 6 (0x40) set.
 */
#define ASI_IMMU_DEMAP 0x57 /* [4u] IMMU TLB demap */
#define ASI_DMMU_DEMAP 0x5f /* [4u] DMMU TLB demap */
#define DEMAP_PAGE_NUCLEUS ((0x02)<<4) /* Demap page from kernel AS */
#define DEMAP_PAGE_PRIMARY ((0x00)<<4) /* Demap a page from primary CTXT */
#define DEMAP_PAGE_SECONDARY ((0x01)<<4) /* Demap page from secondary CTXT (DMMU only) */
#define DEMAP_CTX_NUCLEUS ((0x06)<<4) /* Demap all of kernel CTXT */
#define DEMAP_CTX_PRIMARY ((0x04)<<4) /* Demap all of primary CTXT */
#define DEMAP_CTX_SECONDARY ((0x05)<<4) /* Demap all of secondary CTXT */
/*
* Interrupt registers. This really gets hairy.
*/
/*
 * IRSR -- Interrupt Receive Status Register
 *
 * IRSR_BUSY is bit 5; IRSR_MID(x) extracts the 5-bit module ID held in
 * the low bits of x.  The macro argument is parenthesized so that an
 * expression such as IRSR_MID(a | b) is masked as a whole.
 */
#define ASI_IRSR 0x49
#define IRSR 0x00
#define IRSR_BUSY 0x020
#define IRSR_MID(x) ((x)&0x1f)
/*
 * IRDR -- Interrupt Receive Data Registers
 * (register addresses within ASI_IRDR)
 */
#define ASI_IRDR 0x7f
#define IRDR_0H 0x40
#define IRDR_0L 0x48 /* unimplemented */
#define IRDR_1H 0x50
#define IRDR_1L 0x58 /* unimplemented */
#define IRDR_2H 0x60
#define IRDR_2L 0x68 /* unimplemented */
#define IRDR_3H 0x70 /* unimplemented */
#define IRDR_3L 0x78 /* unimplemented */
/*
 * SOFTINT ASRs.
 * The first four names expand to assembler register names (%asrNN), so
 * they are only usable inside assembly text.  The remaining values are
 * bit masks: TICK_INT is bit 0 and SOFTINTn is bit n.
 */
#define SET_SOFTINT %asr20 /* Sets these bits */
#define CLEAR_SOFTINT %asr21 /* Clears these bits */
#define SOFTINT %asr22 /* Reads the register */
#define TICK_CMPR %asr23
#define TICK_INT 0x01 /* level-14 clock tick */
#define SOFTINT1 (0x1<<1)
#define SOFTINT2 (0x1<<2)
#define SOFTINT3 (0x1<<3)
#define SOFTINT4 (0x1<<4)
#define SOFTINT5 (0x1<<5)
#define SOFTINT6 (0x1<<6)
#define SOFTINT7 (0x1<<7)
#define SOFTINT8 (0x1<<8)
#define SOFTINT9 (0x1<<9)
#define SOFTINT10 (0x1<<10)
#define SOFTINT11 (0x1<<11)
#define SOFTINT12 (0x1<<12)
#define SOFTINT13 (0x1<<13)
#define SOFTINT14 (0x1<<14)
#define SOFTINT15 (0x1<<15)
/*
 * Interrupt Dispatch -- usually reserved for cross-calls
 *
 * ASR_IDSR is an ASI value (the same 0x48 as ASI_INTR_DISPATCH_STATUS)
 * despite its ASR_ prefix; the name is kept for existing users.
 *
 * IDCR(x) builds the dispatch address for CPU x: the module ID goes in
 * the bits from 14 upwards and the low bits are the fixed register
 * offset 0x70.  The two parts must be OR-ed together; the former
 * `& 0x70' always produced 0 because (x)<<14 has no bits set below
 * bit 14.
 */
#define ASR_IDSR 0x48 /* Interrupt dispatch status reg */
#define IDSR 0x00
#define IDSR_NACK 0x02
#define IDSR_BUSY 0x01
#define ASI_INTERRUPT_DISPATCH 0x77 /* [4u] spitfire interrupt dispatch regs */
#define IDCR(x) (((x)<<14)|0x70) /* Store anything to this address to dispatch crosscall to CPU (x) */
#define IDDR_0H 0x40 /* Store data to send in these regs */
#define IDDR_0L 0x48 /* unimplemented */
#define IDDR_1H 0x50
#define IDDR_1L 0x58 /* unimplemented */
#define IDDR_2H 0x60
#define IDDR_2L 0x68 /* unimplemented */
#define IDDR_3H 0x70 /* unimplemented */
#define IDDR_3L 0x78 /* unimplemented */
/*
 * Error registers
 */
/*
 * Since we won't try to fix async errs, we don't care about the bits in the regs.
 *
 * ASI_AFAR and ASI_AFSR repeat, with the same values, the definitions
 * in the ASI table earlier in this file.
 */
#define ASI_AFAR 0x4d /* Asynchronous fault address register */
#define AFAR 0x00
#define ASI_AFSR 0x4c /* Asynchronous fault status register */
#define AFSR 0x00
#define ASI_P_EER 0x4b /* Error enable register */
#define P_EER 0x00
#define P_EER_ISAPEN 0x04 /* Enable fatal on ISAP */
#define P_EER_NCEEN 0x02 /* Enable trap on uncorrectable errs */
#define P_EER_CEEN 0x01 /* Enable trap on correctable errs */
#define ASI_DATAPATH_READ 0x7f /* Read the regs */
#define ASI_DATAPATH_WRITE 0x77 /* Write to the regs */
#define P_DPER_0 0x00 /* Datapath err reg 0 */
#define P_DPER_1 0x18 /* Datapath err reg 1 */
#define P_DCR_0 0x20 /* Datapath control reg 0 */
#define P_DCR_1 0x38 /* Datapath control reg 1 */
/* From sparc64/asm.h which I think I'll deprecate since it makes bus.h a pain. */
#ifndef _LOCORE
/*
* GCC __asm constructs for doing assembly stuff.
*/
/*
 * ``Routines'' to load and store from/to alternate address space.
 * The location can be a variable.  The asi value (address space
 * indicator) is written to the %asi register at run time by the
 * routines below, so it does not have to be a compile-time constant.
 *
 * N.B.: You can put as many special functions here as you like, since
 * they cost no kernel space or time if they are not used.
 *
 * Historical note: an earlier version used the funny valued-macro
 * syntax instead of static inline functions, because gcc screwed up
 * the constraints on the address space identifiers (the "n"umeric
 * value part) when it inlined too late.  The routines below are static
 * inline functions that pass the asi in a register.
 */
/*
* Apparently the definition of bypass ASIs is that they all use the
* D$ so we need to flush the D$ to make sure we don't get data pollution.
*/
/*
 * Prototypes for the alternate-address-space accessors defined below.
 * Loads take (loc, asi) and return the value read; stores take
 * (loc, asi, value); casxa additionally takes the expected old value.
 * __P(()) keeps the declarations usable with pre-ANSI compilers.
 */
static __inline__ u_char lduba __P((paddr_t loc, int asi));
static __inline__ u_short lduha __P((paddr_t loc, int asi));
static __inline__ u_int lda __P((paddr_t loc, int asi));
static __inline__ int ldswa __P((paddr_t loc, int asi));
static __inline__ u_int64_t ldxa __P((paddr_t loc, int asi));
static __inline__ u_int64_t ldda __P((paddr_t loc, int asi));
static __inline__ void stba __P((paddr_t loc, int asi, u_char value));
static __inline__ void stha __P((paddr_t loc, int asi, u_short value));
static __inline__ void sta __P((paddr_t loc, int asi, u_int value));
static __inline__ void stxa __P((paddr_t loc, int asi, u_int64_t value));
static __inline__ void stda __P((paddr_t loc, int asi, u_int64_t value));
/* The 32-bit compare-and-swap variant is compiled out. */
#if 0
static __inline__ unsigned int casa __P((paddr_t loc, int asi,
unsigned int value, unsigned int oldvalue));
#endif
static __inline__ u_int64_t casxa __P((paddr_t loc, int asi,
u_int64_t value, u_int64_t oldvalue));
#ifdef __arch64__
/*
 * lduba -- load an unsigned byte from alternate address space
 * (64-bit compiler).
 *
 * loc is the address to read and asi the address space identifier; asi
 * is written to %asi and the load goes through it.  Returns the byte
 * that was loaded.
 *
 * For the MMU-bypass ASIs (PHYS_ASI) the load is bracketed by stxa %g0
 * writes to ASI_DCACHE_TAG at (loc & ~0x1f), each followed by
 * membar #Sync, per the note on bypass ASIs and the D$ above.
 */
static __inline__ u_char
lduba(paddr_t loc, int asi)
{
register unsigned int _lduba_v;
if (PHYS_ASI(asi)) {
/* %0 = result (first used as scratch for the tag address), %1 = scratch bound to loc */
__asm __volatile("wr %3,%%g0,%%asi; "
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
" lduba [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
" stxa %%g0,[%1] %4; membar #Sync" :
"=&r" (_lduba_v), "=r" (loc):
"r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Any other ASI: just set %asi and load. */
__asm __volatile("wr %2,%%g0,%%asi; lduba [%1]%%asi,%0" :
"=r" (_lduba_v) :
"r" ((unsigned long)(loc)), "r" (asi));
}
return (_lduba_v);
}
#else
/*
 * lduba -- load an unsigned byte from alternate address space
 * (32-bit compiler).
 *
 * loc is passed to the asm as two words, its low word and _loc_hi
 * (bits 63:32), which are recombined with sllx/or into one 64-bit
 * address.  asi is written to %asi and the load goes through it.
 * Returns the byte that was loaded.
 *
 * For the MMU-bypass ASIs (PHYS_ASI) %pstate is saved with rdpr,
 * rewritten with `wrpr %1,8' for the duration of the load and restored
 * with `wrpr %1,0' (presumably this toggles PSTATE.AM so the full
 * 64-bit address is used -- confirm against the SPARC V9 manual).  The
 * load is bracketed by stxa %g0 writes to ASI_DCACHE_TAG at the
 * 32-byte-aligned low word of loc.
 */
static __inline__ u_char
lduba(paddr_t loc, int asi)
{
register unsigned int _lduba_v, _loc_hi, _pstate;
_loc_hi = (((u_int64_t)loc)>>32);
if (PHYS_ASI(asi)) {
/* %0 = address scratch, then result; %1 = saved %pstate, then tag address */
__asm __volatile("wr %4,%%g0,%%asi; "
" andn %2,0x1f,%0; stxa %%g0,[%0] %5; rdpr %%pstate,%1; "
" sllx %3,32,%0; or %0,%2,%0; wrpr %1,8,%%pstate; "
" membar #Sync; lduba [%0]%%asi,%0; wrpr %1,0,%%pstate; "
" andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" :
"=&r" (_lduba_v), "=&r" (_pstate) :
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Any other ASI: build the 64-bit address in %0, then load into %0. */
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
" or %0,%1,%0; lduba [%0]%%asi,%0" : "=&r" (_lduba_v) :
"r" ((unsigned long)(loc)),
"r" (_loc_hi), "r" (asi));
}
return (_lduba_v);
}
#endif
#ifdef __arch64__
/*
 * lduha -- load an unsigned half-word from alternate address space
 * (64-bit compiler).
 *
 * loc is the address, asi the address space identifier (written to
 * %asi before the load).  Returns the half-word that was loaded.
 *
 * When PHYS_ASI(asi) is true, stxa %g0 is issued to ASI_DCACHE_TAG at
 * (loc & ~0x1f) before and after the load, each with membar #Sync.
 */
static __inline__ u_short
lduha(paddr_t loc, int asi)
{
register unsigned int _lduha_v;
if (PHYS_ASI(asi)) {
/* %0 = tag address scratch, then result; %1 = scratch bound to loc */
__asm __volatile("wr %3,%%g0,%%asi; "
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
" lduha [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lduha_v), "=r" (loc) :
"r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: set %asi and load. */
__asm __volatile("wr %2,%%g0,%%asi; lduha [%1]%%asi,%0" :
"=r" (_lduha_v) :
"r" ((unsigned long)(loc)), "r" (asi));
}
return (_lduha_v);
}
#else
/*
 * lduha -- load an unsigned half-word from alternate address space
 * (32-bit compiler).
 *
 * The address reaches the asm as the low word of loc plus _loc_hi
 * (bits 63:32) and is rebuilt with sllx/or.  asi is written to %asi.
 * Returns the half-word that was loaded.
 *
 * When PHYS_ASI(asi) is true, %pstate is saved (rdpr), rewritten with
 * `wrpr %1,8' around the load and restored with `wrpr %1,0'
 * (presumably toggling PSTATE.AM -- confirm against the SPARC V9
 * manual), and stxa %g0 is issued to ASI_DCACHE_TAG at the
 * 32-byte-aligned low word of loc before and after the load.
 */
static __inline__ u_short
lduha(paddr_t loc, int asi) {
register unsigned int _lduha_v, _loc_hi, _pstate;
_loc_hi = (((u_int64_t)loc)>>32);
if (PHYS_ASI(asi)) {
/* %0 = address scratch, then result; %1 = saved %pstate, then tag address */
__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1; "
" andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; sllx %3,32,%0; "
" or %0,%2,%0; membar #Sync; lduha [%0]%%asi,%0; wrpr %1,0,%%pstate; "
" andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" :
"=&r" (_lduha_v), "=&r" (_pstate) :
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: rebuild the address in %0 and load into %0. */
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
" or %0,%1,%0; lduha [%0]%%asi,%0" : "=&r" (_lduha_v) :
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi));
}
return (_lduha_v);
}
#endif
#ifdef __arch64__
/*
 * lda -- load an unsigned int from alternate address space
 * (64-bit compiler).
 *
 * loc is the address, asi the address space identifier (written to
 * %asi before the load).  Returns the word that was loaded.
 *
 * When PHYS_ASI(asi) is true, stxa %g0 is issued to ASI_DCACHE_TAG at
 * (loc & ~0x1f) before and after the load, each with membar #Sync.
 */
static __inline__ u_int
lda(paddr_t loc, int asi)
{
register unsigned int _lda_v;
if (PHYS_ASI(asi)) {
/* %0 = tag address scratch, then result; %1 = scratch bound to loc */
__asm __volatile("wr %3,%%g0,%%asi; "
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
" lda [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) :
"r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: set %asi and load. */
__asm __volatile("wr %2,%%g0,%%asi; lda [%1]%%asi,%0" :
"=r" (_lda_v) :
"r" ((unsigned long)(loc)), "r" (asi));
}
return (_lda_v);
}
/*
 * ldswa -- load a signed int from alternate address space
 * (64-bit compiler).
 *
 * Same shape as the unsigned word load, but uses the ldswa instruction
 * and a signed result variable.  loc is the address, asi the address
 * space identifier (written to %asi).  Returns the word that was loaded.
 *
 * When PHYS_ASI(asi) is true, stxa %g0 is issued to ASI_DCACHE_TAG at
 * (loc & ~0x1f) before and after the load, each with membar #Sync.
 */
static __inline__ int
ldswa(paddr_t loc, int asi)
{
register int _lda_v;
if (PHYS_ASI(asi)) {
/* %0 = tag address scratch, then result; %1 = scratch bound to loc */
__asm __volatile("wr %3,%%g0,%%asi; "
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
" ldswa [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) :
"r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: set %asi and load. */
__asm __volatile("wr %2,%%g0,%%asi; ldswa [%1]%%asi,%0" :
"=r" (_lda_v) :
"r" ((unsigned long)(loc)), "r" (asi));
}
return (_lda_v);
}
#else /* __arch64__ */
/*
 * lda -- load an unsigned int from alternate address space
 * (32-bit compiler).
 *
 * The address reaches the asm as the low word of loc plus _loc_hi
 * (bits 63:32) and is rebuilt with sllx/or.  asi is written to %asi.
 * Returns the word that was loaded.
 *
 * When PHYS_ASI(asi) is true, %pstate is saved (rdpr), rewritten with
 * `wrpr %1,8' around the load and restored with `wrpr %1,0'
 * (presumably toggling PSTATE.AM -- confirm against the SPARC V9
 * manual), and stxa %g0 is issued to ASI_DCACHE_TAG at the
 * 32-byte-aligned low word of loc before and after the load.
 */
static __inline__ u_int
lda(paddr_t loc, int asi)
{
register unsigned int _lda_v, _loc_hi, _pstate;
_loc_hi = (((u_int64_t)loc)>>32);
if (PHYS_ASI(asi)) {
/* %0 = address scratch, then result; %1 = saved %pstate, then tag address */
__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;"
" andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; "
" sllx %3,32,%0; or %0,%2,%0; membar #Sync;lda [%0]%%asi,%0; "
" wrpr %1,0,%%pstate; andn %2,0x1f,%1; membar #Sync; "
" stxa %%g0,[%1] %5; membar #Sync" : "=&r" (_lda_v), "=&r" (_pstate) :
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: rebuild the address in %0 and load into %0. */
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
" or %0,%1,%0; lda [%0]%%asi,%0" : "=&r" (_lda_v) :
"r" ((unsigned long)(loc)),
"r" (_loc_hi), "r" (asi));
}
return (_lda_v);
}
/*
 * ldswa -- load a signed int from alternate address space
 * (32-bit compiler).
 *
 * The address reaches the asm as the low word of loc plus _loc_hi
 * (bits 63:32) and is rebuilt with sllx/or.  asi is written to %asi.
 * Returns the word that was loaded.
 *
 * When PHYS_ASI(asi) is true, %pstate is saved (rdpr), rewritten with
 * `wrpr %1,8' around the load and restored with `wrpr %1,0'
 * (presumably toggling PSTATE.AM -- confirm against the SPARC V9
 * manual), and stxa %g0 is issued to ASI_DCACHE_TAG at the
 * 32-byte-aligned low word of loc before and after the load.
 */
static __inline__ int
ldswa(paddr_t loc, int asi)
{
register int _lda_v, _loc_hi, _pstate;
_loc_hi = (((u_int64_t)loc)>>32);
if (PHYS_ASI(asi)) {
/* %0 = address scratch, then result; %1 = saved %pstate, then tag address */
__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;"
" andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; sllx %3,32,%0;"
" or %0,%2,%0; membar #Sync; ldswa [%0]%%asi,%0; wrpr %1,0,%%pstate; "
" andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" :
"=&r" (_lda_v), "=&r" (_pstate) :
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: rebuild the address in %0 and load into %0. */
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
" or %0,%1,%0; ldswa [%0]%%asi,%0" : "=&r" (_lda_v) :
"r" ((unsigned long)(loc)),
"r" (_loc_hi), "r" (asi));
}
return (_lda_v);
}
#endif /* __arch64__ */
#ifdef __arch64__
/*
 * ldda -- load 64-bit int from alternate address space using the ldda
 * instruction (64-bit compiler) -- these should never be used.
 *
 * loc is the address, asi the address space identifier (written to
 * %asi before the load).  Returns the value left in the result operand.
 *
 * When PHYS_ASI(asi) is true, stxa %g0 is issued to ASI_DCACHE_TAG at
 * (loc & ~0x1f) before and after the load, each with membar #Sync.
 */
static __inline__ u_int64_t
ldda(paddr_t loc, int asi)
{
register long long _lda_v;
if (PHYS_ASI(asi)) {
/* %0 = tag address scratch, then result; %1 = scratch bound to loc */
__asm __volatile("wr %3,%%g0,%%asi; "
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
" ldda [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=&r" (loc) :
"r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: set %asi and load. */
__asm __volatile("wr %2,%%g0,%%asi; ldda [%1]%%asi,%0" :
"=r" (_lda_v) :
"r" ((unsigned long)(loc)), "r" (asi));
}
return (_lda_v);
}
#else
/*
 * ldda -- load 64-bit int from alternate address space using the ldda
 * instruction (32-bit compiler).
 *
 * The address reaches the asm as the low word of loc plus _loc_hi
 * (bits 63:32) and is rebuilt with sllx/or.  asi is written to %asi.
 * Returns the value left in the result operand.
 *
 * When PHYS_ASI(asi) is true, %pstate is saved (rdpr), rewritten with
 * `wrpr %1,8' around the load and restored with `wrpr %1,0'
 * (presumably toggling PSTATE.AM -- confirm against the SPARC V9
 * manual), and stxa %g0 is issued to ASI_DCACHE_TAG at the
 * 32-byte-aligned low word of loc before and after the load.
 *
 * NOTE(review): `rdpr %pstate,%1' appears twice before %pstate is
 * modified; the second read looks redundant.
 */
static __inline__ u_int64_t
ldda(paddr_t loc, int asi)
{
register long long _lda_v, _loc_hi, _pstate;
_loc_hi = (((u_int64_t)loc)>>32);
if (PHYS_ASI(asi)) {
/* %0 = address scratch, then result; %1 = saved %pstate, then tag address */
__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;"
" andn %2,0x1f,%0; rdpr %%pstate,%1; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate;"
" sllx %3,32,%0; or %0,%2,%0; membar #Sync; ldda [%0]%%asi,%0; wrpr %1,0,%%pstate; "
" andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" :
"=&r" (_lda_v), "=&r" (_pstate) :
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: rebuild the address in %0 and load into %0. */
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; "
" or %0,%1,%0; ldda [%0]%%asi,%0" : "=&r" (_lda_v) :
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi));
}
return (_lda_v);
}
#endif
#ifdef __arch64__
/*
 * ldxa -- native load 64-bit int from alternate address space
 * w/64-bit compiler.
 *
 * loc is the address, asi the address space identifier (written to
 * %asi before the load).  Returns the 64-bit value that was loaded.
 *
 * When PHYS_ASI(asi) is true, stxa %g0 is issued to ASI_DCACHE_TAG at
 * (loc & ~0x1f) before and after the load, each with membar #Sync.
 */
static __inline__ u_int64_t
ldxa(paddr_t loc, int asi)
{
register unsigned long _lda_v;
if (PHYS_ASI(asi)) {
/* %0 = tag address scratch, then result; %1 = scratch bound to loc */
__asm __volatile("wr %3,%%g0,%%asi; "
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; "
" ldxa [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; "
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) :
"r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: set %asi and load. */
__asm __volatile("wr %2,%%g0,%%asi; ldxa [%1]%%asi,%0" :
"=r" (_lda_v) :
"r" ((unsigned long)(loc)), "r" (asi));
}
return (_lda_v);
}
#else
/*
 * ldxa -- native load 64-bit int from alternate address space
 * w/32-bit compiler.
 *
 * The address reaches the asm as the low word of loc plus _loc_hi
 * (bits 63:32) and is rebuilt with sllx/or.  asi is written to %asi.
 * The 64-bit result is loaded into one register and then split:
 * srlx moves the high word into _ldxa_hi and `srl %0,0,%0' leaves the
 * low word in _ldxa_lo; the two halves are glued together in C for
 * the return value.
 *
 * When PHYS_ASI(asi) is true, %pstate is saved (rdpr, using the
 * _ldxa_hi operand as scratch), rewritten with `wrpr %1,8' around the
 * load and restored with `wrpr %1,0' (presumably toggling PSTATE.AM --
 * confirm against the SPARC V9 manual), and stxa %g0 is issued to
 * ASI_DCACHE_TAG at the 32-byte-aligned low word of loc before and
 * after the load.
 */
static __inline__ u_int64_t
ldxa(paddr_t loc, int asi)
{
register unsigned long _ldxa_lo, _ldxa_hi, _loc_hi;
_loc_hi = (((u_int64_t)loc)>>32);
if (PHYS_ASI(asi)) {
/* %0 = address scratch, then 64-bit result, then low word; %1 = %pstate / tag scratch, then high word */
__asm __volatile("wr %4,%%g0,%%asi; "
" andn %2,0x1f,%0; rdpr %%pstate,%1; stxa %%g0,[%0] %5; "
" sllx %3,32,%0; wrpr %1,8,%%pstate; or %0,%2,%0; membar #Sync; ldxa [%0]%%asi,%0; "
" wrpr %1,0,%%pstate; andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync; "
" srlx %0,32,%1; srl %0,0,%0" :
"=&r" (_ldxa_lo), "=&r" (_ldxa_hi) :
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi), "n" (ASI_DCACHE_TAG));
} else {
/* Plain case: rebuild the address, load, then split the result. */
__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "
" or %0,%2,%0; ldxa [%0]%%asi,%0; srlx %0,32,%1; srl %0,0,%0;" :
"=&r" (_ldxa_lo), "=&r" (_ldxa_hi) :
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi));
}
return ((((int64_t)_ldxa_hi)<<32)|_ldxa_lo);
}
#endif
/* store byte to alternate address space */
#ifdef __arch64__
/*
 * stba -- store a byte to alternate address space (64-bit compiler).
 *
 * loc is the address, asi the address space identifier (written to
 * %asi before the store) and value the byte to store.
 *
 * When PHYS_ASI(asi) is true, the store is followed by an stxa %g0 to
 * ASI_DCACHE_TAG at (loc & ~0x1f), with membar #Sync before and after
 * it.
 *
 * Both asm statements carry a "memory" clobber, like the other store
 * routines in this file, so the compiler does not cache or reorder
 * ordinary memory accesses across the store.
 */
static __inline__ void
stba(paddr_t loc, int asi, u_char value)
{
	if (PHYS_ASI(asi)) {
		/* %0 = scratch for the tag address, bound to loc */
		__asm __volatile("wr %3,%%g0,%%asi; stba %1,[%2]%%asi;"
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :
		    "=&r" (loc) :
		    "r" ((int)(value)), "r" ((unsigned long)(loc)),
		    "r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
	} else {
		/* Plain case: set %asi and store. */
		__asm __volatile("wr %2,%%g0,%%asi; stba %0,[%1]%%asi" : :
		    "r" ((int)(value)), "r" ((unsigned long)(loc)),
		    "r" (asi) : "memory");
	}
}
#else
/*
 * stba -- store a byte to alternate address space (32-bit compiler).
 *
 * The address reaches the asm as the low word of loc plus _loc_hi
 * (bits 63:32) and is rebuilt with sllx/or.  asi is written to %asi
 * and value is the byte to store.
 *
 * When PHYS_ASI(asi) is true, %pstate is saved (rdpr), rewritten with
 * `wrpr %1,8' around the store and restored with `wrpr %1,0'
 * (presumably toggling PSTATE.AM -- confirm against the SPARC V9
 * manual); afterwards stxa %g0 is issued to ASI_DCACHE_TAG at the
 * 32-byte-aligned address, with membar #Sync before and after it.
 *
 * Both asm statements carry a "memory" clobber, like the other store
 * routines in this file, so the compiler does not cache or reorder
 * ordinary memory accesses across the store.
 */
static __inline__ void
stba(paddr_t loc, int asi, u_char value)
{
	register int _loc_hi, _pstate;

	_loc_hi = (((u_int64_t)loc)>>32);
	if (PHYS_ASI(asi)) {
		/* %0 = full 64-bit address; %1 = saved %pstate, then tag address */
		__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;"
" or %3,%0,%0; wrpr %1,8,%%pstate; stba %2,[%0]%%asi; wrpr %1,0,%%pstate; "
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %6; membar #Sync" :
		    "=&r" (_loc_hi), "=&r" (_pstate) :
		    "r" ((int)(value)), "r" ((unsigned long)(loc)),
		    "r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
	} else {
		/* Plain case: rebuild the address in %0 and store. */
		__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "
" or %2,%0,%0; stba %1,[%0]%%asi" : "=&r" (_loc_hi) :
		    "r" ((int)(value)), "r" ((unsigned long)(loc)),
		    "r" (_loc_hi), "r" (asi) : "memory");
	}
}
#endif
/* store half-word to alternate address space */
#ifdef __arch64__
/*
 * stha -- store a half-word to alternate address space
 * (64-bit compiler).
 *
 * loc is the address, asi the address space identifier (written to
 * %asi before the store) and value the half-word to store.
 *
 * When PHYS_ASI(asi) is true, the store is followed by an stxa %g0 to
 * ASI_DCACHE_TAG at (loc & ~0x1f), with membar #Sync before and after.
 * The "memory" clobber tells the compiler that memory is modified.
 */
static __inline__ void
stha(paddr_t loc, int asi, u_short value)
{
if (PHYS_ASI(asi)) {
/* %0 = scratch for the tag address, bound to loc */
__asm __volatile("wr %3,%%g0,%%asi; stha %1,[%2]%%asi;"
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :
"=&r" (loc) :
"r" ((int)(value)), "r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
} else {
/* Plain case: set %asi and store. */
__asm __volatile("wr %2,%%g0,%%asi; stha %0,[%1]%%asi" : :
"r" ((int)(value)), "r" ((unsigned long)(loc)),
"r" (asi) : "memory");
}
}
#else
/*
 * stha -- store a half-word to alternate address space
 * (32-bit compiler).
 *
 * The address reaches the asm as the low word of loc plus _loc_hi
 * (bits 63:32) and is rebuilt with sllx/or.  asi is written to %asi
 * and value is the half-word to store.
 *
 * When PHYS_ASI(asi) is true, %pstate is saved (rdpr), rewritten with
 * `wrpr %1,8' around the store and restored with `wrpr %1,0'
 * (presumably toggling PSTATE.AM -- confirm against the SPARC V9
 * manual); afterwards stxa %g0 is issued to ASI_DCACHE_TAG at the
 * 32-byte-aligned address, with membar #Sync before and after it.
 */
static __inline__ void
stha(paddr_t loc, int asi, u_short value)
{
register int _loc_hi, _pstate;
_loc_hi = (((u_int64_t)loc)>>32);
if (PHYS_ASI(asi)) {
/* %0 = full 64-bit address; %1 = saved %pstate, then tag address */
__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;"
" or %3,%0,%0; wrpr %1,8,%%pstate; stha %2,[%0]%%asi; wrpr %1,0,%%pstate; "
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %6; membar #Sync" :
"=&r" (_loc_hi), "=&r" (_pstate) :
"r" ((int)(value)), "r" ((unsigned long)(loc)),
"r" (_loc_hi), "r" (asi),
"n" (ASI_DCACHE_TAG) : "memory");
} else {
/* Plain case: rebuild the address in %0 and store. */
__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "
" or %2,%0,%0; stha %1,[%0]%%asi" : "=&r" (_loc_hi) :
"r" ((int)(value)), "r" ((unsigned long)(loc)),
"r" (_loc_hi), "r" (asi) : "memory");
}
}
#endif
/* store int to alternate address space */
#ifdef __arch64__
/*
 * sta -- store an int to alternate address space (64-bit compiler).
 *
 * loc is the address, asi the address space identifier (written to
 * %asi before the store) and value the word to store.
 *
 * When PHYS_ASI(asi) is true, the store is followed by an stxa %g0 to
 * ASI_DCACHE_TAG at (loc & ~0x1f), with membar #Sync before and after.
 * The "memory" clobber tells the compiler that memory is modified.
 */
static __inline__ void
sta(paddr_t loc, int asi, u_int value)
{
if (PHYS_ASI(asi)) {
/* %0 = scratch for the tag address, bound to loc */
__asm __volatile("wr %3,%%g0,%%asi; sta %1,[%2]%%asi;"
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :
"=&r" (loc) :
"r" ((int)(value)), "r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
} else {
/* Plain case: set %asi and store. */
__asm __volatile("wr %2,%%g0,%%asi; sta %0,[%1]%%asi" : :
"r" ((int)(value)), "r" ((unsigned long)(loc)),
"r" (asi) : "memory");
}
}
#else
/*
 * sta -- store an int to alternate address space (32-bit compiler).
 *
 * The address reaches the asm as the low word of loc plus _loc_hi
 * (bits 63:32) and is rebuilt with sllx/or.  asi is written to %asi
 * and value is the word to store.
 *
 * When PHYS_ASI(asi) is true, %pstate is saved (rdpr), rewritten with
 * `wrpr %1,8' around the store and restored with `wrpr %1,0'
 * (presumably toggling PSTATE.AM -- confirm against the SPARC V9
 * manual); afterwards stxa %g0 is issued to ASI_DCACHE_TAG at the
 * 32-byte-aligned address, with membar #Sync before and after it.
 */
static __inline__ void
sta(paddr_t loc, int asi, u_int value)
{
register int _loc_hi, _pstate;
_loc_hi = (((u_int64_t)loc)>>32);
if (PHYS_ASI(asi)) {
/* %0 = full 64-bit address; %1 = saved %pstate, then tag address */
__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;"
" or %3,%0,%0; wrpr %1,8,%%pstate; sta %2,[%0]%%asi; wrpr %1,0,%%pstate; "
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %6; membar #Sync" :
"=&r" (_loc_hi), "=&r" (_pstate) :
"r" ((int)(value)), "r" ((unsigned long)(loc)),
"r" (_loc_hi), "r" (asi),
"n" (ASI_DCACHE_TAG) : "memory");
} else {
/* Plain case: rebuild the address in %0 and store. */
__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "
" or %2,%0,%0; sta %1,[%0]%%asi" : "=&r" (_loc_hi) :
"r" ((int)(value)), "r" ((unsigned long)(loc)),
"r" (_loc_hi), "r" (asi) : "memory");
}
}
#endif
/* store 64-bit int to alternate address space */
#ifdef __arch64__
/*
 * stda -- store a 64-bit int to alternate address space using the stda
 * instruction (64-bit compiler).
 *
 * loc is the address, asi the address space identifier (written to
 * %asi before the store) and value the data to store.
 *
 * When PHYS_ASI(asi) is true, the store is followed by an stxa %g0 to
 * ASI_DCACHE_TAG at (loc & ~0x1f), with membar #Sync before and after.
 * The "memory" clobber tells the compiler that memory is modified.
 */
static __inline__ void
stda(paddr_t loc, int asi, u_int64_t value)
{
if (PHYS_ASI(asi)) {
/* %0 = scratch for the tag address, bound to loc */
__asm __volatile("wr %3,%%g0,%%asi; stda %1,[%2]%%asi;"
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :
"=&r" (loc) :
"r" ((long long)(value)), "r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
} else {
/* Plain case: set %asi and store. */
__asm __volatile("wr %2,%%g0,%%asi; stda %0,[%1]%%asi" : :
"r" ((long long)(value)), "r" ((unsigned long)(loc)),
"r" (asi) : "memory");
}
}
#else
/*
 * stda -- store a 64-bit int to alternate address space using the stda
 * instruction (32-bit compiler).
 *
 * The address reaches the asm as the low word of loc plus _loc_hi
 * (bits 63:32) and is rebuilt with sllx/or.  asi is written to %asi
 * and value is the data to store.
 *
 * When PHYS_ASI(asi) is true, %pstate is saved (rdpr), rewritten with
 * `wrpr %1,8' around the store and restored with `wrpr %1,0'
 * (presumably toggling PSTATE.AM -- confirm against the SPARC V9
 * manual); afterwards stxa %g0 is issued to ASI_DCACHE_TAG at the
 * 32-byte-aligned address, with membar #Sync before and after it.
 */
static __inline__ void
stda(paddr_t loc, int asi, u_int64_t value)
{
register int _loc_hi, _pstate;
_loc_hi = (((u_int64_t)loc)>>32);
if (PHYS_ASI(asi)) {
/* %0 = full 64-bit address; %1 = saved %pstate, then tag address */
__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1; "
" or %3,%0,%0; wrpr %1,8,%%pstate; stda %2,[%0]%%asi; wrpr %1,0,%%pstate;"
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %6; membar #Sync" :
"=&r" (_loc_hi), "=&r" (_pstate) :
"r" ((long long)(value)), "r" ((unsigned long)(loc)),
"r" (_loc_hi), "r" (asi),
"n" (ASI_DCACHE_TAG) : "memory");
} else {
/* Plain case: rebuild the address in %0 and store. */
__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; "
" or %2,%0,%0; stda %1,[%0]%%asi" :
"=&r" (_loc_hi) :
"r" ((long long)(value)), "r" ((unsigned long)(loc)),
"r" (_loc_hi), "r" (asi) : "memory");
}
}
#endif
#ifdef __arch64__
/*
 * stxa (64-bit compiler variant): native 64-bit store of `value' to
 * address `loc' in alternate address space `asi'.
 *
 * When PHYS_ASI(asi) is true the store is followed by a write of zero to
 * ASI_DCACHE_TAG at (loc & ~0x1f), fenced with membar #Sync on both sides.
 * NOTE(review): the scratch output operand here is `asi' (an int), whereas
 * the sibling store routines use `loc'; it only serves as a temporary for
 * the aligned address and `asi' is not read again afterwards.
 */
static __inline__ void
stxa(paddr_t loc, int asi, u_int64_t value)
{
if (PHYS_ASI(asi)) {
__asm __volatile("wr %3,%%g0,%%asi; stxa %1,[%2]%%asi;"
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" :
"=&r" (asi) :
"r" ((unsigned long)(value)),
"r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
} else {
/* Other ASIs: plain store through %asi. */
__asm __volatile("wr %2,%%g0,%%asi; stxa %0,[%1]%%asi" : :
"r" ((unsigned long)(value)),
"r" ((unsigned long)(loc)), "r" (asi) : "memory");
}
}
#else
/*
 * stxa (32-bit compiler variant): native 64-bit store of `value' to
 * address `loc' in alternate address space `asi'.
 *
 * Both the value and the address are split into 32-bit halves in C and
 * glued back together inside the asm (hi << 32 | lo) before the single
 * `stxa' instruction.
 * NOTE(review): the PHYS_ASI arm uses a cast expression, (int)(_stxa_lo),
 * as an asm output operand; that relies on a compiler accepting casts as
 * lvalues -- confirm against the compiler in use.
 */
static __inline__ void
stxa(paddr_t loc, int asi, u_int64_t value)
{
int _stxa_lo, _stxa_hi, _loc_hi;
/* Split value and address into 32-bit halves. */
_stxa_lo = value;
_stxa_hi = ((u_int64_t)value)>>32;
_loc_hi = (((u_int64_t)(u_long)loc)>>32);
if (PHYS_ASI(asi)) {
/*
 * %0 = rebuilt address, %1 = rebuilt value, %2 = saved %pstate.
 * "wrpr %2,8" writes %pstate XOR 8 around the store and "wrpr %2,0"
 * restores it; afterwards zero is written to ASI_DCACHE_TAG at the
 * 32-byte-aligned address, with membar #Sync before and after.
 */
__asm __volatile("wr %7,%%g0,%%asi; sllx %4,32,%1; sllx %6,32,%0; "
" or %1,%3,%1; rdpr %%pstate,%2; or %0,%5,%0; wrpr %2,8,%%pstate; "
" stxa %1,[%0]%%asi; wrpr %2,0,%%pstate; "
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %8; membar #Sync" :
"=&r" (_loc_hi), "=&r" (_stxa_hi),
"=&r" ((int)(_stxa_lo)) :
"r" ((int)(_stxa_lo)), "r" ((int)(_stxa_hi)),
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
} else {
/* Other ASIs: rebuild address and value, then store. */
__asm __volatile("wr %6,%%g0,%%asi; sllx %3,32,%1; sllx %5,32,%0; "
" or %1,%2,%1; or %0,%4,%0; stxa %1,[%0]%%asi" :
"=&r" (_loc_hi), "=&r" (_stxa_hi) :
"r" ((int)(_stxa_lo)), "r" ((int)(_stxa_hi)),
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi) : "memory");
}
}
#endif
#ifdef __arch64__
/*
 * casxa (64-bit compiler variant): 64-bit compare-and-swap at address
 * `loc' in alternate address space `asi'.
 *
 * `oldvalue' is the comparison operand and `value' the swap operand of the
 * `casxa' instruction; `value' is an in/out ("+r") operand, and whatever
 * the instruction leaves in that register is returned.
 * When PHYS_ASI(asi) is true the operation is followed by a write of zero
 * to ASI_DCACHE_TAG at (loc & ~0x1f), fenced with membar #Sync.
 */
static __inline__ u_int64_t
casxa(paddr_t loc, int asi, u_int64_t value, u_int64_t oldvalue)
{
if (PHYS_ASI(asi)) {
/* `loc' (by-value parameter) is reused as scratch for the aligned address. */
__asm __volatile("wr %4,%%g0,%%asi; casxa [%3]%%asi,%2,%1;"
" andn %3,0x1f,%0; membar #Sync; stxa %%g0,[%0] %5; membar #Sync" :
"=&r" (loc), "+r" (value) :
"r" ((unsigned long)(oldvalue)),
"r" ((unsigned long)(loc)),
"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
} else {
/* Other ASIs: compare-and-swap only. */
__asm __volatile("wr %3,%%g0,%%asi; casxa [%1]%%asi,%2,%0" :
"+r" (value) :
"r" ((unsigned long)(loc)), "r" (oldvalue), "r" (asi) :
"memory");
}
return (value);
}
#else
/*
 * casxa (32-bit compiler variant): 64-bit compare-and-swap at address
 * `loc' in alternate address space `asi'.
 *
 * `oldvalue' is the comparison operand and `value' the swap operand of the
 * `casxa' instruction.  Address, swap value and comparison value are each
 * split into 32-bit halves in C and glued back together (hi << 32 | lo)
 * inside the asm; the 64-bit result left in the swap register is split
 * again and returned.
 *
 * Operand map, PHYS_ASI arm:
 *   %0 address (out)        %1 swap hi -> swap/result (in/out)
 *   %2 swap lo, then saved %pstate, then result lo (in/out)
 *   %3 compare hi -> compare value, then scratch (in/out)
 *   %4 loc  %5 _loc_hi  %6 compare lo  %7 asi  %8 ASI_DCACHE_TAG
 * Operand map, other arm:
 *   %0 address (out)        %1 swap hi -> swap/result (in/out)
 *   %2 swap lo, then compare value, then result lo (in/out)
 *   %3 compare hi  %4 compare lo  %5 loc  %6 _loc_hi  %7 asi
 *
 * In/out operands are marked early-clobber because they are written
 * before the last input is consumed.
 *
 * NOTE(review): like the other 32-bit variants, the halves are OR-ed
 * together assuming the upper 32 bits of the registers holding the low
 * words are zero -- confirm for the ABI in use.
 * NOTE(review): the PHYS_ASI arm has many asm operands; older GCC
 * releases limit the operand count -- confirm it builds with the target
 * compiler.
 */
static __inline__ u_int64_t
casxa(paddr_t loc, int asi, u_int64_t value, u_int64_t oldvalue)
{
int _casxa_lo, _casxa_hi, _loc_hi, _oval_hi;
_casxa_lo = value;
_casxa_hi = ((u_int64_t)value)>>32;
_oval_hi = ((u_int64_t)oldvalue)>>32;
_loc_hi = (((u_int64_t)(u_long)loc)>>32);
if (PHYS_ASI(asi)) {
/*
 * "wrpr %2,8" writes %pstate XOR 8 around the access and "wrpr %2,0"
 * restores it; afterwards zero is written to ASI_DCACHE_TAG at the
 * 32-byte-aligned address, with membar #Sync before and after.
 */
__asm __volatile("wr %7,%%g0,%%asi; sllx %1,32,%1; sllx %5,32,%0; "
" sllx %3,32,%3; or %1,%2,%1; rdpr %%pstate,%2; or %0,%4,%0; or %3,%6,%3; "
" wrpr %2,8,%%pstate; casxa [%0]%%asi,%3,%1; wrpr %2,0,%%pstate; "
" andn %0,0x1f,%3; membar #Sync; stxa %%g0,[%3] %8; membar #Sync; "
" sll %1,0,%2; srax %1,32,%1 " :
"=&r" (_loc_hi), "+&r" (_casxa_hi),
"+&r" (_casxa_lo), "+&r" (_oval_hi) :
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" ((unsigned int)(oldvalue)),
"r" (asi), "n" (ASI_DCACHE_TAG) : "memory");
} else {
__asm __volatile("wr %7,%%g0,%%asi; sllx %1,32,%1; sllx %6,32,%0; "
" or %1,%2,%1; sllx %3,32,%2; or %0,%5,%0; or %2,%4,%2; "
" casxa [%0]%%asi,%2,%1; sll %1,0,%2; srax %1,32,%1 " :
"=&r" (_loc_hi), "+&r" (_casxa_hi), "+&r" (_casxa_lo) :
"r" ((int)(_oval_hi)), "r" ((int)(oldvalue)),
"r" ((unsigned long)(loc)), "r" (_loc_hi),
"r" (asi) : "memory");
}
/* Reassemble the 64-bit result without sign-extending either half. */
return ((((u_int64_t)(u_int)_casxa_hi)<<32)|(u_int)_casxa_lo);
}
#endif
#if 0
#ifdef __arch64__
/*
 * lduba(loc, asi) -- 64-bit compiler variant, disabled by the enclosing
 * #if 0.  Load an unsigned byte from address `loc' in alternate address
 * space `asi'; the loaded value is the value of the statement expression.
 *
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (loc & ~0x1f) both before and after the load, with membar #Sync.
 * NOTE(review): that arm lists `loc' as an asm output, so the caller's
 * `loc' must be an lvalue and is overwritten with the aligned address.
 */
#define lduba(loc, asi) ({ \
register unsigned int _lduba_v; \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; " \
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
" lduba [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
" stxa %%g0,[%1] %4; membar #Sync" : \
"=&r" (_lduba_v), "=r" (loc): \
"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; lduba [%1]%%asi,%0" : \
"=r" (_lduba_v) : \
"r" ((unsigned long)(loc)), "r" (asi)); \
} \
_lduba_v; \
})
#else
/*
 * lduba(loc, asi) -- 32-bit compiler variant, disabled by the enclosing
 * #if 0.  Load an unsigned byte from address `loc' in alternate address
 * space `asi'; the loaded value is the value of the statement expression.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc.
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (low word of loc & ~0x1f) before and after the load, and the load runs
 * with %pstate XOR 8 ("wrpr %1,8"), restored by "wrpr %1,0".
 */
#define lduba(loc, asi) ({ \
register unsigned int _lduba_v, _loc_hi, _pstate; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %4,%%g0,%%asi; " \
" andn %2,0x1f,%0; stxa %%g0,[%0] %5; rdpr %%pstate,%1; " \
" sllx %3,32,%0; or %0,%2,%0; wrpr %1,8,%%pstate; " \
" membar #Sync; lduba [%0]%%asi,%0; wrpr %1,0,%%pstate; " \
" andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" : \
"=&r" (_lduba_v), "=&r" (_pstate) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
" or %0,%1,%0; lduba [%0]%%asi,%0" : "=&r" (_lduba_v) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
} \
_lduba_v; \
})
#endif
#ifdef __arch64__
/*
 * lduha(loc, asi) -- 64-bit compiler variant, disabled by the enclosing
 * #if 0.  Load an unsigned half-word from address `loc' in alternate
 * address space `asi'; the loaded value is the value of the statement
 * expression.
 *
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (loc & ~0x1f) both before and after the load, with membar #Sync.
 * NOTE(review): that arm lists `loc' as an asm output, so the caller's
 * `loc' must be an lvalue and is overwritten with the aligned address.
 */
#define lduha(loc, asi) ({ \
register unsigned int _lduha_v; \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; " \
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
" lduha [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lduha_v), "=r" (loc) : \
"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; lduha [%1]%%asi,%0" : "=r" (_lduha_v) : \
"r" ((unsigned long)(loc)), "r" (asi)); \
} \
_lduha_v; \
})
#else
/*
 * lduha(loc, asi) -- 32-bit compiler variant, disabled by the enclosing
 * #if 0.  Load an unsigned half-word from address `loc' in alternate
 * address space `asi'; the loaded value is the value of the statement
 * expression.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc.
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (low word of loc & ~0x1f) before and after the load, and the load runs
 * with %pstate XOR 8 ("wrpr %1,8"), restored by "wrpr %1,0".
 */
#define lduha(loc, asi) ({ \
register unsigned int _lduha_v, _loc_hi, _pstate; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1; " \
" andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; sllx %3,32,%0; " \
" or %0,%2,%0; membar #Sync; lduha [%0]%%asi,%0; wrpr %1,0,%%pstate; " \
" andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" : \
"=&r" (_lduha_v), "=&r" (_pstate) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
" or %0,%1,%0; lduha [%0]%%asi,%0" : "=&r" (_lduha_v) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
} \
_lduha_v; \
})
#endif
#ifdef __arch64__
/*
 * lda(loc, asi) -- 64-bit compiler variant, disabled by the enclosing
 * #if 0.  Load an unsigned 32-bit int from address `loc' in alternate
 * address space `asi'; the loaded value is the value of the statement
 * expression.
 *
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (loc & ~0x1f) both before and after the load, with membar #Sync.
 * NOTE(review): that arm lists `loc' as an asm output, so the caller's
 * `loc' must be an lvalue and is overwritten with the aligned address.
 */
#define lda(loc, asi) ({ \
register unsigned int _lda_v; \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; " \
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
" lda [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) : \
"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; lda [%1]%%asi,%0" : "=r" (_lda_v) : \
"r" ((unsigned long)(loc)), "r" (asi)); \
} \
_lda_v; \
})
/*
 * ldswa(loc, asi) -- 64-bit compiler variant, disabled by the enclosing
 * #if 0.  Load a signed 32-bit int (`ldswa') from address `loc' in
 * alternate address space `asi'; the loaded value is the value of the
 * statement expression.
 *
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (loc & ~0x1f) both before and after the load, with membar #Sync.
 * NOTE(review): that arm lists `loc' as an asm output, so the caller's
 * `loc' must be an lvalue and is overwritten with the aligned address.
 */
#define ldswa(loc, asi) ({ \
register int _lda_v; \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; " \
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
" ldswa [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) : \
"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; ldswa [%1]%%asi,%0" : "=r" (_lda_v) : \
"r" ((unsigned long)(loc)), "r" (asi)); \
} \
_lda_v; \
})
#else /* __arch64__ */
/*
 * lda(loc, asi) -- 32-bit compiler variant, disabled by the enclosing
 * #if 0.  Load an unsigned 32-bit int from address `loc' in alternate
 * address space `asi'; the loaded value is the value of the statement
 * expression.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc.
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (low word of loc & ~0x1f) before and after the load, and the load runs
 * with %pstate XOR 8 ("wrpr %1,8"), restored by "wrpr %1,0".
 */
#define lda(loc, asi) ({ \
register unsigned int _lda_v, _loc_hi, _pstate; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;" \
" andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; " \
" sllx %3,32,%0; or %0,%2,%0; membar #Sync;lda [%0]%%asi,%0; " \
" wrpr %1,0,%%pstate; andn %2,0x1f,%1; membar #Sync; " \
" stxa %%g0,[%1] %5; membar #Sync" : "=&r" (_lda_v), "=&r" (_pstate) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
" or %0,%1,%0; lda [%0]%%asi,%0" : "=&r" (_lda_v) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
} \
_lda_v; \
})
/*
 * ldswa(loc, asi) -- 32-bit compiler variant, disabled by the enclosing
 * #if 0.  Load a signed 32-bit int (`ldswa') from address `loc' in
 * alternate address space `asi'; the loaded value is the value of the
 * statement expression.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc.
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (low word of loc & ~0x1f) before and after the load, and the load runs
 * with %pstate XOR 8 ("wrpr %1,8"), restored by "wrpr %1,0".
 */
#define ldswa(loc, asi) ({ \
register int _lda_v, _loc_hi, _pstate; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;" \
" andn %2,0x1f,%0; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate; sllx %3,32,%0;" \
" or %0,%2,%0; membar #Sync; ldswa [%0]%%asi,%0; wrpr %1,0,%%pstate; " \
" andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" : \
"=&r" (_lda_v), "=&r" (_pstate) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
" or %0,%1,%0; ldswa [%0]%%asi,%0" : "=&r" (_lda_v) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
} \
_lda_v; \
})
#endif /* __arch64__ */
#ifdef __arch64__
/*
 * ldda(loc, asi) -- 64-bit compiler variant, disabled by the enclosing
 * #if 0; the original note says these should never be used.  Issues an
 * `ldda' from address `loc' in alternate address space `asi' into a
 * long long, which is the value of the statement expression.
 *
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (loc & ~0x1f) both before and after the load, with membar #Sync.
 * NOTE(review): that arm lists `loc' as an asm output, so the caller's
 * `loc' must be an lvalue and is overwritten with the aligned address.
 */
#define ldda(loc, asi) ({ \
register long long _lda_v; \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; " \
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
" ldda [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=&r" (loc) : \
"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; ldda [%1]%%asi,%0" : "=r" (_lda_v) : \
"r" ((unsigned long)(loc)), "r" (asi)); \
} \
_lda_v; \
})
#else
/*
 * ldda(loc, asi) -- 32-bit compiler variant, disabled by the enclosing
 * #if 0.  Issues an `ldda' from address `loc' in alternate address space
 * `asi' into a long long, which is the value of the statement expression.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc.
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (low word of loc & ~0x1f) before and after the load, and the load runs
 * with %pstate XOR 8 ("wrpr %1,8"), restored by "wrpr %1,0".
 * NOTE(review): %pstate is read twice in a row in that arm (the second
 * "rdpr" is redundant), and _loc_hi/_pstate are declared long long here
 * while the sibling macros use int.
 */
#define ldda(loc, asi) ({ \
register long long _lda_v, _loc_hi, _pstate; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %4,%%g0,%%asi; rdpr %%pstate,%1;" \
" andn %2,0x1f,%0; rdpr %%pstate,%1; stxa %%g0,[%0] %5; wrpr %1,8,%%pstate;" \
" sllx %3,32,%0; or %0,%2,%0; membar #Sync; ldda [%0]%%asi,%0; wrpr %1,0,%%pstate; " \
" andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync" : \
"=&r" (_lda_v), "=&r" (_pstate) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %3,%%g0,%%asi; sllx %2,32,%0; " \
" or %0,%1,%0; ldda [%0]%%asi,%0" : "=&r" (_lda_v) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
} \
_lda_v; \
})
#endif
#ifdef __arch64__
/*
 * ldxa(loc, asi) -- 64-bit compiler variant, disabled by the enclosing
 * #if 0.  Native 64-bit load from address `loc' in alternate address
 * space `asi'; the loaded value is the value of the statement expression.
 *
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (loc & ~0x1f) both before and after the load, with membar #Sync.
 * NOTE(review): that arm lists `loc' as an asm output, so the caller's
 * `loc' must be an lvalue and is overwritten with the aligned address.
 */
#define ldxa(loc, asi) ({ \
register unsigned long _lda_v; \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; "\
" andn %2,0x1f,%0; stxa %%g0,[%0] %4; membar #Sync; " \
" ldxa [%2]%%asi,%0; andn %2,0x1f,%1; membar #Sync; " \
" stxa %%g0,[%1] %4; membar #Sync" : "=&r" (_lda_v), "=r" (loc) : \
"r" ((unsigned long)(loc)), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; ldxa [%1]%%asi,%0" : "=r" (_lda_v) : \
"r" ((unsigned long)(loc)), "r" (asi)); \
} \
_lda_v; \
})
#else
/*
 * ldxa(loc, asi) -- 32-bit compiler variant, disabled by the enclosing
 * #if 0.  Native 64-bit load from address `loc' in alternate address
 * space `asi'.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc; the
 * 64-bit result is split inside the asm into _ldxa_hi (srlx 32) and
 * _ldxa_lo (srl 0) and recombined in C as the value of the statement
 * expression.
 * When PHYS_ASI(asi) is true, zero is written to ASI_DCACHE_TAG at
 * (low word of loc & ~0x1f) before and after the load, and the load runs
 * with %pstate XOR 8 ("wrpr %1,8"), restored by "wrpr %1,0"; _ldxa_hi
 * doubles as the saved-%pstate register until the final split.
 */
#define ldxa(loc, asi) ({ \
register unsigned long _ldxa_lo, _ldxa_hi, _loc_hi; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %4,%%g0,%%asi; " \
" andn %2,0x1f,%0; rdpr %%pstate,%1; stxa %%g0,[%0] %5; " \
" sllx %3,32,%0; wrpr %1,8,%%pstate; or %0,%2,%0; membar #Sync; ldxa [%0]%%asi,%0; " \
" wrpr %1,0,%%pstate; andn %2,0x1f,%1; membar #Sync; stxa %%g0,[%1] %5; membar #Sync; " \
" srlx %0,32,%1; srl %0,0,%0" : \
"=&r" (_ldxa_lo), "=&r" (_ldxa_hi) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
" or %0,%2,%0; ldxa [%0]%%asi,%0; srlx %0,32,%1; srl %0,0,%0;" : \
"=&r" (_ldxa_lo), "=&r" (_ldxa_hi) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
} \
((((int64_t)_ldxa_hi)<<32)|_ldxa_lo); \
})
#endif
/* store byte to alternate address space */
#ifdef __arch64__
/*
 * stba(loc, asi, value) -- 64-bit compiler variant, disabled by the
 * enclosing #if 0.  Store the low byte of `value' at address `loc' in
 * alternate address space `asi'.
 *
 * When PHYS_ASI(asi) is true the store is followed by a write of zero to
 * ASI_DCACHE_TAG at (loc & ~0x1f), fenced with membar #Sync.
 * NOTE(review): that arm lists `loc' as an asm output, so the caller's
 * `loc' must be an lvalue and is overwritten with the aligned address.
 */
#define stba(loc, asi, value) ({ \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; stba %1,[%2]%%asi;" \
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; stba %0,[%1]%%asi" : : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
} \
})
#else
/*
 * stba(loc, asi, value) -- 32-bit compiler variant, disabled by the
 * enclosing #if 0.  Store the low byte of `value' at address `loc' in
 * alternate address space `asi'.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc.
 * When PHYS_ASI(asi) is true the store runs with %pstate XOR 8
 * ("wrpr %1,8"), restored by "wrpr %1,0", and is followed by a write of
 * zero to ASI_DCACHE_TAG at the 32-byte-aligned address.
 */
#define stba(loc, asi, value) ({ \
register int _loc_hi, _pstate; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;" \
" or %3,%0,%0; wrpr %1,8,%%pstate; stba %2,[%0]%%asi; wrpr %1,0,%%pstate; " \
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %6; membar #Sync" : \
"=&r" (_loc_hi), "=&r" (_pstate) : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), \
"r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
" or %2,%0,%0; stba %1,[%0]%%asi" : "=&r" (_loc_hi) : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), \
"r" (_loc_hi), "r" (asi)); \
} \
})
#endif
/* store half-word to alternate address space */
#ifdef __arch64__
/*
 * stha(loc, asi, value) -- 64-bit compiler variant, disabled by the
 * enclosing #if 0.  Store the low half-word of `value' at address `loc'
 * in alternate address space `asi'.
 *
 * When PHYS_ASI(asi) is true the store is followed by a write of zero to
 * ASI_DCACHE_TAG at (loc & ~0x1f), fenced with membar #Sync.
 * NOTE(review): that arm lists `loc' as an asm output, so the caller's
 * `loc' must be an lvalue and is overwritten with the aligned address.
 */
#define stha(loc, asi, value) ({ \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; stha %1,[%2]%%asi;" \
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; stha %0,[%1]%%asi" : : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
} \
})
#else
/*
 * stha(loc, asi, value) -- 32-bit compiler variant, disabled by the
 * enclosing #if 0.  Store the low half-word of `value' at address `loc'
 * in alternate address space `asi'.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc.
 * When PHYS_ASI(asi) is true the store runs with %pstate XOR 8
 * ("wrpr %1,8"), restored by "wrpr %1,0", and is followed by a write of
 * zero to ASI_DCACHE_TAG at the 32-byte-aligned address.
 */
#define stha(loc, asi, value) ({ \
register int _loc_hi, _pstate; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;" \
" or %3,%0,%0; wrpr %1,8,%%pstate; stha %2,[%0]%%asi; wrpr %1,0,%%pstate; " \
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %6; membar #Sync" : \
"=&r" (_loc_hi), "=&r" (_pstate) : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), \
"r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
" or %2,%0,%0; stha %1,[%0]%%asi" : "=&r" (_loc_hi) : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), \
"r" (_loc_hi), "r" (asi)); \
} \
})
#endif
/* store int to alternate address space */
#ifdef __arch64__
/*
 * sta(loc, asi, value) -- 64-bit compiler variant, disabled by the
 * enclosing #if 0.  Store the 32-bit `value' at address `loc' in
 * alternate address space `asi'.
 *
 * When PHYS_ASI(asi) is true the store is followed by a write of zero to
 * ASI_DCACHE_TAG at (loc & ~0x1f), fenced with membar #Sync.
 * NOTE(review): that arm lists `loc' as an asm output, so the caller's
 * `loc' must be an lvalue and is overwritten with the aligned address.
 */
#define sta(loc, asi, value) ({ \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; sta %1,[%2]%%asi;" \
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; sta %0,[%1]%%asi" : : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
} \
})
#else
/*
 * sta(loc, asi, value) -- 32-bit compiler variant, disabled by the
 * enclosing #if 0.  Store the 32-bit `value' at address `loc' in
 * alternate address space `asi'.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc.
 * When PHYS_ASI(asi) is true the store runs with %pstate XOR 8
 * ("wrpr %1,8"), restored by "wrpr %1,0", and is followed by a write of
 * zero to ASI_DCACHE_TAG at the 32-byte-aligned address.
 */
#define sta(loc, asi, value) ({ \
register int _loc_hi, _pstate; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1;" \
" or %3,%0,%0; wrpr %1,8,%%pstate; sta %2,[%0]%%asi; wrpr %1,0,%%pstate; " \
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %6; membar #Sync" : \
"=&r" (_loc_hi), "=&r" (_pstate) : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), \
"r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
" or %2,%0,%0; sta %1,[%0]%%asi" : "=&r" (_loc_hi) : \
"r" ((int)(value)), "r" ((unsigned long)(loc)), \
"r" (_loc_hi), "r" (asi)); \
} \
})
#endif
/* store 64-bit int to alternate address space */
#ifdef __arch64__
/*
 * stda(loc, asi, value) -- 64-bit compiler variant, disabled by the
 * enclosing #if 0.  Issue a `stda' of `value' to address `loc' in
 * alternate address space `asi'.
 *
 * When PHYS_ASI(asi) is true the store is followed by a write of zero to
 * ASI_DCACHE_TAG at (loc & ~0x1f), fenced with membar #Sync.
 * Both arms pass `value' as long long; the PHYS_ASI arm previously cast
 * it to int, dropping the upper 32 bits.
 * NOTE(review): the PHYS_ASI arm lists `loc' as an asm output, so the
 * caller's `loc' must be an lvalue and is overwritten with the aligned
 * address.
 */
#define stda(loc, asi, value) ({ \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; stda %1,[%2]%%asi;" \
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
"r" ((long long)(value)), "r" ((unsigned long)(loc)), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; stda %0,[%1]%%asi" : : \
"r" ((long long)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
} \
})
#else
/*
 * stda(loc, asi, value) -- 32-bit compiler variant, disabled by the
 * enclosing #if 0.  Issue a `stda' of the 64-bit `value' to address `loc'
 * in alternate address space `asi'.
 *
 * The 64-bit address is rebuilt in the asm as (_loc_hi << 32) | loc.
 * When PHYS_ASI(asi) is true the store runs with %pstate XOR 8
 * ("wrpr %1,8"), restored by "wrpr %1,0", and is followed by a write of
 * zero to ASI_DCACHE_TAG at the 32-byte-aligned address.
 */
#define stda(loc, asi, value) ({ \
register int _loc_hi, _pstate; \
_loc_hi = (((u_int64_t)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %5,%%g0,%%asi; sllx %4,32,%0; rdpr %%pstate,%1; " \
" or %3,%0,%0; wrpr %1,8,%%pstate; stda %2,[%0]%%asi; wrpr %1,0,%%pstate;" \
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %6; membar #Sync" : \
"=&r" (_loc_hi), "=&r" (_pstate) : \
"r" ((long long)(value)), "r" ((unsigned long)(loc)), \
"r" (_loc_hi), "r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %4,%%g0,%%asi; sllx %3,32,%0; " \
" or %2,%0,%0; stda %1,[%0]%%asi" : "=&r" (_loc_hi) : \
"r" ((long long)(value)), "r" ((unsigned long)(loc)), \
"r" (_loc_hi), "r" (asi)); \
} \
})
#endif
#ifdef __arch64__
/*
 * stxa(loc, asi, value) -- 64-bit compiler variant, disabled by the
 * enclosing #if 0.  Native 64-bit store of `value' to address `loc' in
 * alternate address space `asi'.
 *
 * When PHYS_ASI(asi) is true the store is followed by a write of zero to
 * ASI_DCACHE_TAG at (loc & ~0x1f), fenced with membar #Sync.
 * Both arms pass `value' as unsigned long so all 64 bits are stored, and
 * the else arm is closed before the statement expression ends.
 * NOTE(review): the PHYS_ASI arm lists `loc' as an asm output, so the
 * caller's `loc' must be an lvalue and is overwritten with the aligned
 * address.
 */
#define stxa(loc, asi, value) ({ \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %3,%%g0,%%asi; stxa %1,[%2]%%asi;" \
" andn %2,0x1f,%0; membar #Sync; stxa %%g0,[%0] %4; membar #Sync" : "=&r" (loc) : \
"r" ((unsigned long)(value)), "r" ((unsigned long)(loc)), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %2,%%g0,%%asi; stxa %0,[%1]%%asi" : : \
"r" ((unsigned long)(value)), "r" ((unsigned long)(loc)), "r" (asi)); \
} \
})
#else
/*
 * stxa(loc, asi, value) -- 32-bit compiler variant, disabled by the
 * enclosing #if 0.  Native 64-bit store of `value' to address `loc' in
 * alternate address space `asi'.
 *
 * Value and address are split into 32-bit halves in C and glued back
 * together (hi << 32 | lo) inside the asm before the single `stxa'.
 * When PHYS_ASI(asi) is true the store runs with %pstate XOR 8
 * ("wrpr %2,8"), restored by "wrpr %2,0", and is followed by a write of
 * zero to ASI_DCACHE_TAG at the 32-byte-aligned address.
 * NOTE(review): `value' and `loc' are expanded unparenthesized in the
 * assignments, and the PHYS_ASI arm uses the cast expression
 * (int)(_stxa_lo) as an asm output, which needs cast-as-lvalue support.
 */
#define stxa(loc, asi, value) ({ \
int _stxa_lo, _stxa_hi, _loc_hi; \
_stxa_lo = value; _stxa_hi = ((u_int64_t)value)>>32; \
_loc_hi = (((u_int64_t)(u_long)loc)>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %7,%%g0,%%asi; sllx %4,32,%1; sllx %6,32,%0; " \
" or %1,%3,%1; rdpr %%pstate,%2; or %0,%5,%0; wrpr %2,8,%%pstate; " \
" stxa %1,[%0]%%asi; wrpr %2,0,%%pstate; " \
" andn %0,0x1f,%1; membar #Sync; stxa %%g0,[%1] %8; membar #Sync": \
"=&r" (_loc_hi), "=&r" (_stxa_hi), "=&r" ((int)(_stxa_lo)): \
"r" ((int)(_stxa_lo)), "r" ((int)(_stxa_hi)), \
"r" ((unsigned long)(loc)), "r" (_loc_hi), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %6,%%g0,%%asi; sllx %3,32,%1; sllx %5,32,%0; " \
" or %1,%2,%1; or %0,%4,%0; stxa %1,[%0]%%asi" : \
"=&r" (_loc_hi), "=&r" (_stxa_hi) : \
"r" ((int)(_stxa_lo)), "r" ((int)(_stxa_hi)), \
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
} \
})
#endif
#ifdef __arch64__
/*
 * casxa(loc, asi, value, ovalue) -- 64-bit compiler variant, disabled by
 * the enclosing #if 0.  64-bit compare-and-swap at address `loc' in
 * alternate address space `asi': `ovalue' is the comparison operand and
 * `value' the swap operand of the `casxa' instruction.  The contents of
 * the swap register after the instruction are the value of the statement
 * expression (same operand layout as the inline casxa() function).
 *
 * The swap value lives in a local in/out ("+r") operand so that it is
 * actually loaded into the instruction's rd register.
 * When PHYS_ASI(asi) is true the operation is followed by a write of zero
 * to ASI_DCACHE_TAG at (loc & ~0x1f), fenced with membar #Sync.
 * NOTE(review): the PHYS_ASI arm lists `loc' as an asm output, so the
 * caller's `loc' must be an lvalue and is overwritten with the aligned
 * address.
 */
#define casxa(loc, asi, value, ovalue) ({ \
register unsigned long _casxa_v = (unsigned long)(value); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %4,%%g0,%%asi; casxa [%3]%%asi,%2,%1;" \
" andn %3,0x1f,%0; membar #Sync; stxa %%g0,[%0] %5; membar #Sync" : \
"=&r" (loc), "+r" (_casxa_v) : \
"r" ((unsigned long)(ovalue)), \
"r" ((unsigned long)(loc)), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %3,%%g0,%%asi; casxa [%1]%%asi,%2,%0" : \
"+r" (_casxa_v) : \
"r" ((unsigned long)(loc)), "r" ((unsigned long)(ovalue)), \
"r" (asi)); \
} \
_casxa_v; \
})
#else
/*
 * casxa(loc, asi, value, ovalue) -- 32-bit compiler variant, disabled by
 * the enclosing #if 0.  64-bit compare-and-swap at address `loc' in
 * alternate address space `asi': `ovalue' is the comparison operand and
 * `value' the swap operand of the `casxa' instruction.
 *
 * Address, swap value and comparison value are split into 32-bit halves
 * in C and glued back together (hi << 32 | lo) inside the asm; the 64-bit
 * contents of the swap register afterwards are split again and recombined
 * in C as the value of the statement expression.
 *
 * Operand map, PHYS_ASI arm:
 *   %0 address (out)        %1 swap hi -> swap/result (in/out)
 *   %2 swap lo, then saved %pstate, then result lo (in/out)
 *   %3 compare hi -> compare value, then scratch (in/out)
 *   %4 loc  %5 _loc_hi  %6 compare lo  %7 asi  %8 ASI_DCACHE_TAG
 * Operand map, other arm:
 *   %0 address (out)        %1 swap hi -> swap/result (in/out)
 *   %2 swap lo, then compare value, then result lo (in/out)
 *   %3 compare hi  %4 compare lo  %5 loc  %6 _loc_hi  %7 asi
 *
 * NOTE(review): the halves are OR-ed together assuming the upper 32 bits
 * of the registers holding the low words are zero -- confirm for the ABI
 * in use.  The PHYS_ASI arm has many asm operands; older GCC releases
 * limit the operand count -- confirm before enabling.
 */
#define casxa(loc, asi, value, ovalue) ({ \
int _casxa_lo, _casxa_hi, _oval_lo, _oval_hi, _loc_hi; \
_casxa_lo = (value); _casxa_hi = ((u_int64_t)(value))>>32; \
_oval_lo = (ovalue); _oval_hi = ((u_int64_t)(ovalue))>>32; \
_loc_hi = (((u_int64_t)(u_long)(loc))>>32); \
if (PHYS_ASI(asi)) { \
__asm __volatile("wr %7,%%g0,%%asi; sllx %1,32,%1; sllx %5,32,%0; " \
" sllx %3,32,%3; or %1,%2,%1; rdpr %%pstate,%2; or %0,%4,%0; or %3,%6,%3; " \
" wrpr %2,8,%%pstate; casxa [%0]%%asi,%3,%1; wrpr %2,0,%%pstate; " \
" andn %0,0x1f,%3; membar #Sync; stxa %%g0,[%3] %8; membar #Sync; " \
" sll %1,0,%2; srax %1,32,%1 " : \
"=&r" (_loc_hi), "+&r" (_casxa_hi), \
"+&r" (_casxa_lo), "+&r" (_oval_hi) : \
"r" ((unsigned long)(loc)), "r" (_loc_hi), \
"r" ((unsigned int)(_oval_lo)), \
"r" (asi), "n" (ASI_DCACHE_TAG)); \
} else { \
__asm __volatile("wr %7,%%g0,%%asi; sllx %1,32,%1; sllx %6,32,%0; " \
" or %1,%2,%1; sllx %3,32,%2; or %0,%5,%0; or %2,%4,%2; " \
" casxa [%0]%%asi,%2,%1; sll %1,0,%2; srax %1,32,%1 " : \
"=&r" (_loc_hi), "+&r" (_casxa_hi), "+&r" (_casxa_lo) : \
"r" ((int)(_oval_hi)), "r" ((int)(_oval_lo)), \
"r" ((unsigned long)(loc)), "r" (_loc_hi), "r" (asi)); \
} \
((((u_int64_t)(u_int)_casxa_hi)<<32)|(u_int)_casxa_lo); \
})
#endif
#endif
/*
 * flush(loc): issue the SPARC `flush' instruction on address `loc'.
 * NOTE(review): the original comment described this as flushing the
 * address from the data cache; SPARC V9 defines FLUSH as an
 * instruction-memory flush -- confirm what callers expect.
 */
#define flush(loc) ({ \
__asm __volatile("flush %0" : : \
"r" ((unsigned long)(loc))); \
})
/*
 * flushline(loc): flush a D$ line.
 *
 * The real implementation (write zero to ASI_DCACHE_TAG at the
 * 32-byte-aligned address, then membar_sync()) is compiled out; the
 * active definition expands to nothing, so flushline() is a no-op.
 */
#if 0
#define flushline(loc) ({ \
stxa(((paddr_t)loc)&(~0x1f), (ASI_DCACHE_TAG), 0); \
membar_sync(); \
})
#else
#define flushline(loc)
#endif
/* The following two enable or disable the dcache in the LSU control register */
/*
 * dcenable(): read the 64-bit register at address 0 of ASI_MCCR, OR in
 * MCCR_DCACHE_EN, write it back, then membar #Sync.
 *
 * `res' is only a scratch register for the read-modify-write; it is
 * written by the asm, so it has to be an output operand ("=r").
 */
#define dcenable() ({ \
int res; \
__asm __volatile("ldxa [%%g0] %1,%0; or %0,%2,%0; stxa %0,[%%g0] %1; membar #Sync" \
: "=r" (res) : "n" (ASI_MCCR), "n" (MCCR_DCACHE_EN)); \
})
/*
 * dcdisable(): read the 64-bit register at address 0 of ASI_MCCR, clear
 * MCCR_DCACHE_EN (andn), write it back, then membar #Sync.
 *
 * `res' is only a scratch register for the read-modify-write; it is
 * written by the asm, so it has to be an output operand ("=r").
 */
#define dcdisable() ({ \
int res; \
__asm __volatile("ldxa [%%g0] %1,%0; andn %0,%2,%0; stxa %0,[%%g0] %1; membar #Sync" \
: "=r" (res) : "n" (ASI_MCCR), "n" (MCCR_DCACHE_EN)); \
})
/*
 * SPARC V9 memory barrier instructions.
 *
 * Each macro expands to a single volatile asm emitting one `membar' with
 * the named ordering mask.
 * NOTE(review): none of the asm statements carries a "memory" clobber, so
 * they may not act as compiler-level barriers -- confirm callers do not
 * depend on that.
 */
/* Order earlier stores before later stores (#StoreStore) */
#define membar_storestore() __asm __volatile("membar #StoreStore" : :)
/* Order earlier loads before later stores (#LoadStore) */
#define membar_loadstore() __asm __volatile("membar #LoadStore" : :)
/* Order earlier stores before later loads (#StoreLoad) */
#define membar_storeload() __asm __volatile("membar #StoreLoad" : :)
/* Order earlier loads before later loads (#LoadLoad) */
#define membar_loadload() __asm __volatile("membar #LoadLoad" : :)
/* Complete all outstanding memory operations and exceptions (#Sync) */
#define membar_sync() __asm __volatile("membar #Sync" : :)
/* Complete all outstanding memory operations (#MemIssue) */
#define membar_memissue() __asm __volatile("membar #MemIssue" : :)
/* Complete all outstanding stores before any new loads (#Lookaside) */
#define membar_lookaside() __asm __volatile("membar #Lookaside" : :)
#ifdef __arch64__
/*
 * tick() -- 64-bit compiler variant: read the privileged %tick register
 * with `rdpr' into a u_long, which is the value of the statement
 * expression.
 */
#define tick() ({ \
register u_long _tick_tmp; \
__asm __volatile("rdpr %%tick, %0" : "=r" (_tick_tmp) :); \
_tick_tmp; \
})
#else
/*
 * tick() -- 32-bit compiler variant: read the privileged 64-bit %tick
 * register and yield it as a u_int64_t.
 *
 * The register is read into %0, its low word is copied zero-extended into
 * %1 (srl by 0), and %0 is then shifted down to hold the high word.  Both
 * halves are unsigned so that recombining them in C cannot sign-extend
 * the low word into the high one.
 */
#define tick() ({ \
register u_int _tick_hi = 0, _tick_lo = 0; \
__asm __volatile("rdpr %%tick, %0; srl %0,0,%1; srlx %0,32,%0 " \
: "=&r" (_tick_hi), "=&r" (_tick_lo) : ); \
(((u_int64_t)_tick_hi)<<32)|((u_int64_t)_tick_lo); \
})
#endif
/* Defined elsewhere; takes a single long.  NOTE(review): semantics are not visible from this header. */
extern void next_tick __P((long));
#endif