2 * Copyright (c) 2001 Jake Burkholder.
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 #ifndef _MACHINE_CPUFUNC_H_
30 #define _MACHINE_CPUFUNC_H_
32 #include <machine/asi.h>
33 #include <machine/pstate.h>
38 * membar operand macros for use in other macros when # is a special
39 * character. Keep these in sync with what the hardware expects.
41 #define C_Lookaside (0)
42 #define C_MemIssue (1)
44 #define M_LoadLoad (0)
45 #define M_StoreLoad (1)
46 #define M_LoadStore (2)
47 #define M_StoreStore (3)
49 #define CMASK_SHIFT (4)
50 #define MMASK_SHIFT (0)
52 #define CMASK_GEN(bit) ((1 << (bit)) << CMASK_SHIFT)
53 #define MMASK_GEN(bit) ((1 << (bit)) << MMASK_SHIFT)
55 #define Lookaside CMASK_GEN(C_Lookaside)
56 #define MemIssue CMASK_GEN(C_MemIssue)
57 #define Sync CMASK_GEN(C_Sync)
58 #define LoadLoad MMASK_GEN(M_LoadLoad)
59 #define StoreLoad MMASK_GEN(M_StoreLoad)
60 #define LoadStore MMASK_GEN(M_LoadStore)
61 #define StoreStore MMASK_GEN(M_StoreStore)
63 #define casa(rs1, rs2, rd, asi) ({ \
64 u_int __rd = (uint32_t)(rd); \
65 __asm __volatile("casa [%2] %3, %4, %0" \
66 : "+r" (__rd), "=m" (*rs1) \
67 : "r" (rs1), "n" (asi), "r" (rs2), "m" (*rs1)); \
71 #define casxa(rs1, rs2, rd, asi) ({ \
72 u_long __rd = (uint64_t)(rd); \
73 __asm __volatile("casxa [%2] %3, %4, %0" \
74 : "+r" (__rd), "=m" (*rs1) \
75 : "r" (rs1), "n" (asi), "r" (rs2), "m" (*rs1)); \
79 #define flush(va) do { \
80 __asm __volatile("flush %0" : : "r" (va)); \
83 #define flushw() do { \
84 __asm __volatile("flushw" : :); \
87 #define mov(val, reg) do { \
88 __asm __volatile("mov %0, %" __XSTRING(reg) : : "r" (val)); \
91 /* Generate ld*a/st*a functions for non-constant ASI's. */
92 #define LDNC_GEN(tp, o) \
94 o ## _nc(caddr_t va, int asi) \
97 __asm __volatile("wr %2, 0, %%asi;" #o " [%1] %%asi, %0"\
98 : "=r" (r) : "r" (va), "r" (asi)); \
102 LDNC_GEN(u_char, lduba);
103 LDNC_GEN(u_short, lduha);
104 LDNC_GEN(u_int, lduwa);
105 LDNC_GEN(u_long, ldxa);
107 #define LD_GENERIC(va, asi, op, type) ({ \
109 __asm __volatile(#op " [%1] %2, %0" \
110 : "=r" (__r) : "r" (va), "n" (asi)); \
114 #define lduba(va, asi) LD_GENERIC(va, asi, lduba, u_char)
115 #define lduha(va, asi) LD_GENERIC(va, asi, lduha, u_short)
116 #define lduwa(va, asi) LD_GENERIC(va, asi, lduwa, u_int)
117 #define ldxa(va, asi) LD_GENERIC(va, asi, ldxa, u_long)
120 #define STNC_GEN(tp, o) \
121 static __inline void \
122 o ## _nc(caddr_t va, int asi, tp val) \
124 __asm __volatile(#o " %0, [%g0 + %1] %2"\
125 : : "r" (val), "r" (va), "r" (asi)); \
128 #define STNC_GEN(tp, o) \
129 static __inline void \
130 o ## _nc(caddr_t va, int asi, tp val) \
132 __asm __volatile("wr %2, 0, %%asi;" #o " %0, [%1] %%asi"\
133 : : "r" (val), "r" (va), "r" (asi)); \
137 STNC_GEN(u_char, stba);
138 STNC_GEN(u_short, stha);
139 STNC_GEN(u_int, stwa);
140 STNC_GEN(u_long, stxa);
142 #define ST_GENERIC(va, asi, val, op) \
143 __asm __volatile(#op " %0, [%1] %2" \
144 : : "r" (val), "r" (va), "n" (asi)); \
146 #define stba(va, asi, val) ST_GENERIC(va, asi, val, stba)
147 #define stha(va, asi, val) ST_GENERIC(va, asi, val, stha)
148 #define stwa(va, asi, val) ST_GENERIC(va, asi, val, stwa)
149 #define stxa(va, asi, val) ST_GENERIC(va, asi, val, stxa)
152 * Attempt to read from addr, val. If a Data Access Error trap happens,
153 * they return -1 and the contents of val is undefined. A return of 0
154 * means no trap happened, and the contents of val is valid.
156 int fasword8(u_long asi, void *addr, uint8_t *val);
157 int fasword16(u_long asi, void *addr, uint16_t *val);
158 int fasword32(u_long asi, void *addr, uint32_t *val);
160 #define membar(mask) do { \
161 __asm __volatile("membar %0" : : "n" (mask) : "memory"); \
164 #define rd(name) ({ \
166 __asm __volatile("rd %%" #name ", %0" : "=r" (__sr) :); \
170 #define wr(name, val, xor) do { \
171 __asm __volatile("wr %0, %1, %%" #name \
172 : : "r" (val), "rI" (xor)); \
175 #define rdpr(name) ({ \
177 __asm __volatile("rdpr %%" #name", %0" : "=r" (__pr) :); \
181 #define wrpr(name, val, xor) do { \
182 __asm __volatile("wrpr %0, %1, %%" #name \
183 : : "r" (val), "rI" (xor)); \
187 * Macro intended to be used instead of wr(asr23, val, xor) for writing to
188 * the TICK_CMPR register in order to avoid a bug in BlackBird CPUs that
189 * can cause these writes to fail under certain condidtions which in turn
190 * causes the hardclock to stop. The workaround is to perform the write
191 * at the beginning of an I-Cache line directly followed by a dummy read.
193 #define wrtickcmpr(val, xor) ({ \
195 " ba,pt %%xcc, 1f ; " \
198 "1: wr %0, %1, %%asr23 ; " \
199 " rd %%asr23, %%g0 ; " \
200 : : "r" (val), "rI" (xor)); \
206 __asm __volatile("ta %%xcc, 1" : :);
209 static __inline register_t
210 intr_disable_all(void)
215 wrpr(pstate, s & ~PSTATE_IE, 0);
218 #define intr_restore_all(s) wrpr(pstate, (s), 0)
220 static __inline register_t
229 #define intr_restore(s) wrpr(pil, (s), 0)
233 * In some places, it is required that the store is directly followed by a
234 * membar #Sync. Don't trust the compiler to not insert instructions in
235 * between. We also need to disable interrupts completely.
237 #define stxa_sync(va, asi, val) do { \
239 s = intr_disable_all(); \
240 __asm __volatile("stxa %0, [%1] %2; membar #Sync" \
241 : : "r" (val), "r" (va), "n" (asi)); \
242 intr_restore_all(s); \
245 void ascopy(u_long asi, vm_offset_t src, vm_offset_t dst, size_t len);
246 void ascopyfrom(u_long sasi, vm_offset_t src, caddr_t dst, size_t len);
247 void ascopyto(caddr_t src, u_long dasi, vm_offset_t dst, size_t len);
248 void aszero(u_long asi, vm_offset_t dst, size_t len);
250 #include <machine/sun4v_cpufunc.h>
252 #define USE_CPU_NANOSECONDS
253 #define nanoseconds() rd(tick)
258 #endif /* !_MACHINE_CPUFUNC_H_ */