/*-
 * Copyright (c) 1998 Doug Rabson
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * $FreeBSD$
 */
#ifndef _MACHINE_ATOMIC_H_
#define	_MACHINE_ATOMIC_H_

#ifndef _SYS_CDEFS_H_
#error this file needs sys/cdefs.h as a prerequisite
#endif

#define	mb()	__asm __volatile("lock; addl $0,(%%esp)" : : : "memory", "cc")
#define	wmb()	__asm __volatile("lock; addl $0,(%%esp)" : : : "memory", "cc")
#define	rmb()	__asm __volatile("lock; addl $0,(%%esp)" : : : "memory", "cc")

/*
 * Various simple operations on memory, each of which is atomic in the
 * presence of interrupts and multiple processors.
 *
 * atomic_set_char(P, V)	(*(u_char *)(P) |= (V))
 * atomic_clear_char(P, V)	(*(u_char *)(P) &= ~(V))
 * atomic_add_char(P, V)	(*(u_char *)(P) += (V))
 * atomic_subtract_char(P, V)	(*(u_char *)(P) -= (V))
 *
 * atomic_set_short(P, V)	(*(u_short *)(P) |= (V))
 * atomic_clear_short(P, V)	(*(u_short *)(P) &= ~(V))
 * atomic_add_short(P, V)	(*(u_short *)(P) += (V))
 * atomic_subtract_short(P, V)	(*(u_short *)(P) -= (V))
 *
 * atomic_set_int(P, V)		(*(u_int *)(P) |= (V))
 * atomic_clear_int(P, V)	(*(u_int *)(P) &= ~(V))
 * atomic_add_int(P, V)		(*(u_int *)(P) += (V))
 * atomic_subtract_int(P, V)	(*(u_int *)(P) -= (V))
 * atomic_readandclear_int(P)	(return (*(u_int *)(P)); *(u_int *)(P) = 0;)
 *
 * atomic_set_long(P, V)	(*(u_long *)(P) |= (V))
 * atomic_clear_long(P, V)	(*(u_long *)(P) &= ~(V))
 * atomic_add_long(P, V)	(*(u_long *)(P) += (V))
 * atomic_subtract_long(P, V)	(*(u_long *)(P) -= (V))
 * atomic_readandclear_long(P)	(return (*(u_long *)(P)); *(u_long *)(P) = 0;)
 */
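/*
 * Illustrative usage sketch (documentation only, not part of the original
 * header; the variable name and flag value below are hypothetical):
 *
 *	static volatile u_int intr_pending;
 *
 *	atomic_set_int(&intr_pending, 0x01);	// intr_pending |= 0x01
 *	atomic_clear_int(&intr_pending, 0x01);	// intr_pending &= ~0x01
 *	u_int taken = atomic_readandclear_int(&intr_pending); // old value; leaves 0
 *
 * Unlike the plain C expressions above, each call is one indivisible
 * read-modify-write, so concurrent updates from another CPU or from an
 * interrupt handler cannot be lost.
 */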
/*
 * The above functions are expanded inline in the statically-linked
 * kernel.  Lock prefixes are generated if an SMP kernel is being
 * built.
 *
 * Kernel modules call real functions which are built into the kernel.
 * This allows kernel modules to be portable between UP and SMP systems.
 */
#if defined(KLD_MODULE) || !defined(__GNUCLIKE_ASM)
#define	ATOMIC_ASM(NAME, TYPE, OP, CONS, V)			\
void atomic_##NAME##_##TYPE(volatile u_##TYPE *p, u_##TYPE v);	\
void atomic_##NAME##_barr_##TYPE(volatile u_##TYPE *p, u_##TYPE v)

int	atomic_cmpset_int(volatile u_int *dst, u_int expect, u_int src);
u_int	atomic_fetchadd_int(volatile u_int *p, u_int v);

#define	ATOMIC_LOAD(TYPE, LOP)					\
u_##TYPE	atomic_load_acq_##TYPE(volatile u_##TYPE *p)
#define	ATOMIC_STORE(TYPE)					\
void	atomic_store_rel_##TYPE(volatile u_##TYPE *p, u_##TYPE v)

#else /* !KLD_MODULE && __GNUCLIKE_ASM */

/*
 * For userland, always use lock prefixes so that the binaries will run
 * on both SMP and !SMP systems.
 */
#if defined(SMP) || !defined(_KERNEL)
#define	MPLOCKED	"lock ; "
#else
#define	MPLOCKED
#endif

/*
 * The assembly is volatilized to avoid code chunk removal by the compiler.
 * GCC aggressively reorders operations and memory clobbering is necessary
 * in order to avoid that for memory barriers.
 */
#define	ATOMIC_ASM(NAME, TYPE, OP, CONS, V)		\
static __inline void					\
atomic_##NAME##_##TYPE(volatile u_##TYPE *p, u_##TYPE v)\
{							\
	__asm __volatile(MPLOCKED OP			\
	: "+m" (*p)					\
	: CONS (V)					\
	: "cc");					\
}							\
							\
static __inline void					\
atomic_##NAME##_barr_##TYPE(volatile u_##TYPE *p, u_##TYPE v)\
{							\
	__asm __volatile(MPLOCKED OP			\
	: "+m" (*p)					\
	: CONS (V)					\
	: "memory", "cc");				\
}							\
struct __hack
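/*
 * For reference, a sketch of what one instantiation expands to (this is
 * explanatory text only, not code generated here).  ATOMIC_ASM(add, int,
 * "addl %1,%0", "ir", v), instantiated further below, yields roughly:
 *
 *	static __inline void
 *	atomic_add_int(volatile u_int *p, u_int v)
 *	{
 *		__asm __volatile("lock ; addl %1,%0"
 *		: "+m" (*p)
 *		: "ir" (v)
 *		: "cc");
 *	}
 *
 * with the "lock ; " prefix present only when MPLOCKED expands to it,
 * plus an atomic_add_barr_int() variant whose asm also clobbers "memory"
 * so the compiler will not move other memory accesses across it.
 */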
#if defined(_KERNEL) && !defined(WANT_FUNCTIONS)

/* I486 does not support SMP or CMPXCHG8B. */
static __inline uint64_t
atomic_load_acq_64_i386(volatile uint64_t *p)
{
	volatile uint32_t *high, *low;
	uint64_t res;

	low = (volatile uint32_t *)p;
	high = (volatile uint32_t *)p + 1;
	__asm __volatile(
	"	pushfl ;		"
	"	cli ;			"
	"	movl %1,%%eax ;		"
	"	movl %2,%%edx ;		"
	"	popfl"
	: "=&A" (res)			/* 0 */
	: "m" (*low),			/* 1 */
	  "m" (*high)			/* 2 */
	: "memory");

	return (res);
}

static __inline void
atomic_store_rel_64_i386(volatile uint64_t *p, uint64_t v)
{
	volatile uint32_t *high, *low;

	low = (volatile uint32_t *)p;
	high = (volatile uint32_t *)p + 1;
	__asm __volatile(
	"	pushfl ;		"
	"	cli ;			"
	"	movl %%eax,%0 ;		"
	"	movl %%edx,%1 ;		"
	"	popfl"
	: "=m" (*low),			/* 0 */
	  "=m" (*high)			/* 1 */
	: "A" (v)			/* 2 */
	: "memory");
}

static __inline uint64_t
atomic_load_acq_64_i586(volatile uint64_t *p)
{
	uint64_t res;

	__asm __volatile(
	"	movl %%ebx,%%eax ;	"
	"	movl %%ecx,%%edx ;	"
	"	" MPLOCKED "		"
	"	cmpxchg8b %1"
	: "=&A" (res),			/* 0 */
	  "+m" (*p)			/* 1 */
	: : "memory", "cc");

	return (res);
}

static __inline void
atomic_store_rel_64_i586(volatile uint64_t *p, uint64_t v)
{

	__asm __volatile(
	"	movl %%eax,%%ebx ;	"
	"	movl %%edx,%%ecx ;	"
	"1:				"
	"	" MPLOCKED "		"
	"	cmpxchg8b %0 ;		"
	"	jne 1b"
	: "+m" (*p),			/* 0 */
	  "+A" (v)			/* 1 */
	: : "ebx", "ecx", "memory", "cc");
}

#endif /* _KERNEL && !WANT_FUNCTIONS */
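/*
 * Usage sketch for the 64-bit helpers above (illustrative only; "counter"
 * is a hypothetical variable).  The _i386 variants are safe only because
 * the 80486 cannot be part of an SMP system, so disabling interrupts is
 * enough; the _i586 variants use CMPXCHG8B and work on MP systems.
 * Callers are expected to go through the atomic_load_acq_64 and
 * atomic_store_rel_64 function pointers declared later in this file,
 * which the kernel presumably points at whichever variant matches the CPU:
 *
 *	static volatile uint64_t counter;
 *
 *	atomic_store_rel_64(&counter, 0);
 *	uint64_t snap = atomic_load_acq_64(&counter);
 */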
/*
 * Atomic compare and set, used by the mutex functions
 *
 * if (*dst == expect) *dst = src (all 32 bit words)
 *
 * Returns 0 on failure, non-zero on success
 */

#ifdef CPU_DISABLE_CMPXCHG

static __inline int
atomic_cmpset_int(volatile u_int *dst, u_int expect, u_int src)
{
	u_char res;

	__asm __volatile(
	"	pushfl ;		"
	"	cli ;			"
	"	cmpl	%3,%1 ;		"
	"	jne	1f ;		"
	"	movl	%2,%1 ;		"
	"1:				"
	"	sete	%0 ;		"
	"	popfl ;			"
	"# atomic_cmpset_int"
	: "=q" (res),			/* 0 */
	  "+m" (*dst)			/* 1 */
	: "r" (src),			/* 2 */
	  "r" (expect)			/* 3 */
	: "memory");

	return (res);
}

#else /* !CPU_DISABLE_CMPXCHG */

static __inline int
atomic_cmpset_int(volatile u_int *dst, u_int expect, u_int src)
{
	u_char res;

	__asm __volatile(
	"	" MPLOCKED "		"
	"	cmpxchgl %2,%1 ;	"
	"	sete	%0 ;		"
	"# atomic_cmpset_int"
	: "=a" (res),			/* 0 */
	  "+m" (*dst)			/* 1 */
	: "r" (src),			/* 2 */
	  "a" (expect)			/* 3 */
	: "memory", "cc");

	return (res);
}

#endif /* CPU_DISABLE_CMPXCHG */

/*
 * Atomically add the value of v to the integer pointed to by p and return
 * the previous value of *p.
 */
static __inline u_int
atomic_fetchadd_int(volatile u_int *p, u_int v)
{

	__asm __volatile(
	"	" MPLOCKED "		"
	"	xaddl	%0,%1 ;		"
	"# atomic_fetchadd_int"
	: "+r" (v),			/* 0 */
	  "+m" (*p)			/* 1 */
	: : "cc");
	return (v);
}
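/*
 * Two illustrative sketches for the primitives above (the names used are
 * hypothetical, not part of this header).
 *
 * A typical compare-and-set retry loop: re-read the old value and retry
 * whenever another CPU changed *p in the meantime.
 *
 *	static __inline void
 *	example_update_max(volatile u_int *p, u_int v)
 *	{
 *		u_int old;
 *
 *		do {
 *			old = *p;
 *			if (v <= old)
 *				return;
 *		} while (atomic_cmpset_int(p, old, v) == 0);
 *	}
 *
 * Because atomic_fetchadd_int() returns the value *p held before the
 * addition, it can hand out unique slots or ticket numbers without a lock:
 *
 *	static volatile u_int next_slot;
 *
 *	u_int myslot = atomic_fetchadd_int(&next_slot, 1);
 */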
/*
 * We assume that a = b will do atomic loads and stores.  Due to the
 * IA32 memory model, a simple store guarantees release semantics.
 *
 * However, loads may pass stores, so for atomic_load_acq we have to
 * ensure a Store/Load barrier to do the load in SMP kernels.  We use
 * "lock cmpxchg" as recommended by the AMD Software Optimization
 * Guide, and not mfence.  For UP kernels, however, the cache of the
 * single processor is always consistent, so we only need to take care
 * of the compiler.
 */
#define	ATOMIC_STORE(TYPE)				\
static __inline void					\
atomic_store_rel_##TYPE(volatile u_##TYPE *p, u_##TYPE v)\
{							\
	__compiler_membar();				\
	*p = v;						\
}							\
struct __hack

#if defined(_KERNEL) && !defined(SMP)

#define	ATOMIC_LOAD(TYPE, LOP)				\
static __inline u_##TYPE				\
atomic_load_acq_##TYPE(volatile u_##TYPE *p)		\
{							\
	u_##TYPE tmp;					\
							\
	tmp = *p;					\
	__compiler_membar();				\
	return (tmp);					\
}							\
struct __hack

#else /* !(_KERNEL && !SMP) */

#define	ATOMIC_LOAD(TYPE, LOP)				\
static __inline u_##TYPE				\
atomic_load_acq_##TYPE(volatile u_##TYPE *p)		\
{							\
	u_##TYPE res;					\
							\
	__asm __volatile(MPLOCKED LOP			\
	: "=a" (res),			/* 0 */		\
	  "+m" (*p)			/* 1 */		\
	: : "memory", "cc");				\
							\
	return (res);					\
}							\
struct __hack

#endif /* _KERNEL && !SMP */

#endif /* KLD_MODULE || !__GNUCLIKE_ASM */
ATOMIC_ASM(set,	     char,  "orb %b1,%0",  "iq",  v);
ATOMIC_ASM(clear,    char,  "andb %b1,%0", "iq", ~v);
ATOMIC_ASM(add,	     char,  "addb %b1,%0", "iq",  v);
ATOMIC_ASM(subtract, char,  "subb %b1,%0", "iq",  v);

ATOMIC_ASM(set,	     short, "orw %w1,%0",  "ir",  v);
ATOMIC_ASM(clear,    short, "andw %w1,%0", "ir", ~v);
ATOMIC_ASM(add,	     short, "addw %w1,%0", "ir",  v);
ATOMIC_ASM(subtract, short, "subw %w1,%0", "ir",  v);

ATOMIC_ASM(set,	     int,   "orl %1,%0",   "ir",  v);
ATOMIC_ASM(clear,    int,   "andl %1,%0",  "ir", ~v);
ATOMIC_ASM(add,	     int,   "addl %1,%0",  "ir",  v);
ATOMIC_ASM(subtract, int,   "subl %1,%0",  "ir",  v);

ATOMIC_ASM(set,	     long,  "orl %1,%0",   "ir",  v);
ATOMIC_ASM(clear,    long,  "andl %1,%0",  "ir", ~v);
ATOMIC_ASM(add,	     long,  "addl %1,%0",  "ir",  v);
ATOMIC_ASM(subtract, long,  "subl %1,%0",  "ir",  v);

ATOMIC_LOAD(char,  "cmpxchgb %b0,%1");
ATOMIC_LOAD(short, "cmpxchgw %w0,%1");
ATOMIC_LOAD(int,   "cmpxchgl %0,%1");
ATOMIC_LOAD(long,  "cmpxchgl %0,%1");

ATOMIC_STORE(char);
ATOMIC_STORE(short);
ATOMIC_STORE(int);
ATOMIC_STORE(long);

#undef ATOMIC_ASM
#undef ATOMIC_LOAD
#undef ATOMIC_STORE
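/*
 * The store_rel/load_acq operations generated above make flag handoff
 * patterns safe (illustrative sketch; "data" and "ready" are hypothetical):
 *
 *	// producer
 *	data = compute();
 *	atomic_store_rel_int(&ready, 1);
 *
 *	// consumer
 *	while (atomic_load_acq_int(&ready) == 0)
 *		continue;
 *	consume(data);		// sees the producer's write of "data"
 *
 * The release store orders the write of "data" before the write of "ready";
 * the acquire load orders the read of "ready" before the read of "data".
 */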
#ifndef WANT_FUNCTIONS

#ifdef _KERNEL
extern uint64_t (*atomic_load_acq_64)(volatile uint64_t *);
extern void (*atomic_store_rel_64)(volatile uint64_t *, uint64_t);
#endif

static __inline int
atomic_cmpset_long(volatile u_long *dst, u_long expect, u_long src)
{

	return (atomic_cmpset_int((volatile u_int *)dst, (u_int)expect,
	    (u_int)src));
}

static __inline u_long
atomic_fetchadd_long(volatile u_long *p, u_long v)
{

	return (atomic_fetchadd_int((volatile u_int *)p, (u_int)v));
}

/* Read the current value and store a zero in the destination. */
#ifdef __GNUCLIKE_ASM

static __inline u_int
atomic_readandclear_int(volatile u_int *p)
{
	u_int res;

	res = 0;
	__asm __volatile(
	"	xchgl	%1,%0 ;		"
	"# atomic_readandclear_int"
	: "+r" (res),			/* 0 */
	  "+m" (*p));			/* 1 */

	return (res);
}

static __inline u_long
atomic_readandclear_long(volatile u_long *p)
{
	u_long res;

	res = 0;
	__asm __volatile(
	"	xchgl	%1,%0 ;		"
	"# atomic_readandclear_long"
	: "+r" (res),			/* 0 */
	  "+m" (*p));			/* 1 */

	return (res);
}

#else /* !__GNUCLIKE_ASM */

u_int	atomic_readandclear_int(volatile u_int *p);
u_long	atomic_readandclear_long(volatile u_long *p);

#endif /* __GNUCLIKE_ASM */
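/*
 * Illustrative use of the readandclear operations (hypothetical names):
 * take ownership of every pending bit in one step and leave zero behind,
 * so bits posted concurrently by atomic_set_int() on another CPU are seen
 * either in this pass or in a later one, never lost:
 *
 *	u_int events = atomic_readandclear_int(&pending_events);
 *	if (events & EV_RX)
 *		handle_rx();
 */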
#define	atomic_set_acq_char		atomic_set_barr_char
#define	atomic_set_rel_char		atomic_set_barr_char
#define	atomic_clear_acq_char		atomic_clear_barr_char
#define	atomic_clear_rel_char		atomic_clear_barr_char
#define	atomic_add_acq_char		atomic_add_barr_char
#define	atomic_add_rel_char		atomic_add_barr_char
#define	atomic_subtract_acq_char	atomic_subtract_barr_char
#define	atomic_subtract_rel_char	atomic_subtract_barr_char

#define	atomic_set_acq_short		atomic_set_barr_short
#define	atomic_set_rel_short		atomic_set_barr_short
#define	atomic_clear_acq_short		atomic_clear_barr_short
#define	atomic_clear_rel_short		atomic_clear_barr_short
#define	atomic_add_acq_short		atomic_add_barr_short
#define	atomic_add_rel_short		atomic_add_barr_short
#define	atomic_subtract_acq_short	atomic_subtract_barr_short
#define	atomic_subtract_rel_short	atomic_subtract_barr_short

#define	atomic_set_acq_int		atomic_set_barr_int
#define	atomic_set_rel_int		atomic_set_barr_int
#define	atomic_clear_acq_int		atomic_clear_barr_int
#define	atomic_clear_rel_int		atomic_clear_barr_int
#define	atomic_add_acq_int		atomic_add_barr_int
#define	atomic_add_rel_int		atomic_add_barr_int
#define	atomic_subtract_acq_int		atomic_subtract_barr_int
#define	atomic_subtract_rel_int		atomic_subtract_barr_int
#define	atomic_cmpset_acq_int		atomic_cmpset_int
#define	atomic_cmpset_rel_int		atomic_cmpset_int

#define	atomic_set_acq_long		atomic_set_barr_long
#define	atomic_set_rel_long		atomic_set_barr_long
#define	atomic_clear_acq_long		atomic_clear_barr_long
#define	atomic_clear_rel_long		atomic_clear_barr_long
#define	atomic_add_acq_long		atomic_add_barr_long
#define	atomic_add_rel_long		atomic_add_barr_long
#define	atomic_subtract_acq_long	atomic_subtract_barr_long
#define	atomic_subtract_rel_long	atomic_subtract_barr_long
#define	atomic_cmpset_acq_long		atomic_cmpset_long
#define	atomic_cmpset_rel_long		atomic_cmpset_long

/* Operations on 8-bit bytes. */
#define	atomic_set_8		atomic_set_char
#define	atomic_set_acq_8	atomic_set_acq_char
#define	atomic_set_rel_8	atomic_set_rel_char
#define	atomic_clear_8		atomic_clear_char
#define	atomic_clear_acq_8	atomic_clear_acq_char
#define	atomic_clear_rel_8	atomic_clear_rel_char
#define	atomic_add_8		atomic_add_char
#define	atomic_add_acq_8	atomic_add_acq_char
#define	atomic_add_rel_8	atomic_add_rel_char
#define	atomic_subtract_8	atomic_subtract_char
#define	atomic_subtract_acq_8	atomic_subtract_acq_char
#define	atomic_subtract_rel_8	atomic_subtract_rel_char
#define	atomic_load_acq_8	atomic_load_acq_char
#define	atomic_store_rel_8	atomic_store_rel_char

/* Operations on 16-bit words. */
#define	atomic_set_16		atomic_set_short
#define	atomic_set_acq_16	atomic_set_acq_short
#define	atomic_set_rel_16	atomic_set_rel_short
#define	atomic_clear_16		atomic_clear_short
#define	atomic_clear_acq_16	atomic_clear_acq_short
#define	atomic_clear_rel_16	atomic_clear_rel_short
#define	atomic_add_16		atomic_add_short
#define	atomic_add_acq_16	atomic_add_acq_short
#define	atomic_add_rel_16	atomic_add_rel_short
#define	atomic_subtract_16	atomic_subtract_short
#define	atomic_subtract_acq_16	atomic_subtract_acq_short
#define	atomic_subtract_rel_16	atomic_subtract_rel_short
#define	atomic_load_acq_16	atomic_load_acq_short
#define	atomic_store_rel_16	atomic_store_rel_short

/* Operations on 32-bit double words. */
#define	atomic_set_32		atomic_set_int
#define	atomic_set_acq_32	atomic_set_acq_int
#define	atomic_set_rel_32	atomic_set_rel_int
#define	atomic_clear_32		atomic_clear_int
#define	atomic_clear_acq_32	atomic_clear_acq_int
#define	atomic_clear_rel_32	atomic_clear_rel_int
#define	atomic_add_32		atomic_add_int
#define	atomic_add_acq_32	atomic_add_acq_int
#define	atomic_add_rel_32	atomic_add_rel_int
#define	atomic_subtract_32	atomic_subtract_int
#define	atomic_subtract_acq_32	atomic_subtract_acq_int
#define	atomic_subtract_rel_32	atomic_subtract_rel_int
#define	atomic_load_acq_32	atomic_load_acq_int
#define	atomic_store_rel_32	atomic_store_rel_int
#define	atomic_cmpset_32	atomic_cmpset_int
#define	atomic_cmpset_acq_32	atomic_cmpset_acq_int
#define	atomic_cmpset_rel_32	atomic_cmpset_rel_int
#define	atomic_readandclear_32	atomic_readandclear_int
#define	atomic_fetchadd_32	atomic_fetchadd_int

/* Operations on pointers. */
#define	atomic_set_ptr(p, v) \
	atomic_set_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_set_acq_ptr(p, v) \
	atomic_set_acq_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_set_rel_ptr(p, v) \
	atomic_set_rel_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_clear_ptr(p, v) \
	atomic_clear_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_clear_acq_ptr(p, v) \
	atomic_clear_acq_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_clear_rel_ptr(p, v) \
	atomic_clear_rel_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_add_ptr(p, v) \
	atomic_add_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_add_acq_ptr(p, v) \
	atomic_add_acq_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_add_rel_ptr(p, v) \
	atomic_add_rel_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_subtract_ptr(p, v) \
	atomic_subtract_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_subtract_acq_ptr(p, v) \
	atomic_subtract_acq_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_subtract_rel_ptr(p, v) \
	atomic_subtract_rel_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_load_acq_ptr(p) \
	atomic_load_acq_int((volatile u_int *)(p))
#define	atomic_store_rel_ptr(p, v) \
	atomic_store_rel_int((volatile u_int *)(p), (v))
#define	atomic_cmpset_ptr(dst, old, new) \
	atomic_cmpset_int((volatile u_int *)(dst), (u_int)(old), (u_int)(new))
#define	atomic_cmpset_acq_ptr(dst, old, new) \
	atomic_cmpset_acq_int((volatile u_int *)(dst), (u_int)(old), \
	    (u_int)(new))
#define	atomic_cmpset_rel_ptr(dst, old, new) \
	atomic_cmpset_rel_int((volatile u_int *)(dst), (u_int)(old), \
	    (u_int)(new))
#define	atomic_readandclear_ptr(p) \
	atomic_readandclear_int((volatile u_int *)(p))
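/*
 * Pointer sketch (illustrative; the types and function are hypothetical).
 * On i386 a pointer is 32 bits wide, which is why the macros above can
 * simply cast to u_int.  A lock-free LIFO push using compare-and-set:
 *
 *	struct node { struct node *next; };
 *	static struct node *volatile head;
 *
 *	static __inline void
 *	example_push(struct node *n)
 *	{
 *		struct node *h;
 *
 *		do {
 *			h = head;
 *			n->next = h;
 *		} while (atomic_cmpset_ptr(&head, h, n) == 0);
 *	}
 *
 * atomic_cmpset_rel_ptr() could be used instead where the write of n->next
 * must be ordered before the new head becomes visible.
 */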
#endif /* !WANT_FUNCTIONS */

#endif /* !_MACHINE_ATOMIC_H_ */