atomic.h revision 286051
/*-
 * Copyright (c) 1998 Doug Rabson
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * $FreeBSD: head/sys/i386/include/atomic.h 286051 2015-07-30 00:13:20Z kib $
 */
#ifndef _MACHINE_ATOMIC_H_
#define	_MACHINE_ATOMIC_H_

#ifndef _SYS_CDEFS_H_
#error this file needs sys/cdefs.h as a prerequisite
#endif

#ifdef _KERNEL
#include <machine/md_var.h>
#include <machine/specialreg.h>
#endif

#ifndef __OFFSETOF_MONITORBUF
/*
 * __OFFSETOF_MONITORBUF == __pcpu_offset(pc_monitorbuf).
 *
 * The open-coded number is used instead of the symbolic expression to
 * avoid a dependency on sys/pcpu.h in machine/atomic.h consumers.
 * An assertion in i386/vm_machdep.c ensures that the value is correct.
 */
#define	__OFFSETOF_MONITORBUF	0x180

static __inline void
__mbk(void)
{

	__asm __volatile("lock; addl $0,%%fs:%0"
	    : "+m" (*(u_int *)__OFFSETOF_MONITORBUF) : : "memory", "cc");
}

static __inline void
__mbu(void)
{

	__asm __volatile("lock; addl $0,(%%esp)" : : : "memory", "cc");
}
#endif
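
/*
 * Illustrative sketch, not part of the original header: the assertion
 * mentioned above amounts to a compile-time cross-check along the
 * following lines (hypothetical form; the real check lives in
 * i386/vm_machdep.c, where sys/pcpu.h may be included).
 */
#if 0
#include <sys/pcpu.h>

CTASSERT(__OFFSETOF_MONITORBUF == __pcpu_offset(pc_monitorbuf));
#endif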

/*
 * Various simple operations on memory, each of which is atomic in the
 * presence of interrupts and multiple processors.
 *
 * atomic_set_char(P, V)	(*(u_char *)(P) |= (V))
 * atomic_clear_char(P, V)	(*(u_char *)(P) &= ~(V))
 * atomic_add_char(P, V)	(*(u_char *)(P) += (V))
 * atomic_subtract_char(P, V)	(*(u_char *)(P) -= (V))
 *
 * atomic_set_short(P, V)	(*(u_short *)(P) |= (V))
 * atomic_clear_short(P, V)	(*(u_short *)(P) &= ~(V))
 * atomic_add_short(P, V)	(*(u_short *)(P) += (V))
 * atomic_subtract_short(P, V)	(*(u_short *)(P) -= (V))
 *
 * atomic_set_int(P, V)		(*(u_int *)(P) |= (V))
 * atomic_clear_int(P, V)	(*(u_int *)(P) &= ~(V))
 * atomic_add_int(P, V)		(*(u_int *)(P) += (V))
 * atomic_subtract_int(P, V)	(*(u_int *)(P) -= (V))
 * atomic_swap_int(P, V)	(return (*(u_int *)(P)); *(u_int *)(P) = (V);)
 * atomic_readandclear_int(P)	(return (*(u_int *)(P)); *(u_int *)(P) = 0;)
 *
 * atomic_set_long(P, V)	(*(u_long *)(P) |= (V))
 * atomic_clear_long(P, V)	(*(u_long *)(P) &= ~(V))
 * atomic_add_long(P, V)	(*(u_long *)(P) += (V))
 * atomic_subtract_long(P, V)	(*(u_long *)(P) -= (V))
 * atomic_swap_long(P, V)	(return (*(u_long *)(P)); *(u_long *)(P) = (V);)
 * atomic_readandclear_long(P)	(return (*(u_long *)(P)); *(u_long *)(P) = 0;)
 */
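
/*
 * Illustrative example, not part of the original header: maintaining a
 * shared flags word with the operations above (hypothetical names).
 */
#if 0
static volatile u_int	sc_flags;
#define	SCF_BUSY	0x01
#define	SCF_WANTED	0x02

static void
sc_mark_busy(void)
{

	/* Set SCF_BUSY atomically; other bits are unaffected. */
	atomic_set_int(&sc_flags, SCF_BUSY);
}

static void
sc_clear_busy(void)
{

	/* Clear SCF_BUSY atomically, again without disturbing other bits. */
	atomic_clear_int(&sc_flags, SCF_BUSY);
}
#endif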

/*
 * The above functions are expanded inline in the statically-linked
 * kernel.  Lock prefixes are generated if an SMP kernel is being
 * built.
 *
 * Kernel modules call real functions which are built into the kernel.
 * This allows kernel modules to be portable between UP and SMP systems.
 */
#if defined(KLD_MODULE) || !defined(__GNUCLIKE_ASM)
#define	ATOMIC_ASM(NAME, TYPE, OP, CONS, V)			\
void atomic_##NAME##_##TYPE(volatile u_##TYPE *p, u_##TYPE v);	\
void atomic_##NAME##_barr_##TYPE(volatile u_##TYPE *p, u_##TYPE v)

int	atomic_cmpset_int(volatile u_int *dst, u_int expect, u_int src);
u_int	atomic_fetchadd_int(volatile u_int *p, u_int v);
int	atomic_testandset_int(volatile u_int *p, u_int v);
void	atomic_thread_fence_acq(void);
void	atomic_thread_fence_acq_rel(void);
void	atomic_thread_fence_rel(void);
void	atomic_thread_fence_seq_cst(void);

#define	ATOMIC_LOAD(TYPE)					\
u_##TYPE	atomic_load_acq_##TYPE(volatile u_##TYPE *p)
#define	ATOMIC_STORE(TYPE)					\
void		atomic_store_rel_##TYPE(volatile u_##TYPE *p, u_##TYPE v)

int		atomic_cmpset_64(volatile uint64_t *, uint64_t, uint64_t);
uint64_t	atomic_load_acq_64(volatile uint64_t *);
void		atomic_store_rel_64(volatile uint64_t *, uint64_t);
uint64_t	atomic_swap_64(volatile uint64_t *, uint64_t);

#else /* !KLD_MODULE && __GNUCLIKE_ASM */

/*
 * For userland, always use lock prefixes so that the binaries will run
 * on both SMP and !SMP systems.
 */
#if defined(SMP) || !defined(_KERNEL)
#define	MPLOCKED	"lock ; "
#else
#define	MPLOCKED
#endif

/*
 * The assembly is volatilized to avoid code chunk removal by the compiler.
 * GCC aggressively reorders operations and memory clobbering is necessary
 * in order to avoid that for memory barriers.
 */
#define	ATOMIC_ASM(NAME, TYPE, OP, CONS, V)		\
static __inline void					\
atomic_##NAME##_##TYPE(volatile u_##TYPE *p, u_##TYPE v)\
{							\
	__asm __volatile(MPLOCKED OP			\
	: "+m" (*p)					\
	: CONS (V)					\
	: "cc");					\
}							\
							\
static __inline void					\
atomic_##NAME##_barr_##TYPE(volatile u_##TYPE *p, u_##TYPE v)\
{							\
	__asm __volatile(MPLOCKED OP			\
	: "+m" (*p)					\
	: CONS (V)					\
	: "memory", "cc");				\
}							\
struct __hack

/*
 * Atomic compare and set, used by the mutex functions.
 *
 * if (*dst == expect) *dst = src (all 32 bit words)
 *
 * Returns 0 on failure, non-zero on success.
 */

#ifdef CPU_DISABLE_CMPXCHG

static __inline int
atomic_cmpset_int(volatile u_int *dst, u_int expect, u_int src)
{
	u_char res;

	__asm __volatile(
	"	pushfl ;		"
	"	cli ;			"
	"	cmpl	%3,%1 ;		"
	"	jne	1f ;		"
	"	movl	%2,%1 ;		"
	"1:				"
	"	sete	%0 ;		"
	"	popfl ;			"
	"# atomic_cmpset_int"
	: "=q" (res),			/* 0 */
	  "+m" (*dst)			/* 1 */
	: "r" (src),			/* 2 */
	  "r" (expect)			/* 3 */
	: "memory");
	return (res);
}

#else /* !CPU_DISABLE_CMPXCHG */

static __inline int
atomic_cmpset_int(volatile u_int *dst, u_int expect, u_int src)
{
	u_char res;

	__asm __volatile(
	"	" MPLOCKED "		"
	"	cmpxchgl %3,%1 ;	"
	"	sete	%0 ;		"
	"# atomic_cmpset_int"
	: "=q" (res),			/* 0 */
	  "+m" (*dst),			/* 1 */
	  "+a" (expect)			/* 2 */
	: "r" (src)			/* 3 */
	: "memory", "cc");
	return (res);
}

#endif /* CPU_DISABLE_CMPXCHG */
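
/*
 * Illustrative example, not part of the original header: the canonical
 * compare-and-set retry loop.  atomic_cmpset_int() succeeds only if
 * *p still holds the expected value, so an update computed from the
 * old value is retried until no other CPU intervenes.  The helper
 * below is a hypothetical sketch (UINT_MAX from <sys/limits.h>).
 */
#if 0
static u_int
saturating_increment(volatile u_int *p)
{
	u_int old;

	do {
		old = *p;
		if (old == UINT_MAX)
			break;		/* Already saturated; do not wrap. */
	} while (atomic_cmpset_int(p, old, old + 1) == 0);
	return (old);
}
#endif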

/*
 * Atomically add the value of v to the integer pointed to by p and return
 * the previous value of *p.
 */
static __inline u_int
atomic_fetchadd_int(volatile u_int *p, u_int v)
{

	__asm __volatile(
	"	" MPLOCKED "		"
	"	xaddl	%0,%1 ;		"
	"# atomic_fetchadd_int"
	: "+r" (v),			/* 0 */
	  "+m" (*p)			/* 1 */
	: : "cc");
	return (v);
}

static __inline int
atomic_testandset_int(volatile u_int *p, u_int v)
{
	u_char res;

	__asm __volatile(
	"	" MPLOCKED "		"
	"	btsl	%2,%1 ;		"
	"	setc	%0 ;		"
	"# atomic_testandset_int"
	: "=q" (res),			/* 0 */
	  "+m" (*p)			/* 1 */
	: "Ir" (v & 0x1f)		/* 2 */
	: "cc");
	return (res);
}
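
/*
 * Illustrative example, not part of the original header:
 * atomic_fetchadd_int() returns the value *p held before the addition,
 * which makes it a natural primitive for handing out unique ticket
 * numbers (hypothetical sketch).
 */
#if 0
static volatile u_int	next_ticket;

static u_int
ticket_alloc(void)
{

	/* Each caller receives a distinct value, even under contention. */
	return (atomic_fetchadd_int(&next_ticket, 1));
}
#endif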

/*
 * We assume that a = b will do atomic loads and stores.  Due to the
 * IA32 memory model, a simple store guarantees release semantics.
 *
 * However, a load may pass a store if they are performed on distinct
 * addresses, so we need a Store/Load barrier for sequentially
 * consistent fences in SMP kernels.  We use "lock addl $0,mem" for a
 * Store/Load barrier, as recommended by the AMD Software Optimization
 * Guide, and not mfence.  In the kernel, we use a private per-cpu
 * cache line as the target for the locked addition, to avoid
 * introducing false data dependencies.  In userspace, a word at the
 * top of the stack is utilized.
 *
 * For UP kernels, however, the memory of the single processor is
 * always consistent, so we only need to stop the compiler from
 * reordering accesses in a way that violates the semantics of acquire
 * and release.
 */

#if defined(_KERNEL)
#if defined(SMP)
#define	__storeload_barrier()	__mbk()
#else /* _KERNEL && UP */
#define	__storeload_barrier()	__compiler_membar()
#endif /* SMP */
#else /* !_KERNEL */
#define	__storeload_barrier()	__mbu()
#endif /* _KERNEL */

#define	ATOMIC_LOAD(TYPE)					\
static __inline u_##TYPE					\
atomic_load_acq_##TYPE(volatile u_##TYPE *p)			\
{								\
	u_##TYPE res;						\
								\
	res = *p;						\
	__compiler_membar();					\
	return (res);						\
}								\
struct __hack

#define	ATOMIC_STORE(TYPE)					\
static __inline void						\
atomic_store_rel_##TYPE(volatile u_##TYPE *p, u_##TYPE v)	\
{								\
								\
	__compiler_membar();					\
	*p = v;							\
}								\
struct __hack

static __inline void
atomic_thread_fence_acq(void)
{

	__compiler_membar();
}

static __inline void
atomic_thread_fence_rel(void)
{

	__compiler_membar();
}

static __inline void
atomic_thread_fence_acq_rel(void)
{

	__compiler_membar();
}

static __inline void
atomic_thread_fence_seq_cst(void)
{

	__storeload_barrier();
}
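
/*
 * Illustrative example, not part of the original header: a classic
 * message-passing handoff built on the acquire/release operations
 * generated from the ATOMIC_LOAD/ATOMIC_STORE templates above
 * (hypothetical names).  The release store orders the payload write
 * before the flag; the acquire load orders the flag check before the
 * payload read.
 */
#if 0
static u_int		payload;
static volatile u_int	ready;

static void
producer(void)
{

	payload = 42;				/* Plain store. */
	atomic_store_rel_int(&ready, 1);	/* Publishes payload. */
}

static u_int
consumer(void)
{

	while (atomic_load_acq_int(&ready) == 0)
		continue;
	return (payload);	/* Guaranteed to observe the value 42. */
}
#endif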

#ifdef _KERNEL

#ifdef WANT_FUNCTIONS
int		atomic_cmpset_64_i386(volatile uint64_t *, uint64_t, uint64_t);
int		atomic_cmpset_64_i586(volatile uint64_t *, uint64_t, uint64_t);
uint64_t	atomic_load_acq_64_i386(volatile uint64_t *);
uint64_t	atomic_load_acq_64_i586(volatile uint64_t *);
void		atomic_store_rel_64_i386(volatile uint64_t *, uint64_t);
void		atomic_store_rel_64_i586(volatile uint64_t *, uint64_t);
uint64_t	atomic_swap_64_i386(volatile uint64_t *, uint64_t);
uint64_t	atomic_swap_64_i586(volatile uint64_t *, uint64_t);
#endif

/* I486 does not support SMP or CMPXCHG8B. */
static __inline int
atomic_cmpset_64_i386(volatile uint64_t *dst, uint64_t expect, uint64_t src)
{
	volatile uint32_t *p;
	u_char res;

	p = (volatile uint32_t *)dst;
	__asm __volatile(
	"	pushfl ;		"
	"	cli ;			"
	"	xorl	%1,%%eax ;	"
	"	xorl	%2,%%edx ;	"
	"	orl	%%edx,%%eax ;	"
	"	jne	1f ;		"
	"	movl	%4,%1 ;		"
	"	movl	%5,%2 ;		"
	"1:				"
	"	sete	%3 ;		"
	"	popfl"
	: "+A" (expect),		/* 0 */
	  "+m" (*p),			/* 1 */
	  "+m" (*(p + 1)),		/* 2 */
	  "=q" (res)			/* 3 */
	: "r" ((uint32_t)src),		/* 4 */
	  "r" ((uint32_t)(src >> 32))	/* 5 */
	: "memory", "cc");
	return (res);
}

static __inline uint64_t
atomic_load_acq_64_i386(volatile uint64_t *p)
{
	volatile uint32_t *q;
	uint64_t res;

	q = (volatile uint32_t *)p;
	__asm __volatile(
	"	pushfl ;		"
	"	cli ;			"
	"	movl	%1,%%eax ;	"
	"	movl	%2,%%edx ;	"
	"	popfl"
	: "=&A" (res)			/* 0 */
	: "m" (*q),			/* 1 */
	  "m" (*(q + 1))		/* 2 */
	: "memory");
	return (res);
}

static __inline void
atomic_store_rel_64_i386(volatile uint64_t *p, uint64_t v)
{
	volatile uint32_t *q;

	q = (volatile uint32_t *)p;
	__asm __volatile(
	"	pushfl ;		"
	"	cli ;			"
	"	movl	%%eax,%0 ;	"
	"	movl	%%edx,%1 ;	"
	"	popfl"
	: "=m" (*q),			/* 0 */
	  "=m" (*(q + 1))		/* 1 */
	: "A" (v)			/* 2 */
	: "memory");
}

static __inline uint64_t
atomic_swap_64_i386(volatile uint64_t *p, uint64_t v)
{
	volatile uint32_t *q;
	uint64_t res;

	q = (volatile uint32_t *)p;
	__asm __volatile(
	"	pushfl ;		"
	"	cli ;			"
	"	movl	%1,%%eax ;	"
	"	movl	%2,%%edx ;	"
	"	movl	%4,%2 ;		"
	"	movl	%3,%1 ;		"
	"	popfl"
	: "=&A" (res),			/* 0 */
	  "+m" (*q),			/* 1 */
	  "+m" (*(q + 1))		/* 2 */
	: "r" ((uint32_t)v),		/* 3 */
	  "r" ((uint32_t)(v >> 32)));	/* 4 */
	return (res);
}

static __inline int
atomic_cmpset_64_i586(volatile uint64_t *dst, uint64_t expect, uint64_t src)
{
	u_char res;

	__asm __volatile(
	"	" MPLOCKED "		"
	"	cmpxchg8b %1 ;		"
	"	sete	%0"
	: "=q" (res),			/* 0 */
	  "+m" (*dst),			/* 1 */
	  "+A" (expect)			/* 2 */
	: "b" ((uint32_t)src),		/* 3 */
	  "c" ((uint32_t)(src >> 32))	/* 4 */
	: "memory", "cc");
	return (res);
}

static __inline uint64_t
atomic_load_acq_64_i586(volatile uint64_t *p)
{
	uint64_t res;

	__asm __volatile(
	"	movl	%%ebx,%%eax ;	"
	"	movl	%%ecx,%%edx ;	"
	"	" MPLOCKED "		"
	"	cmpxchg8b %1"
	: "=&A" (res),			/* 0 */
	  "+m" (*p)			/* 1 */
	: : "memory", "cc");
	return (res);
}

static __inline void
atomic_store_rel_64_i586(volatile uint64_t *p, uint64_t v)
{

	__asm __volatile(
	"	movl	%%eax,%%ebx ;	"
	"	movl	%%edx,%%ecx ;	"
	"1:				"
	"	" MPLOCKED "		"
	"	cmpxchg8b %0 ;		"
	"	jne	1b"
	: "+m" (*p),			/* 0 */
	  "+A" (v)			/* 1 */
	: : "ebx", "ecx", "memory", "cc");
}

static __inline uint64_t
atomic_swap_64_i586(volatile uint64_t *p, uint64_t v)
{

	__asm __volatile(
	"	movl	%%eax,%%ebx ;	"
	"	movl	%%edx,%%ecx ;	"
	"1:				"
	"	" MPLOCKED "		"
	"	cmpxchg8b %0 ;		"
	"	jne	1b"
	: "+m" (*p),			/* 0 */
	  "+A" (v)			/* 1 */
	: : "ebx", "ecx", "memory", "cc");
	return (v);
}

static __inline int
atomic_cmpset_64(volatile uint64_t *dst, uint64_t expect, uint64_t src)
{

	if ((cpu_feature & CPUID_CX8) == 0)
		return (atomic_cmpset_64_i386(dst, expect, src));
	else
		return (atomic_cmpset_64_i586(dst, expect, src));
}

static __inline uint64_t
atomic_load_acq_64(volatile uint64_t *p)
{

	if ((cpu_feature & CPUID_CX8) == 0)
		return (atomic_load_acq_64_i386(p));
	else
		return (atomic_load_acq_64_i586(p));
}

static __inline void
atomic_store_rel_64(volatile uint64_t *p, uint64_t v)
{

	if ((cpu_feature & CPUID_CX8) == 0)
		atomic_store_rel_64_i386(p, v);
	else
		atomic_store_rel_64_i586(p, v);
}

static __inline uint64_t
atomic_swap_64(volatile uint64_t *p, uint64_t v)
{

	if ((cpu_feature & CPUID_CX8) == 0)
		return (atomic_swap_64_i386(p, v));
	else
		return (atomic_swap_64_i586(p, v));
}

#endif /* _KERNEL */

#endif /* KLD_MODULE || !__GNUCLIKE_ASM */
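
/*
 * Illustrative example, not part of the original header: the 64-bit
 * operations above dispatch on CPUID_CX8 at run time, so kernel code
 * can use them uniformly on both i486- and cmpxchg8b-capable CPUs
 * (hypothetical sketch of a 64-bit counter).
 */
#if 0
static volatile uint64_t	stats_bytes;

static void
stats_add(uint64_t n)
{
	uint64_t old;

	/* 64-bit compare-and-set loop; works on any supported CPU. */
	do {
		old = atomic_load_acq_64(&stats_bytes);
	} while (atomic_cmpset_64(&stats_bytes, old, old + n) == 0);
}
#endif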

ATOMIC_ASM(set,	     char,  "orb %b1,%0",  "iq",  v);
ATOMIC_ASM(clear,    char,  "andb %b1,%0", "iq", ~v);
ATOMIC_ASM(add,	     char,  "addb %b1,%0", "iq",  v);
ATOMIC_ASM(subtract, char,  "subb %b1,%0", "iq",  v);

ATOMIC_ASM(set,	     short, "orw %w1,%0",  "ir",  v);
ATOMIC_ASM(clear,    short, "andw %w1,%0", "ir", ~v);
ATOMIC_ASM(add,	     short, "addw %w1,%0", "ir",  v);
ATOMIC_ASM(subtract, short, "subw %w1,%0", "ir",  v);

ATOMIC_ASM(set,	     int,   "orl %1,%0",   "ir",  v);
ATOMIC_ASM(clear,    int,   "andl %1,%0",  "ir", ~v);
ATOMIC_ASM(add,	     int,   "addl %1,%0",  "ir",  v);
ATOMIC_ASM(subtract, int,   "subl %1,%0",  "ir",  v);

ATOMIC_ASM(set,	     long,  "orl %1,%0",   "ir",  v);
ATOMIC_ASM(clear,    long,  "andl %1,%0",  "ir", ~v);
ATOMIC_ASM(add,	     long,  "addl %1,%0",  "ir",  v);
ATOMIC_ASM(subtract, long,  "subl %1,%0",  "ir",  v);

#define	ATOMIC_LOADSTORE(TYPE)				\
	ATOMIC_LOAD(TYPE);				\
	ATOMIC_STORE(TYPE)

ATOMIC_LOADSTORE(char);
ATOMIC_LOADSTORE(short);
ATOMIC_LOADSTORE(int);
ATOMIC_LOADSTORE(long);

#undef ATOMIC_ASM
#undef ATOMIC_LOAD
#undef ATOMIC_STORE
#undef ATOMIC_LOADSTORE

#ifndef WANT_FUNCTIONS

static __inline int
atomic_cmpset_long(volatile u_long *dst, u_long expect, u_long src)
{

	return (atomic_cmpset_int((volatile u_int *)dst, (u_int)expect,
	    (u_int)src));
}

static __inline u_long
atomic_fetchadd_long(volatile u_long *p, u_long v)
{

	return (atomic_fetchadd_int((volatile u_int *)p, (u_int)v));
}

static __inline int
atomic_testandset_long(volatile u_long *p, u_int v)
{

	return (atomic_testandset_int((volatile u_int *)p, v));
}
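
/*
 * Illustrative example, not part of the original header:
 * atomic_testandset_int() returns the previous state of the bit, the
 * usual building block for a try-lock bit (hypothetical sketch; a
 * real lock would also need a contention and release protocol).
 */
#if 0
static volatile u_int	lock_word;

static int
bit_trylock(void)
{

	/* Returns nonzero if bit 0 was clear and is now owned by us. */
	return (atomic_testandset_int(&lock_word, 0) == 0);
}
#endif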

/* Read the current value and store a new value in the destination. */
#ifdef __GNUCLIKE_ASM

static __inline u_int
atomic_swap_int(volatile u_int *p, u_int v)
{

	__asm __volatile(
	"	xchgl	%1,%0 ;		"
	"# atomic_swap_int"
	: "+r" (v),			/* 0 */
	  "+m" (*p));			/* 1 */
	return (v);
}

static __inline u_long
atomic_swap_long(volatile u_long *p, u_long v)
{

	return (atomic_swap_int((volatile u_int *)p, (u_int)v));
}

#else /* !__GNUCLIKE_ASM */

u_int	atomic_swap_int(volatile u_int *p, u_int v);
u_long	atomic_swap_long(volatile u_long *p, u_long v);

#endif /* __GNUCLIKE_ASM */

#define	atomic_set_acq_char		atomic_set_barr_char
#define	atomic_set_rel_char		atomic_set_barr_char
#define	atomic_clear_acq_char		atomic_clear_barr_char
#define	atomic_clear_rel_char		atomic_clear_barr_char
#define	atomic_add_acq_char		atomic_add_barr_char
#define	atomic_add_rel_char		atomic_add_barr_char
#define	atomic_subtract_acq_char	atomic_subtract_barr_char
#define	atomic_subtract_rel_char	atomic_subtract_barr_char

#define	atomic_set_acq_short		atomic_set_barr_short
#define	atomic_set_rel_short		atomic_set_barr_short
#define	atomic_clear_acq_short		atomic_clear_barr_short
#define	atomic_clear_rel_short		atomic_clear_barr_short
#define	atomic_add_acq_short		atomic_add_barr_short
#define	atomic_add_rel_short		atomic_add_barr_short
#define	atomic_subtract_acq_short	atomic_subtract_barr_short
#define	atomic_subtract_rel_short	atomic_subtract_barr_short

#define	atomic_set_acq_int		atomic_set_barr_int
#define	atomic_set_rel_int		atomic_set_barr_int
#define	atomic_clear_acq_int		atomic_clear_barr_int
#define	atomic_clear_rel_int		atomic_clear_barr_int
#define	atomic_add_acq_int		atomic_add_barr_int
#define	atomic_add_rel_int		atomic_add_barr_int
#define	atomic_subtract_acq_int		atomic_subtract_barr_int
#define	atomic_subtract_rel_int		atomic_subtract_barr_int
#define	atomic_cmpset_acq_int		atomic_cmpset_int
#define	atomic_cmpset_rel_int		atomic_cmpset_int

#define	atomic_set_acq_long		atomic_set_barr_long
#define	atomic_set_rel_long		atomic_set_barr_long
#define	atomic_clear_acq_long		atomic_clear_barr_long
#define	atomic_clear_rel_long		atomic_clear_barr_long
#define	atomic_add_acq_long		atomic_add_barr_long
#define	atomic_add_rel_long		atomic_add_barr_long
#define	atomic_subtract_acq_long	atomic_subtract_barr_long
#define	atomic_subtract_rel_long	atomic_subtract_barr_long
#define	atomic_cmpset_acq_long		atomic_cmpset_long
#define	atomic_cmpset_rel_long		atomic_cmpset_long
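
/*
 * Illustrative example, not part of the original header:
 * atomic_swap_int() (and the readandclear aliases built on it below)
 * drains a word of pending-event bits in a single step (hypothetical
 * sketch).
 */
#if 0
static volatile u_int	pending_events;

static u_int
events_drain(void)
{

	/* Fetch all pending bits and reset the word to zero atomically. */
	return (atomic_swap_int(&pending_events, 0));
}
#endif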

#define	atomic_readandclear_int(p)	atomic_swap_int(p, 0)
#define	atomic_readandclear_long(p)	atomic_swap_long(p, 0)

/* Operations on 8-bit bytes. */
#define	atomic_set_8		atomic_set_char
#define	atomic_set_acq_8	atomic_set_acq_char
#define	atomic_set_rel_8	atomic_set_rel_char
#define	atomic_clear_8		atomic_clear_char
#define	atomic_clear_acq_8	atomic_clear_acq_char
#define	atomic_clear_rel_8	atomic_clear_rel_char
#define	atomic_add_8		atomic_add_char
#define	atomic_add_acq_8	atomic_add_acq_char
#define	atomic_add_rel_8	atomic_add_rel_char
#define	atomic_subtract_8	atomic_subtract_char
#define	atomic_subtract_acq_8	atomic_subtract_acq_char
#define	atomic_subtract_rel_8	atomic_subtract_rel_char
#define	atomic_load_acq_8	atomic_load_acq_char
#define	atomic_store_rel_8	atomic_store_rel_char

/* Operations on 16-bit words. */
#define	atomic_set_16		atomic_set_short
#define	atomic_set_acq_16	atomic_set_acq_short
#define	atomic_set_rel_16	atomic_set_rel_short
#define	atomic_clear_16		atomic_clear_short
#define	atomic_clear_acq_16	atomic_clear_acq_short
#define	atomic_clear_rel_16	atomic_clear_rel_short
#define	atomic_add_16		atomic_add_short
#define	atomic_add_acq_16	atomic_add_acq_short
#define	atomic_add_rel_16	atomic_add_rel_short
#define	atomic_subtract_16	atomic_subtract_short
#define	atomic_subtract_acq_16	atomic_subtract_acq_short
#define	atomic_subtract_rel_16	atomic_subtract_rel_short
#define	atomic_load_acq_16	atomic_load_acq_short
#define	atomic_store_rel_16	atomic_store_rel_short

/* Operations on 32-bit double words. */
#define	atomic_set_32		atomic_set_int
#define	atomic_set_acq_32	atomic_set_acq_int
#define	atomic_set_rel_32	atomic_set_rel_int
#define	atomic_clear_32		atomic_clear_int
#define	atomic_clear_acq_32	atomic_clear_acq_int
#define	atomic_clear_rel_32	atomic_clear_rel_int
#define	atomic_add_32		atomic_add_int
#define	atomic_add_acq_32	atomic_add_acq_int
#define	atomic_add_rel_32	atomic_add_rel_int
#define	atomic_subtract_32	atomic_subtract_int
#define	atomic_subtract_acq_32	atomic_subtract_acq_int
#define	atomic_subtract_rel_32	atomic_subtract_rel_int
#define	atomic_load_acq_32	atomic_load_acq_int
#define	atomic_store_rel_32	atomic_store_rel_int
#define	atomic_cmpset_32	atomic_cmpset_int
#define	atomic_cmpset_acq_32	atomic_cmpset_acq_int
#define	atomic_cmpset_rel_32	atomic_cmpset_rel_int
#define	atomic_swap_32		atomic_swap_int
#define	atomic_readandclear_32	atomic_readandclear_int
#define	atomic_fetchadd_32	atomic_fetchadd_int
#define	atomic_testandset_32	atomic_testandset_int

/* Operations on pointers. */
#define	atomic_set_ptr(p, v) \
	atomic_set_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_set_acq_ptr(p, v) \
	atomic_set_acq_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_set_rel_ptr(p, v) \
	atomic_set_rel_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_clear_ptr(p, v) \
	atomic_clear_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_clear_acq_ptr(p, v) \
	atomic_clear_acq_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_clear_rel_ptr(p, v) \
	atomic_clear_rel_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_add_ptr(p, v) \
	atomic_add_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_add_acq_ptr(p, v) \
	atomic_add_acq_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_add_rel_ptr(p, v) \
	atomic_add_rel_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_subtract_ptr(p, v) \
	atomic_subtract_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_subtract_acq_ptr(p, v) \
	atomic_subtract_acq_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_subtract_rel_ptr(p, v) \
	atomic_subtract_rel_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_load_acq_ptr(p) \
	atomic_load_acq_int((volatile u_int *)(p))
#define	atomic_store_rel_ptr(p, v) \
	atomic_store_rel_int((volatile u_int *)(p), (v))
#define	atomic_cmpset_ptr(dst, old, new) \
	atomic_cmpset_int((volatile u_int *)(dst), (u_int)(old), (u_int)(new))
#define	atomic_cmpset_acq_ptr(dst, old, new) \
	atomic_cmpset_acq_int((volatile u_int *)(dst), (u_int)(old), \
	    (u_int)(new))
#define	atomic_cmpset_rel_ptr(dst, old, new) \
	atomic_cmpset_rel_int((volatile u_int *)(dst), (u_int)(old), \
	    (u_int)(new))
#define	atomic_swap_ptr(p, v) \
	atomic_swap_int((volatile u_int *)(p), (u_int)(v))
#define	atomic_readandclear_ptr(p) \
	atomic_readandclear_int((volatile u_int *)(p))

#endif /* !WANT_FUNCTIONS */

#if defined(_KERNEL)
#define	mb()	__mbk()
#define	wmb()	__mbk()
#define	rmb()	__mbk()
#else
#define	mb()	__mbu()
#define	wmb()	__mbu()
#define	rmb()	__mbu()
#endif

#endif /* !_MACHINE_ATOMIC_H_ */