1d265f300SJohn Baldwin.\" Copyright (c) 2000-2001 John H. Baldwin <jhb@FreeBSD.org> 2eaca6183SJohn Baldwin.\" 3eaca6183SJohn Baldwin.\" Redistribution and use in source and binary forms, with or without 4eaca6183SJohn Baldwin.\" modification, are permitted provided that the following conditions 5eaca6183SJohn Baldwin.\" are met: 6eaca6183SJohn Baldwin.\" 1. Redistributions of source code must retain the above copyright 7eaca6183SJohn Baldwin.\" notice, this list of conditions and the following disclaimer. 8eaca6183SJohn Baldwin.\" 2. Redistributions in binary form must reproduce the above copyright 9eaca6183SJohn Baldwin.\" notice, this list of conditions and the following disclaimer in the 10eaca6183SJohn Baldwin.\" documentation and/or other materials provided with the distribution. 11eaca6183SJohn Baldwin.\" 12eaca6183SJohn Baldwin.\" THIS SOFTWARE IS PROVIDED BY THE DEVELOPERS ``AS IS'' AND ANY EXPRESS OR 13eaca6183SJohn Baldwin.\" IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 14eaca6183SJohn Baldwin.\" OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 15eaca6183SJohn Baldwin.\" IN NO EVENT SHALL THE DEVELOPERS BE LIABLE FOR ANY DIRECT, INDIRECT, 16eaca6183SJohn Baldwin.\" INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 17eaca6183SJohn Baldwin.\" NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 18eaca6183SJohn Baldwin.\" DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 19eaca6183SJohn Baldwin.\" THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 20eaca6183SJohn Baldwin.\" (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 21eaca6183SJohn Baldwin.\" THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 22eaca6183SJohn Baldwin.\" 23*32c45723SOlivier Certner.Dd December 16, 2024 24eaca6183SJohn Baldwin.Dt ATOMIC 9 25aa12cea2SUlrich Spörlein.Os 26eaca6183SJohn Baldwin.Sh NAME 27eaca6183SJohn Baldwin.Nm atomic_add , 28eaca6183SJohn Baldwin.Nm atomic_clear , 29eaca6183SJohn Baldwin.Nm atomic_cmpset , 30c0b995bbSMateusz Guzik.Nm atomic_fcmpset , 314ea211a4SJohn Baldwin.Nm atomic_fetchadd , 32e2494f75SKonstantin Belousov.Nm atomic_interrupt_fence , 33eaca6183SJohn Baldwin.Nm atomic_load , 34eaca6183SJohn Baldwin.Nm atomic_readandclear , 35eaca6183SJohn Baldwin.Nm atomic_set , 36eaca6183SJohn Baldwin.Nm atomic_subtract , 3722fd1b5dSAlan Cox.Nm atomic_store , 3822fd1b5dSAlan Cox.Nm atomic_thread_fence 39eaca6183SJohn Baldwin.Nd atomic operations 40eaca6183SJohn Baldwin.Sh SYNOPSIS 4132eef9aeSRuslan Ermilov.In machine/atomic.h 42eaca6183SJohn Baldwin.Ft void 43c6a51f1cSRuslan Ermilov.Fn atomic_add_[acq_|rel_]<type> "volatile <type> *p" "<type> v" 44eaca6183SJohn Baldwin.Ft void 45c6a51f1cSRuslan Ermilov.Fn atomic_clear_[acq_|rel_]<type> "volatile <type> *p" "<type> v" 46eaca6183SJohn Baldwin.Ft int 47c6a51f1cSRuslan Ermilov.Fo atomic_cmpset_[acq_|rel_]<type> 48c6a51f1cSRuslan Ermilov.Fa "volatile <type> *dst" 49c6a51f1cSRuslan Ermilov.Fa "<type> old" 50c6a51f1cSRuslan Ermilov.Fa "<type> new" 51eaca6183SJohn Baldwin.Fc 52c0b995bbSMateusz Guzik.Ft int 53c0b995bbSMateusz Guzik.Fo atomic_fcmpset_[acq_|rel_]<type> 54c0b995bbSMateusz Guzik.Fa "volatile <type> *dst" 55c0b995bbSMateusz Guzik.Fa "<type> *old" 56c0b995bbSMateusz Guzik.Fa "<type> new" 57c0b995bbSMateusz Guzik.Fc 58c6a51f1cSRuslan Ermilov.Ft <type> 594ea211a4SJohn Baldwin.Fn atomic_fetchadd_<type> "volatile <type> *p" "<type> v" 60e2494f75SKonstantin Belousov.Ft void 61e2494f75SKonstantin Belousov.Fn atomic_interrupt_fence "void" 624ea211a4SJohn Baldwin.Ft <type> 63*32c45723SOlivier Certner.Fn atomic_load_[acq_]<type> "const volatile <type> *p" 64c6a51f1cSRuslan Ermilov.Ft <type> 65c6a51f1cSRuslan Ermilov.Fn atomic_readandclear_<type> "volatile <type> *p" 66eaca6183SJohn Baldwin.Ft void 67c6a51f1cSRuslan Ermilov.Fn atomic_set_[acq_|rel_]<type> "volatile <type> *p" "<type> v" 68eaca6183SJohn Baldwin.Ft void 69c6a51f1cSRuslan Ermilov.Fn atomic_subtract_[acq_|rel_]<type> "volatile <type> *p" "<type> v" 70eaca6183SJohn Baldwin.Ft void 7122fd1b5dSAlan Cox.Fn atomic_store_[rel_]<type> "volatile <type> *p" "<type> v" 728a1ee2d3SJung-uk Kim.Ft <type> 738a1ee2d3SJung-uk Kim.Fn atomic_swap_<type> "volatile <type> *p" "<type> v" 748a1ee2d3SJung-uk Kim.Ft int 75dfdc9a05SSepherosa Ziehau.Fn atomic_testandclear_<type> "volatile <type> *p" "u_int v" 76dfdc9a05SSepherosa Ziehau.Ft int 778a1ee2d3SJung-uk Kim.Fn atomic_testandset_<type> "volatile <type> *p" "u_int v" 7822fd1b5dSAlan Cox.Ft void 7922fd1b5dSAlan Cox.Fn atomic_thread_fence_[acq|acq_rel|rel|seq_cst] "void" 80eaca6183SJohn Baldwin.Sh DESCRIPTION 8122fd1b5dSAlan CoxAtomic operations are commonly used to implement reference counts and as 8222fd1b5dSAlan Coxbuilding blocks for synchronization primitives, such as mutexes. 8322fd1b5dSAlan Cox.Pp 8422fd1b5dSAlan CoxAll of these operations are performed 8522fd1b5dSAlan Cox.Em atomically 8622fd1b5dSAlan Coxacross multiple threads and in the presence of interrupts, meaning that they 8722fd1b5dSAlan Coxare performed in an indivisible manner from the perspective of concurrently 88c9b6b582SKonstantin Belousovrunning threads and interrupt handlers. 89c9b6b582SKonstantin Belousov.Pp 9022fd1b5dSAlan CoxOn all architectures supported by 9122fd1b5dSAlan Cox.Fx , 9222fd1b5dSAlan Coxordinary loads and stores of integers in cache-coherent memory are 9322fd1b5dSAlan Coxinherently atomic if the integer is naturally aligned and its size does not 9422fd1b5dSAlan Coxexceed the processor's word size. 9522fd1b5dSAlan CoxHowever, such loads and stores may be elided from the program by 9622fd1b5dSAlan Coxthe compiler, whereas atomic operations are always performed. 9722fd1b5dSAlan Cox.Pp 98c9b6b582SKonstantin BelousovWhen atomic operations are performed on cache-coherent memory, all 99c9b6b582SKonstantin Belousovoperations on the same location are totally ordered. 100c9b6b582SKonstantin Belousov.Pp 101c9b6b582SKonstantin BelousovWhen an atomic load is performed on a location in cache-coherent memory, 102c9b6b582SKonstantin Belousovit reads the entire value that was defined by the last atomic store to 103c9b6b582SKonstantin Belousoveach byte of the location. 104c9b6b582SKonstantin BelousovAn atomic load will never return a value out of thin air. 105c9b6b582SKonstantin BelousovWhen an atomic store is performed on a location, no other thread or 106c9b6b582SKonstantin Belousovinterrupt handler will observe a 107c9b6b582SKonstantin Belousov.Em torn write , 108c9b6b582SKonstantin Belousovor partial modification of the location. 109c9b6b582SKonstantin Belousov.Pp 11022fd1b5dSAlan CoxExcept as noted below, the semantics of these operations are almost 11122fd1b5dSAlan Coxidentical to the semantics of similarly named C11 atomic operations. 112eaca6183SJohn Baldwin.Ss Types 11322fd1b5dSAlan CoxMost atomic operations act upon a specific 1140640e9e0SHiten Pandya.Fa type . 11522fd1b5dSAlan CoxThat type is indicated in the function name. 11622fd1b5dSAlan CoxIn contrast to C11 atomic operations, 11722fd1b5dSAlan Cox.Fx Ns 's 11822fd1b5dSAlan Coxatomic operations are performed on ordinary integer types. 11922fd1b5dSAlan CoxThe available types are: 1202be6c09fSRuslan Ermilov.Pp 1212be6c09fSRuslan Ermilov.Bl -tag -offset indent -width short -compact 1222be6c09fSRuslan Ermilov.It Li int 123eaca6183SJohn Baldwinunsigned integer 1242be6c09fSRuslan Ermilov.It Li long 125eaca6183SJohn Baldwinunsigned long integer 1262be6c09fSRuslan Ermilov.It Li ptr 127eaca6183SJohn Baldwinunsigned integer the size of a pointer 1282be6c09fSRuslan Ermilov.It Li 32 129eaca6183SJohn Baldwinunsigned 32-bit integer 1302be6c09fSRuslan Ermilov.It Li 64 131eaca6183SJohn Baldwinunsigned 64-bit integer 132eaca6183SJohn Baldwin.El 133eaca6183SJohn Baldwin.Pp 134eaca6183SJohn BaldwinFor example, the function to atomically add two integers is called 135eaca6183SJohn Baldwin.Fn atomic_add_int . 136c645e17aSJake Burkholder.Pp 1372be6c09fSRuslan ErmilovCertain architectures also provide operations for types smaller than 1382be6c09fSRuslan Ermilov.Dq Li int . 1392be6c09fSRuslan Ermilov.Pp 1402be6c09fSRuslan Ermilov.Bl -tag -offset indent -width short -compact 1412be6c09fSRuslan Ermilov.It Li char 142c645e17aSJake Burkholderunsigned character 1432be6c09fSRuslan Ermilov.It Li short 144c645e17aSJake Burkholderunsigned short integer 1452be6c09fSRuslan Ermilov.It Li 8 146c645e17aSJake Burkholderunsigned 8-bit integer 1472be6c09fSRuslan Ermilov.It Li 16 148c645e17aSJake Burkholderunsigned 16-bit integer 149c645e17aSJake Burkholder.El 150c645e17aSJake Burkholder.Pp 15122fd1b5dSAlan CoxThese types must not be used in machine-independent code. 152cff0a327SAlan Cox.Ss Acquire and Release Operations 153cff0a327SAlan CoxBy default, a thread's accesses to different memory locations might not be 154cff0a327SAlan Coxperformed in 155cff0a327SAlan Cox.Em program order , 156cff0a327SAlan Coxthat is, the order in which the accesses appear in the source code. 157cff0a327SAlan CoxTo optimize the program's execution, both the compiler and processor might 158cff0a327SAlan Coxreorder the thread's accesses. 159cff0a327SAlan CoxHowever, both ensure that their reordering of the accesses is not visible to 160cff0a327SAlan Coxthe thread. 161cff0a327SAlan CoxOtherwise, the traditional memory model that is expected by single-threaded 162cff0a327SAlan Coxprograms would be violated. 163cff0a327SAlan CoxNonetheless, other threads in a multithreaded program, such as the 164cff0a327SAlan Cox.Fx 165cff0a327SAlan Coxkernel, might observe the reordering. 166cff0a327SAlan CoxMoreover, in some cases, such as the implementation of synchronization between 167cff0a327SAlan Coxthreads, arbitrary reordering might result in the incorrect execution of the 168cff0a327SAlan Coxprogram. 169cff0a327SAlan CoxTo constrain the reordering that both the compiler and processor might perform 17022fd1b5dSAlan Coxon a thread's accesses, a programmer can use atomic operations with 17177054356SKonstantin Belousov.Em acquire 172cff0a327SAlan Coxand 173cff0a327SAlan Cox.Em release 174cff0a327SAlan Coxsemantics. 175cff0a327SAlan Cox.Pp 17622fd1b5dSAlan CoxAtomic operations on memory have up to three variants. 17777863e4bSKonstantin BelousovThe first, or 17877863e4bSKonstantin Belousov.Em relaxed 17977863e4bSKonstantin Belousovvariant, performs the operation without imposing any ordering constraints on 18077863e4bSKonstantin Belousovaccesses to other memory locations. 18177863e4bSKonstantin BelousovThis variant is the default. 182cff0a327SAlan CoxThe second variant has acquire semantics, and the third variant has release 183cff0a327SAlan Coxsemantics. 184cff0a327SAlan Cox.Pp 18522fd1b5dSAlan CoxWhen an atomic operation has acquire semantics, the operation must have 18622fd1b5dSAlan Coxcompleted before any subsequent load or store (by program order) is 187cff0a327SAlan Coxperformed. 188cff0a327SAlan CoxConversely, acquire semantics do not require that prior loads or stores have 189cff0a327SAlan Coxcompleted before the atomic operation is performed. 19022fd1b5dSAlan CoxAn atomic operation can only have acquire semantics if it performs a load 19122fd1b5dSAlan Coxfrom memory. 192cff0a327SAlan CoxTo denote acquire semantics, the suffix 1932be6c09fSRuslan Ermilov.Dq Li _acq 194eaca6183SJohn Baldwinis inserted into the function name immediately prior to the 1950640e9e0SHiten Pandya.Dq Li _ Ns Aq Fa type 196eaca6183SJohn Baldwinsuffix. 19722fd1b5dSAlan CoxFor example, to subtract two integers ensuring that the subtraction is 19822fd1b5dSAlan Coxcompleted before any subsequent loads and stores are performed, use 199eaca6183SJohn Baldwin.Fn atomic_subtract_acq_int . 200eaca6183SJohn Baldwin.Pp 20122fd1b5dSAlan CoxWhen an atomic operation has release semantics, all prior loads or stores 20222fd1b5dSAlan Cox(by program order) must have completed before the operation is performed. 20322fd1b5dSAlan CoxConversely, release semantics do not require that the atomic operation must 20422fd1b5dSAlan Coxhave completed before any subsequent load or store is performed. 20522fd1b5dSAlan CoxAn atomic operation can only have release semantics if it performs a store 20622fd1b5dSAlan Coxto memory. 207cff0a327SAlan CoxTo denote release semantics, the suffix 2082be6c09fSRuslan Ermilov.Dq Li _rel 209eaca6183SJohn Baldwinis inserted into the function name immediately prior to the 2100640e9e0SHiten Pandya.Dq Li _ Ns Aq Fa type 211eaca6183SJohn Baldwinsuffix. 212cff0a327SAlan CoxFor example, to add two long integers ensuring that all prior loads and 21322fd1b5dSAlan Coxstores are completed before the addition is performed, use 214eaca6183SJohn Baldwin.Fn atomic_add_rel_long . 215eaca6183SJohn Baldwin.Pp 21622fd1b5dSAlan CoxWhen a release operation by one thread 21722fd1b5dSAlan Cox.Em synchronizes with 21822fd1b5dSAlan Coxan acquire operation by another thread, usually meaning that the acquire 21922fd1b5dSAlan Coxoperation reads the value written by the release operation, then the effects 22022fd1b5dSAlan Coxof all prior stores by the releasing thread must become visible to 22122fd1b5dSAlan Coxsubsequent loads by the acquiring thread. 22222fd1b5dSAlan CoxMoreover, the effects of all stores (by other threads) that were visible to 22322fd1b5dSAlan Coxthe releasing thread must also become visible to the acquiring thread. 22422fd1b5dSAlan CoxThese rules only apply to the synchronizing threads. 22522fd1b5dSAlan CoxOther threads might observe these stores in a different order. 22622fd1b5dSAlan Cox.Pp 22722fd1b5dSAlan CoxIn effect, atomic operations with acquire and release semantics establish 22822fd1b5dSAlan Coxone-way barriers to reordering that enable the implementations of 22922fd1b5dSAlan Coxsynchronization primitives to express their ordering requirements without 23022fd1b5dSAlan Coxalso imposing unnecessary ordering. 231cff0a327SAlan CoxFor example, for a critical section guarded by a mutex, an acquire operation 232cff0a327SAlan Coxwhen the mutex is locked and a release operation when the mutex is unlocked 233cff0a327SAlan Coxwill prevent any loads or stores from moving outside of the critical 234cff0a327SAlan Coxsection. 235cff0a327SAlan CoxHowever, they will not prevent the compiler or processor from moving loads 236cff0a327SAlan Coxor stores into the critical section, which does not violate the semantics of 237cff0a327SAlan Coxa mutex. 23822fd1b5dSAlan Cox.Ss Thread Fence Operations 23922fd1b5dSAlan CoxAlternatively, a programmer can use atomic thread fence operations to 24022fd1b5dSAlan Coxconstrain the reordering of accesses. 24122fd1b5dSAlan CoxIn contrast to other atomic operations, fences do not, themselves, access 24222fd1b5dSAlan Coxmemory. 24322fd1b5dSAlan Cox.Pp 24422fd1b5dSAlan CoxWhen a fence has acquire semantics, all prior loads (by program order) must 24522fd1b5dSAlan Coxhave completed before any subsequent load or store is performed. 24622fd1b5dSAlan CoxThus, an acquire fence is a two-way barrier for load operations. 24722fd1b5dSAlan CoxTo denote acquire semantics, the suffix 24822fd1b5dSAlan Cox.Dq Li _acq 24922fd1b5dSAlan Coxis appended to the function name, for example, 25022fd1b5dSAlan Cox.Fn atomic_thread_fence_acq . 25122fd1b5dSAlan Cox.Pp 25222fd1b5dSAlan CoxWhen a fence has release semantics, all prior loads or stores (by program 25322fd1b5dSAlan Coxorder) must have completed before any subsequent store operation is 25422fd1b5dSAlan Coxperformed. 25522fd1b5dSAlan CoxThus, a release fence is a two-way barrier for store operations. 25622fd1b5dSAlan CoxTo denote release semantics, the suffix 25722fd1b5dSAlan Cox.Dq Li _rel 25822fd1b5dSAlan Coxis appended to the function name, for example, 25922fd1b5dSAlan Cox.Fn atomic_thread_fence_rel . 26022fd1b5dSAlan Cox.Pp 26122fd1b5dSAlan CoxAlthough 26222fd1b5dSAlan Cox.Fn atomic_thread_fence_acq_rel 26322fd1b5dSAlan Coximplements both acquire and release semantics, it is not a full barrier. 26422fd1b5dSAlan CoxFor example, a store prior to the fence (in program order) may be completed 26522fd1b5dSAlan Coxafter a load subsequent to the fence. 26622fd1b5dSAlan CoxIn contrast, 26722fd1b5dSAlan Cox.Fn atomic_thread_fence_seq_cst 26822fd1b5dSAlan Coximplements a full barrier. 26922fd1b5dSAlan CoxNeither loads nor stores may cross this barrier in either direction. 27022fd1b5dSAlan Cox.Pp 27122fd1b5dSAlan CoxIn C11, a release fence by one thread synchronizes with an acquire fence by 27222fd1b5dSAlan Coxanother thread when an atomic load that is prior to the acquire fence (by 27322fd1b5dSAlan Coxprogram order) reads the value written by an atomic store that is subsequent 27422fd1b5dSAlan Coxto the release fence. 27555ed6718SBenedict ReuschlingIn constrast, in 27655ed6718SBenedict Reuschling.Fx , 27755ed6718SBenedict Reuschlingbecause of the atomicity of ordinary, naturally 27822fd1b5dSAlan Coxaligned loads and stores, fences can also be synchronized by ordinary loads 27922fd1b5dSAlan Coxand stores. 28022fd1b5dSAlan CoxThis simplifies the implementation and use of some synchronization 28122fd1b5dSAlan Coxprimitives in 28222fd1b5dSAlan Cox.Fx . 28322fd1b5dSAlan Cox.Pp 28422fd1b5dSAlan CoxSince neither a compiler nor a processor can foresee which (atomic) load 28522fd1b5dSAlan Coxwill read the value written by an (atomic) store, the ordering constraints 28622fd1b5dSAlan Coximposed by fences must be more restrictive than acquire loads and release 28722fd1b5dSAlan Coxstores. 28822fd1b5dSAlan CoxEssentially, this is why fences are two-way barriers. 28922fd1b5dSAlan Cox.Pp 29022fd1b5dSAlan CoxAlthough fences impose more restrictive ordering than acquire loads and 29122fd1b5dSAlan Coxrelease stores, by separating access from ordering, they can sometimes 29222fd1b5dSAlan Coxfacilitate more efficient implementations of synchronization primitives. 29322fd1b5dSAlan CoxFor example, they can be used to avoid executing a memory barrier until a 29422fd1b5dSAlan Coxmemory access shows that some condition is satisfied. 295e2494f75SKonstantin Belousov.Ss Interrupt Fence Operations 296e2494f75SKonstantin BelousovThe 29732068667SChristian Brueffer.Fn atomic_interrupt_fence 298e2494f75SKonstantin Belousovfunction establishes ordering between its call location and any interrupt 299e2494f75SKonstantin Belousovhandler executing on the same CPU. 300e2494f75SKonstantin BelousovIt is modeled after the similar C11 function 30132068667SChristian Brueffer.Fn atomic_signal_fence , 302e2494f75SKonstantin Belousovand adapted for the kernel environment. 303eaca6183SJohn Baldwin.Ss Multiple Processors 304a61bd957SAlan CoxIn multiprocessor systems, the atomicity of the atomic operations on memory 305a61bd957SAlan Coxdepends on support for cache coherence in the underlying architecture. 306a61bd957SAlan CoxIn general, cache coherence on the default memory type, 307a61bd957SAlan Cox.Dv VM_MEMATTR_DEFAULT , 308a61bd957SAlan Coxis guaranteed by all architectures that are supported by 309a61bd957SAlan Cox.Fx . 310a61bd957SAlan CoxFor example, cache coherence is guaranteed on write-back memory by the 311a61bd957SAlan Cox.Tn amd64 312a61bd957SAlan Coxand 313eaca6183SJohn Baldwin.Tn i386 314a61bd957SAlan Coxarchitectures. 315cff0a327SAlan CoxHowever, on some architectures, cache coherence might not be enabled on all 316a61bd957SAlan Coxmemory types. 317a61bd957SAlan CoxTo determine if cache coherence is enabled for a non-default memory type, 318a61bd957SAlan Coxconsult the architecture's documentation. 319eaca6183SJohn Baldwin.Ss Semantics 320eaca6183SJohn BaldwinThis section describes the semantics of each operation using a C like notation. 321eaca6183SJohn Baldwin.Bl -hang 3222be6c09fSRuslan Ermilov.It Fn atomic_add p v 3232be6c09fSRuslan Ermilov.Bd -literal -compact 324eaca6183SJohn Baldwin*p += v; 325eaca6183SJohn Baldwin.Ed 3262be6c09fSRuslan Ermilov.It Fn atomic_clear p v 3272be6c09fSRuslan Ermilov.Bd -literal -compact 328eaca6183SJohn Baldwin*p &= ~v; 329eaca6183SJohn Baldwin.Ed 3302be6c09fSRuslan Ermilov.It Fn atomic_cmpset dst old new 3312be6c09fSRuslan Ermilov.Bd -literal -compact 332eaca6183SJohn Baldwinif (*dst == old) { 333eaca6183SJohn Baldwin *dst = new; 3348a1ee2d3SJung-uk Kim return (1); 335eaca6183SJohn Baldwin} else 3368a1ee2d3SJung-uk Kim return (0); 337eaca6183SJohn Baldwin.Ed 338eaca6183SJohn Baldwin.El 339eaca6183SJohn Baldwin.Pp 3403d673254SMark JohnstonSome architectures do not implement the 341eaca6183SJohn Baldwin.Fn atomic_cmpset 3423d673254SMark Johnstonfunctions for the types 3432be6c09fSRuslan Ermilov.Dq Li char , 3442be6c09fSRuslan Ermilov.Dq Li short , 3452be6c09fSRuslan Ermilov.Dq Li 8 , 3462be6c09fSRuslan Ermilovand 3472be6c09fSRuslan Ermilov.Dq Li 16 . 348eaca6183SJohn Baldwin.Bl -hang 349c0b995bbSMateusz Guzik.It Fn atomic_fcmpset dst *old new 350c0b995bbSMateusz Guzik.El 351c0b995bbSMateusz Guzik.Pp 352c0b995bbSMateusz GuzikOn architectures implementing 353c0b995bbSMateusz Guzik.Em Compare And Swap 354c0b995bbSMateusz Guzikoperation in hardware, the functionality can be described as 355c0b995bbSMateusz Guzik.Bd -literal -offset indent -compact 356c0b995bbSMateusz Guzikif (*dst == *old) { 357c0b995bbSMateusz Guzik *dst = new; 358c0b995bbSMateusz Guzik return (1); 359c0b995bbSMateusz Guzik} else { 360c0b995bbSMateusz Guzik *old = *dst; 361c0b995bbSMateusz Guzik return (0); 362c0b995bbSMateusz Guzik} 363c0b995bbSMateusz Guzik.Ed 364c0b995bbSMateusz GuzikOn architectures which provide 365c0b995bbSMateusz Guzik.Em Load Linked/Store Conditional 366c0b995bbSMateusz Guzikprimitive, the write to 367c0b995bbSMateusz Guzik.Dv *dst 368c0b995bbSMateusz Guzikmight also fail for several reasons, most important of which 369c0b995bbSMateusz Guzikis a parallel write to 370c0b995bbSMateusz Guzik.Dv *dst 371c0b995bbSMateusz Guzikcache line by other CPU. 372c0b995bbSMateusz GuzikIn this case 373c0b995bbSMateusz Guzik.Fn atomic_fcmpset 374c0b995bbSMateusz Guzikfunction also returns 375c0b995bbSMateusz Guzik.Dv false , 376c0b995bbSMateusz Guzikdespite 377c0b995bbSMateusz Guzik.Dl *old == *dst . 378c0b995bbSMateusz Guzik.Pp 3793d673254SMark JohnstonSome architectures do not implement the 380c0b995bbSMateusz Guzik.Fn atomic_fcmpset 3813d673254SMark Johnstonfunctions for the types 382c0b995bbSMateusz Guzik.Dq Li char , 383c0b995bbSMateusz Guzik.Dq Li short , 384c0b995bbSMateusz Guzik.Dq Li 8 , 385c0b995bbSMateusz Guzikand 386c0b995bbSMateusz Guzik.Dq Li 16 . 387c0b995bbSMateusz Guzik.Bl -hang 3884ea211a4SJohn Baldwin.It Fn atomic_fetchadd p v 3894ea211a4SJohn Baldwin.Bd -literal -compact 3904ea211a4SJohn Baldwintmp = *p; 3914ea211a4SJohn Baldwin*p += v; 3928a1ee2d3SJung-uk Kimreturn (tmp); 3934ea211a4SJohn Baldwin.Ed 3944ea211a4SJohn Baldwin.El 3954ea211a4SJohn Baldwin.Pp 3964ea211a4SJohn BaldwinThe 3974ea211a4SJohn Baldwin.Fn atomic_fetchadd 3984ea211a4SJohn Baldwinfunctions are only implemented for the types 3996eb4157fSPawel Jakub Dawidek.Dq Li int , 4006eb4157fSPawel Jakub Dawidek.Dq Li long 4014ea211a4SJohn Baldwinand 4024ea211a4SJohn Baldwin.Dq Li 32 4034ea211a4SJohn Baldwinand do not have any variants with memory barriers at this time. 4044ea211a4SJohn Baldwin.Bl -hang 4058a1ee2d3SJung-uk Kim.It Fn atomic_load p 4062be6c09fSRuslan Ermilov.Bd -literal -compact 4078a1ee2d3SJung-uk Kimreturn (*p); 408eaca6183SJohn Baldwin.Ed 4098a1ee2d3SJung-uk Kim.It Fn atomic_readandclear p 4102be6c09fSRuslan Ermilov.Bd -literal -compact 4118a1ee2d3SJung-uk Kimtmp = *p; 4128a1ee2d3SJung-uk Kim*p = 0; 4138a1ee2d3SJung-uk Kimreturn (tmp); 414eaca6183SJohn Baldwin.Ed 415eaca6183SJohn Baldwin.El 416eaca6183SJohn Baldwin.Pp 417eaca6183SJohn BaldwinThe 418eaca6183SJohn Baldwin.Fn atomic_readandclear 4192be6c09fSRuslan Ermilovfunctions are not implemented for the types 4202be6c09fSRuslan Ermilov.Dq Li char , 4212be6c09fSRuslan Ermilov.Dq Li short , 4222be6c09fSRuslan Ermilov.Dq Li ptr , 4232be6c09fSRuslan Ermilov.Dq Li 8 , 4242be6c09fSRuslan Ermilovand 4252be6c09fSRuslan Ermilov.Dq Li 16 4268a1ee2d3SJung-uk Kimand do not have any variants with memory barriers at this time. 427eaca6183SJohn Baldwin.Bl -hang 4282be6c09fSRuslan Ermilov.It Fn atomic_set p v 4292be6c09fSRuslan Ermilov.Bd -literal -compact 430eaca6183SJohn Baldwin*p |= v; 431eaca6183SJohn Baldwin.Ed 4322be6c09fSRuslan Ermilov.It Fn atomic_subtract p v 4332be6c09fSRuslan Ermilov.Bd -literal -compact 434eaca6183SJohn Baldwin*p -= v; 435eaca6183SJohn Baldwin.Ed 4362be6c09fSRuslan Ermilov.It Fn atomic_store p v 4372be6c09fSRuslan Ermilov.Bd -literal -compact 438eaca6183SJohn Baldwin*p = v; 439eaca6183SJohn Baldwin.Ed 4408a1ee2d3SJung-uk Kim.It Fn atomic_swap p v 4418a1ee2d3SJung-uk Kim.Bd -literal -compact 4428a1ee2d3SJung-uk Kimtmp = *p; 4438a1ee2d3SJung-uk Kim*p = v; 4448a1ee2d3SJung-uk Kimreturn (tmp); 4458a1ee2d3SJung-uk Kim.Ed 4468a1ee2d3SJung-uk Kim.El 4478a1ee2d3SJung-uk Kim.Pp 4488a1ee2d3SJung-uk KimThe 4498a1ee2d3SJung-uk Kim.Fn atomic_swap 4508a1ee2d3SJung-uk Kimfunctions are not implemented for the types 4518a1ee2d3SJung-uk Kim.Dq Li char , 4528a1ee2d3SJung-uk Kim.Dq Li short , 4538a1ee2d3SJung-uk Kim.Dq Li ptr , 4548a1ee2d3SJung-uk Kim.Dq Li 8 , 4558a1ee2d3SJung-uk Kimand 4568a1ee2d3SJung-uk Kim.Dq Li 16 4578a1ee2d3SJung-uk Kimand do not have any variants with memory barriers at this time. 4588a1ee2d3SJung-uk Kim.Bl -hang 459dfdc9a05SSepherosa Ziehau.It Fn atomic_testandclear p v 460dfdc9a05SSepherosa Ziehau.Bd -literal -compact 461dfdc9a05SSepherosa Ziehaubit = 1 << (v % (sizeof(*p) * NBBY)); 462dfdc9a05SSepherosa Ziehautmp = (*p & bit) != 0; 463dfdc9a05SSepherosa Ziehau*p &= ~bit; 464dfdc9a05SSepherosa Ziehaureturn (tmp); 465dfdc9a05SSepherosa Ziehau.Ed 466dfdc9a05SSepherosa Ziehau.El 467dfdc9a05SSepherosa Ziehau.Bl -hang 4688a1ee2d3SJung-uk Kim.It Fn atomic_testandset p v 4698a1ee2d3SJung-uk Kim.Bd -literal -compact 4708a1ee2d3SJung-uk Kimbit = 1 << (v % (sizeof(*p) * NBBY)); 4718a1ee2d3SJung-uk Kimtmp = (*p & bit) != 0; 4728a1ee2d3SJung-uk Kim*p |= bit; 4738a1ee2d3SJung-uk Kimreturn (tmp); 4748a1ee2d3SJung-uk Kim.Ed 4758a1ee2d3SJung-uk Kim.El 4768a1ee2d3SJung-uk Kim.Pp 4778a1ee2d3SJung-uk KimThe 4788a1ee2d3SJung-uk Kim.Fn atomic_testandset 479dfdc9a05SSepherosa Ziehauand 480dfdc9a05SSepherosa Ziehau.Fn atomic_testandclear 4818a1ee2d3SJung-uk Kimfunctions are only implemented for the types 4828a1ee2d3SJung-uk Kim.Dq Li int , 4833ca22e1eSJohn Baldwin.Dq Li long , 484a80b9ee1SJohn Baldwin.Dq ptr , 4853ca22e1eSJohn Baldwin.Dq Li 32 , 4868a1ee2d3SJung-uk Kimand 4873ca22e1eSJohn Baldwin.Dq Li 64 4883ca22e1eSJohn Baldwinand generally do not have any variants with memory barriers at this time 4893ca22e1eSJohn Baldwinexcept for 4903ca22e1eSJohn Baldwin.Fn atomic_testandset_acq_long . 4918a1ee2d3SJung-uk Kim.Pp 492eaca6183SJohn BaldwinThe type 4932be6c09fSRuslan Ermilov.Dq Li 64 4943a91d106SKonstantin Belousovis currently not implemented for some of the atomic operations on the 4954ea211a4SJohn Baldwin.Tn arm , 4964ea211a4SJohn Baldwin.Tn i386 , 4974ea211a4SJohn Baldwinand 4984ea211a4SJohn Baldwin.Tn powerpc 4994ea211a4SJohn Baldwinarchitectures. 500eaca6183SJohn Baldwin.Sh RETURN VALUES 5012be6c09fSRuslan ErmilovThe 502eaca6183SJohn Baldwin.Fn atomic_cmpset 5038a1ee2d3SJung-uk Kimfunction returns the result of the compare operation. 5042be6c09fSRuslan ErmilovThe 505c0b995bbSMateusz Guzik.Fn atomic_fcmpset 506c0b995bbSMateusz Guzikfunction returns 507c0b995bbSMateusz Guzik.Dv true 50868278ec6SBenjamin Kadukif the operation succeeded. 509c0b995bbSMateusz GuzikOtherwise it returns 510c0b995bbSMateusz Guzik.Dv false 511c0b995bbSMateusz Guzikand sets 512c0b995bbSMateusz Guzik.Va *old 513c0b995bbSMateusz Guzikto the found value. 514c0b995bbSMateusz GuzikThe 5154ea211a4SJohn Baldwin.Fn atomic_fetchadd , 5164ea211a4SJohn Baldwin.Fn atomic_load , 5178a1ee2d3SJung-uk Kim.Fn atomic_readandclear , 518eaca6183SJohn Baldwinand 5198a1ee2d3SJung-uk Kim.Fn atomic_swap 5208a1ee2d3SJung-uk Kimfunctions return the value at the specified address. 5218a1ee2d3SJung-uk KimThe 5228a1ee2d3SJung-uk Kim.Fn atomic_testandset 523dfdc9a05SSepherosa Ziehauand 524dfdc9a05SSepherosa Ziehau.Fn atomic_testandclear 5258a1ee2d3SJung-uk Kimfunction returns the result of the test operation. 526eaca6183SJohn Baldwin.Sh EXAMPLES 527eaca6183SJohn BaldwinThis example uses the 528eaca6183SJohn Baldwin.Fn atomic_cmpset_acq_ptr 529eaca6183SJohn Baldwinand 530eaca6183SJohn Baldwin.Fn atomic_set_ptr 531eaca6183SJohn Baldwinfunctions to obtain a sleep mutex and handle recursion. 532eaca6183SJohn BaldwinSince the 533eaca6183SJohn Baldwin.Va mtx_lock 534eaca6183SJohn Baldwinmember of a 5352be6c09fSRuslan Ermilov.Vt "struct mtx" 536eaca6183SJohn Baldwinis a pointer, the 5372be6c09fSRuslan Ermilov.Dq Li ptr 538eaca6183SJohn Baldwintype is used. 539eaca6183SJohn Baldwin.Bd -literal 5404ea211a4SJohn Baldwin/* Try to obtain mtx_lock once. */ 541eaca6183SJohn Baldwin#define _obtain_lock(mp, tid) \\ 5424ea211a4SJohn Baldwin atomic_cmpset_acq_ptr(&(mp)->mtx_lock, MTX_UNOWNED, (tid)) 543eaca6183SJohn Baldwin 544eaca6183SJohn Baldwin/* Get a sleep lock, deal with recursion inline. */ 5454ea211a4SJohn Baldwin#define _get_sleep_lock(mp, tid, opts, file, line) do { \\ 5464ea211a4SJohn Baldwin uintptr_t _tid = (uintptr_t)(tid); \\ 5474ea211a4SJohn Baldwin \\ 548eaca6183SJohn Baldwin if (!_obtain_lock(mp, tid)) { \\ 5494ea211a4SJohn Baldwin if (((mp)->mtx_lock & MTX_FLAGMASK) != _tid) \\ 5504ea211a4SJohn Baldwin _mtx_lock_sleep((mp), _tid, (opts), (file), (line));\\ 551eaca6183SJohn Baldwin else { \\ 552eaca6183SJohn Baldwin atomic_set_ptr(&(mp)->mtx_lock, MTX_RECURSE); \\ 553eaca6183SJohn Baldwin (mp)->mtx_recurse++; \\ 554eaca6183SJohn Baldwin } \\ 555eaca6183SJohn Baldwin } \\ 556eaca6183SJohn Baldwin} while (0) 557eaca6183SJohn Baldwin.Ed 558eaca6183SJohn Baldwin.Sh HISTORY 559eaca6183SJohn BaldwinThe 560eaca6183SJohn Baldwin.Fn atomic_add , 561eaca6183SJohn Baldwin.Fn atomic_clear , 562eaca6183SJohn Baldwin.Fn atomic_set , 563eaca6183SJohn Baldwinand 564eaca6183SJohn Baldwin.Fn atomic_subtract 56577863e4bSKonstantin Belousovoperations were introduced in 566eaca6183SJohn Baldwin.Fx 3.0 . 56777863e4bSKonstantin BelousovInitially, these operations were defined on the types 5682be6c09fSRuslan Ermilov.Dq Li char , 5692be6c09fSRuslan Ermilov.Dq Li short , 5702be6c09fSRuslan Ermilov.Dq Li int , 5712be6c09fSRuslan Ermilovand 5722be6c09fSRuslan Ermilov.Dq Li long . 57377863e4bSKonstantin Belousov.Pp 574eaca6183SJohn BaldwinThe 575eaca6183SJohn Baldwin.Fn atomic_cmpset , 57677863e4bSKonstantin Belousov.Fn atomic_load_acq , 577eaca6183SJohn Baldwin.Fn atomic_readandclear , 578eaca6183SJohn Baldwinand 57977863e4bSKonstantin Belousov.Fn atomic_store_rel 580eaca6183SJohn Baldwinoperations were added in 581eaca6183SJohn Baldwin.Fx 5.0 . 58277863e4bSKonstantin BelousovSimultaneously, the acquire and release variants were introduced, and 58377863e4bSKonstantin Belousovsupport was added for operation on the types 5842be6c09fSRuslan Ermilov.Dq Li 8 , 5852be6c09fSRuslan Ermilov.Dq Li 16 , 5862be6c09fSRuslan Ermilov.Dq Li 32 , 5872be6c09fSRuslan Ermilov.Dq Li 64 , 5882be6c09fSRuslan Ermilovand 58977863e4bSKonstantin Belousov.Dq Li ptr . 59077863e4bSKonstantin Belousov.Pp 5914ea211a4SJohn BaldwinThe 5924ea211a4SJohn Baldwin.Fn atomic_fetchadd 59377863e4bSKonstantin Belousovoperation was added in 5944ea211a4SJohn Baldwin.Fx 6.0 . 59577863e4bSKonstantin Belousov.Pp 5968a1ee2d3SJung-uk KimThe 5978a1ee2d3SJung-uk Kim.Fn atomic_swap 5988a1ee2d3SJung-uk Kimand 5998a1ee2d3SJung-uk Kim.Fn atomic_testandset 6008a1ee2d3SJung-uk Kimoperations were added in 6018a1ee2d3SJung-uk Kim.Fx 10.0 . 60277863e4bSKonstantin Belousov.Pp 60377863e4bSKonstantin BelousovThe 604dfdc9a05SSepherosa Ziehau.Fn atomic_testandclear 60577863e4bSKonstantin Belousovand 60677863e4bSKonstantin Belousov.Fn atomic_thread_fence 60777863e4bSKonstantin Belousovoperations were added in 608dfdc9a05SSepherosa Ziehau.Fx 11.0 . 60977863e4bSKonstantin Belousov.Pp 61077863e4bSKonstantin BelousovThe relaxed variants of 61177863e4bSKonstantin Belousov.Fn atomic_load 61277863e4bSKonstantin Belousovand 61377863e4bSKonstantin Belousov.Fn atomic_store 61477863e4bSKonstantin Belousovwere added in 61577863e4bSKonstantin Belousov.Fx 12.0 . 616f5e930b3SKonstantin Belousov.Pp 617f5e930b3SKonstantin BelousovThe 618f5e930b3SKonstantin Belousov.Fn atomic_interrupt_fence 619f5e930b3SKonstantin Belousovoperation was added in 620f5e930b3SKonstantin Belousov.Fx 13.0 . 621