2011-04-25 17:22:25 +02:00
|
|
|
#ifndef MY_ATOMIC_INCLUDED
|
|
|
|
#define MY_ATOMIC_INCLUDED
|
2009-10-09 14:21:29 +02:00
|
|
|
|
2011-06-30 17:46:53 +02:00
|
|
|
/* Copyright (c) 2006, 2010, Oracle and/or its affiliates. All rights reserved.
|
2006-05-31 18:44:09 +02:00
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
2006-12-27 02:23:51 +01:00
|
|
|
the Free Software Foundation; version 2 of the License.
|
2006-05-31 18:44:09 +02:00
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
along with this program; if not, write to the Free Software
|
2011-06-30 17:46:53 +02:00
|
|
|
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
|
2006-05-31 18:44:09 +02:00
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
/*
|
|
|
|
This header defines five atomic operations:
|
|
|
|
|
|
|
|
my_atomic_add#(&var, what)
|
2014-10-14 14:58:35 +04:00
|
|
|
my_atomic_add#_explicit(&var, what, memory_order)
|
Bug#22320: my_atomic-t unit test fails
Bug#52261: 64 bit atomic operations do not work on Solaris i386
gcc in debug compilation
One of the various problems was that the source operand to
CMPXCHG8b was marked as a input/output operand, causing GCC
to use the EBX register as the destination register for the
CMPXCHG8b instruction. This could lead to crashes as the EBX
register is also implicitly used by the instruction, causing
the value to be potentially garbaged and a protection fault
once the value is used to access a position in memory.
Another problem was the lack of proper clobbers for the atomic
operations and, also, a discrepancy between the implementations
for the Compare and Set operation. The specific problems are
described and fixed by Kristian Nielsen patches:
Patch: 1
Fix bugs in my_atomic_cas*(val,cmp,new) that *cmp is accessed
after CAS succeds.
In the gcc builtin implementation, problem was that *cmp was
read again after atomic CAS to check if old *val == *cmp;
this fails if CAS is successful and another thread modifies
*cmp in-between.
In the x86-gcc implementation, problem was that *cmp was set
also in the case of successful CAS; this means there is a
window where it can clobber a value written by another thread
after successful CAS.
Patch 2:
Add a GCC asm "memory" clobber to primitives that imply a
memory barrier.
This signifies to GCC that any potentially aliased memory
must be flushed before the operation, and re-read after the
operation, so that read or modification in other threads of
such memory values will work as intended.
In effect, it makes these primitives work as memory barriers
for the compiler as well as the CPU. This is better and more
correct than adding "volatile" to variables.
include/atomic/gcc_builtins.h:
Do not read from *cmp after the operation as it might be
already gone if the operation was successful.
include/atomic/nolock.h:
Prefer system provided atomics over the broken x86 asm.
include/atomic/x86-gcc.h:
Do not mark source operands as input/output operands.
Add proper memory clobbers.
include/my_atomic.h:
Add notes about my_atomic_add and my_atomic_cas behaviors.
unittest/mysys/my_atomic-t.c:
Remove work around, if it fails, there is either a problem
with the atomic operations code or the specific compiler
version should be black-listed.
2010-07-23 09:37:10 -03:00
|
|
|
'Fetch and Add'
|
2009-10-09 14:21:29 +02:00
|
|
|
add 'what' to *var, and return the old value of *var
|
2014-10-14 14:58:35 +04:00
|
|
|
All memory orders are valid.
|
2009-10-09 14:21:29 +02:00
|
|
|
|
|
|
|
my_atomic_fas#(&var, what)
|
2014-10-14 14:58:35 +04:00
|
|
|
my_atomic_fas#_explicit(&var, what, memory_order)
|
2009-10-09 14:21:29 +02:00
|
|
|
'Fetch And Store'
|
|
|
|
store 'what' in *var, and return the old value of *var
|
2014-10-14 14:58:35 +04:00
|
|
|
All memory orders are valid.
|
2009-10-09 14:21:29 +02:00
|
|
|
|
|
|
|
my_atomic_cas#(&var, &old, new)
|
2014-10-14 14:58:35 +04:00
|
|
|
my_atomic_cas#_weak_explicit(&var, &old, new, succ, fail)
|
|
|
|
my_atomic_cas#_strong_explicit(&var, &old, new, succ, fail)
|
2006-10-23 15:13:51 +02:00
|
|
|
'Compare And Swap'
|
2009-10-09 14:21:29 +02:00
|
|
|
if *var is equal to *old, then store 'new' in *var, and return TRUE
|
|
|
|
otherwise store *var in *old, and return FALSE
|
2014-10-14 14:58:35 +04:00
|
|
|
succ - the memory synchronization ordering for the read-modify-write
|
|
|
|
operation if the comparison succeeds. All memory orders are valid.
|
|
|
|
fail - the memory synchronization ordering for the load operation if the
|
|
|
|
comparison fails. Cannot be MY_MEMORY_ORDER_RELEASE or
|
|
|
|
MY_MEMORY_ORDER_ACQ_REL and cannot specify stronger ordering than succ.
|
|
|
|
|
|
|
|
The weak form is allowed to fail spuriously, that is, act as if *var != *old
|
|
|
|
even if they are equal. When a compare-and-exchange is in a loop, the weak
|
|
|
|
version will yield better performance on some platforms. When a weak
|
|
|
|
compare-and-exchange would require a loop and a strong one would not, the
|
|
|
|
strong one is preferable.
|
2009-10-09 14:21:29 +02:00
|
|
|
|
|
|
|
my_atomic_load#(&var)
|
2014-10-14 14:58:35 +04:00
|
|
|
my_atomic_load#_explicit(&var, memory_order)
|
2009-10-09 14:21:29 +02:00
|
|
|
return *var
|
2014-10-14 14:58:35 +04:00
|
|
|
Order must be one of MY_MEMORY_ORDER_RELAXED, MY_MEMORY_ORDER_CONSUME,
|
|
|
|
MY_MEMORY_ORDER_ACQUIRE, MY_MEMORY_ORDER_SEQ_CST.
|
2009-10-09 14:21:29 +02:00
|
|
|
|
|
|
|
my_atomic_store#(&var, what)
|
2014-10-14 14:58:35 +04:00
|
|
|
my_atomic_store#_explicit(&var, what, memory_order)
|
2009-10-09 14:21:29 +02:00
|
|
|
store 'what' in *var
|
2014-10-14 14:58:35 +04:00
|
|
|
Order must be one of MY_MEMORY_ORDER_RELAXED, MY_MEMORY_ORDER_RELEASE,
|
|
|
|
MY_MEMORY_ORDER_SEQ_CST.
|
2009-10-09 14:21:29 +02:00
|
|
|
|
2009-10-12 11:00:39 +02:00
|
|
|
'#' is substituted by a size suffix - 8, 16, 32, 64, or ptr
|
2009-10-09 14:21:29 +02:00
|
|
|
(e.g. my_atomic_add8, my_atomic_fas32, my_atomic_casptr).
|
|
|
|
|
2014-10-14 14:58:35 +04:00
|
|
|
The first version orders memory accesses according to MY_MEMORY_ORDER_SEQ_CST,
|
|
|
|
the second version (with _explicit suffix) orders memory accesses according to
|
|
|
|
given memory order.
|
|
|
|
|
|
|
|
memory_order specifies how non-atomic memory accesses are to be ordered around
|
|
|
|
an atomic operation:
|
|
|
|
|
|
|
|
MY_MEMORY_ORDER_RELAXED - there are no constraints on reordering of memory
|
|
|
|
accesses around the atomic variable.
|
|
|
|
MY_MEMORY_ORDER_CONSUME - no reads in the current thread dependent on the
|
|
|
|
value currently loaded can be reordered before this
|
|
|
|
load. This ensures that writes to dependent
|
|
|
|
variables in other threads that release the same
|
|
|
|
atomic variable are visible in the current thread.
|
|
|
|
On most platforms, this affects compiler
|
|
|
|
optimization only.
|
|
|
|
MY_MEMORY_ORDER_ACQUIRE - no reads in the current thread can be reordered
|
|
|
|
before this load. This ensures that all writes in
|
|
|
|
other threads that release the same atomic variable
|
|
|
|
are visible in the current thread.
|
|
|
|
MY_MEMORY_ORDER_RELEASE - no writes in the current thread can be reordered
|
|
|
|
after this store. This ensures that all writes in
|
|
|
|
the current thread are visible in other threads that
|
|
|
|
acquire the same atomic variable.
|
|
|
|
MY_MEMORY_ORDER_ACQ_REL - no reads in the current thread can be reordered
|
|
|
|
before this load as well as no writes in the current
|
|
|
|
thread can be reordered after this store. The
|
|
|
|
operation is read-modify-write operation. It is
|
|
|
|
ensured that all writes in another threads that
|
|
|
|
release the same atomic variable are visible before
|
|
|
|
the modification and the modification is visible in
|
|
|
|
other threads that acquire the same atomic variable.
|
|
|
|
MY_MEMORY_ORDER_SEQ_CST - The operation has the same semantics as
|
|
|
|
acquire-release operation, and additionally has
|
|
|
|
sequentially-consistent operation ordering.
|
2006-05-31 18:44:09 +02:00
|
|
|
|
2016-11-02 16:43:23 +04:00
|
|
|
We choose implementation as follows: on Windows using Visual C++ the native
|
|
|
|
implementation should be preferrable. When using gcc we prefer the Solaris
|
|
|
|
implementation before the gcc because of stability preference, we choose gcc
|
2016-11-02 15:16:36 +04:00
|
|
|
builtins if available.
|
2016-10-28 12:29:37 +04:00
|
|
|
*/
|
2016-11-02 16:43:23 +04:00
|
|
|
|
2016-10-28 12:29:37 +04:00
|
|
|
#if defined(_MSC_VER)
|
|
|
|
#include "atomic/generic-msvc.h"
|
|
|
|
#elif defined(HAVE_SOLARIS_ATOMIC)
|
|
|
|
#include "atomic/solaris.h"
|
2016-11-17 14:50:09 +04:00
|
|
|
#elif defined(HAVE_GCC_ATOMIC_BUILTINS) || defined(HAVE_GCC_C11_ATOMICS)
|
2016-10-28 12:29:37 +04:00
|
|
|
#include "atomic/gcc_builtins.h"
|
|
|
|
#endif
|
|
|
|
|
2006-05-31 18:44:09 +02:00
|
|
|
|
2016-11-03 13:21:18 +04:00
|
|
|
#ifndef HAVE_GCC_C11_ATOMICS
|
2009-12-23 09:27:41 +01:00
|
|
|
#ifndef make_atomic_cas_body
|
2009-10-09 14:21:29 +02:00
|
|
|
/* nolock.h was not able to generate even a CAS function, fall back */
|
2015-01-12 17:03:45 +01:00
|
|
|
#error atomic ops for this platform are not implemented
|
2009-12-19 12:48:39 +01:00
|
|
|
#endif
|
2009-12-19 17:44:45 +01:00
|
|
|
|
2016-11-02 16:43:23 +04:00
|
|
|
#define intptr void *
|
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
/* define missing functions by using the already generated ones */
|
2006-06-29 15:39:53 +02:00
|
|
|
#ifndef make_atomic_add_body
|
2009-10-09 14:21:29 +02:00
|
|
|
#define make_atomic_add_body(S) \
|
2006-06-29 15:39:53 +02:00
|
|
|
int ## S tmp=*a; \
|
2010-02-19 17:20:29 +03:00
|
|
|
while (!my_atomic_cas ## S(a, &tmp, tmp+v)) ; \
|
2006-06-29 15:39:53 +02:00
|
|
|
v=tmp;
|
|
|
|
#endif
|
2009-10-09 14:21:29 +02:00
|
|
|
#ifndef make_atomic_fas_body
|
|
|
|
#define make_atomic_fas_body(S) \
|
|
|
|
int ## S tmp=*a; \
|
2010-02-19 17:20:29 +03:00
|
|
|
while (!my_atomic_cas ## S(a, &tmp, v)) ; \
|
2009-10-09 14:21:29 +02:00
|
|
|
v=tmp;
|
|
|
|
#endif
|
|
|
|
#ifndef make_atomic_load_body
|
|
|
|
#define make_atomic_load_body(S) \
|
|
|
|
ret= 0; /* avoid compiler warning */ \
|
|
|
|
(void)(my_atomic_cas ## S(a, &ret, ret));
|
|
|
|
#endif
|
|
|
|
#ifndef make_atomic_store_body
|
|
|
|
#define make_atomic_store_body(S) \
|
|
|
|
(void)(my_atomic_fas ## S (a, v));
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#define make_atomic_cas(S) \
|
2016-11-02 16:40:43 +04:00
|
|
|
static inline int my_atomic_cas ## S(int ## S volatile *a, \
|
|
|
|
int ## S *cmp, int ## S set) \
|
2009-10-09 14:21:29 +02:00
|
|
|
{ \
|
|
|
|
int8 ret; \
|
|
|
|
make_atomic_cas_body(S); \
|
|
|
|
return ret; \
|
2006-06-17 16:20:39 +02:00
|
|
|
}
|
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
#define make_atomic_add(S) \
|
2010-07-23 17:18:36 -03:00
|
|
|
static inline int ## S my_atomic_add ## S( \
|
2016-11-02 16:40:43 +04:00
|
|
|
int ## S volatile *a, int ## S v) \
|
2009-10-09 14:21:29 +02:00
|
|
|
{ \
|
|
|
|
make_atomic_add_body(S); \
|
|
|
|
return v; \
|
2006-06-17 16:20:39 +02:00
|
|
|
}
|
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
#define make_atomic_fas(S) \
|
2010-07-23 17:18:36 -03:00
|
|
|
static inline int ## S my_atomic_fas ## S( \
|
2016-11-02 16:40:43 +04:00
|
|
|
int ## S volatile *a, int ## S v) \
|
2009-10-09 14:21:29 +02:00
|
|
|
{ \
|
|
|
|
make_atomic_fas_body(S); \
|
|
|
|
return v; \
|
2006-06-17 16:20:39 +02:00
|
|
|
}
|
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
#define make_atomic_load(S) \
|
2016-11-02 16:40:43 +04:00
|
|
|
static inline int ## S my_atomic_load ## S(int ## S volatile *a)\
|
2009-10-09 14:21:29 +02:00
|
|
|
{ \
|
|
|
|
int ## S ret; \
|
|
|
|
make_atomic_load_body(S); \
|
|
|
|
return ret; \
|
2006-06-17 16:20:39 +02:00
|
|
|
}
|
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
#define make_atomic_store(S) \
|
2010-07-23 17:18:36 -03:00
|
|
|
static inline void my_atomic_store ## S( \
|
2016-11-02 16:40:43 +04:00
|
|
|
int ## S volatile *a, int ## S v) \
|
2009-10-09 14:21:29 +02:00
|
|
|
{ \
|
|
|
|
make_atomic_store_body(S); \
|
2006-06-17 16:20:39 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
make_atomic_cas(32)
|
2009-10-12 11:00:39 +02:00
|
|
|
make_atomic_cas(64)
|
2006-06-17 16:20:39 +02:00
|
|
|
make_atomic_cas(ptr)
|
|
|
|
|
2006-06-29 15:39:53 +02:00
|
|
|
make_atomic_add(32)
|
2009-10-12 11:00:39 +02:00
|
|
|
make_atomic_add(64)
|
2006-06-29 15:39:53 +02:00
|
|
|
|
2006-06-17 16:20:39 +02:00
|
|
|
make_atomic_load(32)
|
2009-10-12 11:00:39 +02:00
|
|
|
make_atomic_load(64)
|
2006-06-17 16:20:39 +02:00
|
|
|
make_atomic_load(ptr)
|
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
make_atomic_fas(32)
|
2009-10-12 11:00:39 +02:00
|
|
|
make_atomic_fas(64)
|
2009-10-09 14:21:29 +02:00
|
|
|
make_atomic_fas(ptr)
|
|
|
|
|
2006-06-17 16:20:39 +02:00
|
|
|
make_atomic_store(32)
|
2009-10-12 11:00:39 +02:00
|
|
|
make_atomic_store(64)
|
2006-06-17 16:20:39 +02:00
|
|
|
make_atomic_store(ptr)
|
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
#ifdef _atomic_h_cleanup_
|
|
|
|
#include _atomic_h_cleanup_
|
|
|
|
#undef _atomic_h_cleanup_
|
|
|
|
#endif
|
2006-06-17 16:20:39 +02:00
|
|
|
|
|
|
|
#undef make_atomic_add
|
|
|
|
#undef make_atomic_cas
|
|
|
|
#undef make_atomic_load
|
|
|
|
#undef make_atomic_store
|
2009-10-09 14:21:29 +02:00
|
|
|
#undef make_atomic_fas
|
2006-06-29 15:39:53 +02:00
|
|
|
#undef make_atomic_add_body
|
|
|
|
#undef make_atomic_cas_body
|
|
|
|
#undef make_atomic_load_body
|
|
|
|
#undef make_atomic_store_body
|
2009-10-09 14:21:29 +02:00
|
|
|
#undef make_atomic_fas_body
|
2009-12-19 18:24:52 +01:00
|
|
|
#undef intptr
|
2016-11-03 13:21:18 +04:00
|
|
|
#endif
|
2006-06-17 16:20:39 +02:00
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
/*
|
|
|
|
the macro below defines (as an expression) the code that
|
|
|
|
will be run in spin-loops. Intel manuals recummend to have PAUSE there.
|
|
|
|
It is expected to be defined in include/atomic/ *.h files
|
|
|
|
*/
|
|
|
|
#ifndef LF_BACKOFF
|
|
|
|
#define LF_BACKOFF (1)
|
2006-06-17 16:20:39 +02:00
|
|
|
#endif
|
|
|
|
|
2016-11-02 16:43:23 +04:00
|
|
|
#if SIZEOF_LONG == 4
|
|
|
|
#define my_atomic_addlong(A,B) my_atomic_add32((int32*) (A), (B))
|
|
|
|
#define my_atomic_loadlong(A) my_atomic_load32((int32*) (A))
|
2017-10-09 22:55:05 +03:00
|
|
|
#define my_atomic_loadlong_explicit(A,O) my_atomic_load32_explicit((int32*) (A), (O))
|
2016-11-02 16:43:23 +04:00
|
|
|
#define my_atomic_storelong(A,B) my_atomic_store32((int32*) (A), (B))
|
|
|
|
#define my_atomic_faslong(A,B) my_atomic_fas32((int32*) (A), (B))
|
|
|
|
#define my_atomic_caslong(A,B,C) my_atomic_cas32((int32*) (A), (int32*) (B), (C))
|
2014-10-14 14:58:35 +04:00
|
|
|
#else
|
2016-11-02 16:43:23 +04:00
|
|
|
#define my_atomic_addlong(A,B) my_atomic_add64((int64*) (A), (B))
|
|
|
|
#define my_atomic_loadlong(A) my_atomic_load64((int64*) (A))
|
2017-10-09 22:55:05 +03:00
|
|
|
#define my_atomic_loadlong_explicit(A,O) my_atomic_load64_explicit((int64*) (A), (O))
|
2016-11-02 16:43:23 +04:00
|
|
|
#define my_atomic_storelong(A,B) my_atomic_store64((int64*) (A), (B))
|
|
|
|
#define my_atomic_faslong(A,B) my_atomic_fas64((int64*) (A), (B))
|
|
|
|
#define my_atomic_caslong(A,B,C) my_atomic_cas64((int64*) (A), (int64*) (B), (C))
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifndef MY_MEMORY_ORDER_SEQ_CST
|
2014-10-14 14:58:35 +04:00
|
|
|
#define MY_MEMORY_ORDER_RELAXED
|
|
|
|
#define MY_MEMORY_ORDER_CONSUME
|
|
|
|
#define MY_MEMORY_ORDER_ACQUIRE
|
|
|
|
#define MY_MEMORY_ORDER_RELEASE
|
|
|
|
#define MY_MEMORY_ORDER_ACQ_REL
|
|
|
|
#define MY_MEMORY_ORDER_SEQ_CST
|
|
|
|
|
|
|
|
#define my_atomic_store32_explicit(P, D, O) my_atomic_store32((P), (D))
|
|
|
|
#define my_atomic_store64_explicit(P, D, O) my_atomic_store64((P), (D))
|
|
|
|
#define my_atomic_storeptr_explicit(P, D, O) my_atomic_storeptr((P), (D))
|
|
|
|
|
|
|
|
#define my_atomic_load32_explicit(P, O) my_atomic_load32((P))
|
|
|
|
#define my_atomic_load64_explicit(P, O) my_atomic_load64((P))
|
|
|
|
#define my_atomic_loadptr_explicit(P, O) my_atomic_loadptr((P))
|
|
|
|
|
|
|
|
#define my_atomic_fas32_explicit(P, D, O) my_atomic_fas32((P), (D))
|
|
|
|
#define my_atomic_fas64_explicit(P, D, O) my_atomic_fas64((P), (D))
|
|
|
|
#define my_atomic_fasptr_explicit(P, D, O) my_atomic_fasptr((P), (D))
|
|
|
|
|
|
|
|
#define my_atomic_add32_explicit(P, A, O) my_atomic_add32((P), (A))
|
|
|
|
#define my_atomic_add64_explicit(P, A, O) my_atomic_add64((P), (A))
|
|
|
|
#define my_atomic_addptr_explicit(P, A, O) my_atomic_addptr((P), (A))
|
|
|
|
|
|
|
|
#define my_atomic_cas32_weak_explicit(P, E, D, S, F) \
|
|
|
|
my_atomic_cas32((P), (E), (D))
|
|
|
|
#define my_atomic_cas64_weak_explicit(P, E, D, S, F) \
|
|
|
|
my_atomic_cas64((P), (E), (D))
|
|
|
|
#define my_atomic_casptr_weak_explicit(P, E, D, S, F) \
|
|
|
|
my_atomic_casptr((P), (E), (D))
|
|
|
|
|
|
|
|
#define my_atomic_cas32_strong_explicit(P, E, D, S, F) \
|
|
|
|
my_atomic_cas32((P), (E), (D))
|
|
|
|
#define my_atomic_cas64_strong_explicit(P, E, D, S, F) \
|
|
|
|
my_atomic_cas64((P), (E), (D))
|
|
|
|
#define my_atomic_casptr_strong_explicit(P, E, D, S, F) \
|
|
|
|
my_atomic_casptr((P), (E), (D))
|
|
|
|
#endif
|
|
|
|
|
2009-10-09 14:21:29 +02:00
|
|
|
#endif /* MY_ATOMIC_INCLUDED */
|