1 /* 2 Simple DirectMedia Layer 3 Copyright (C) 1997-2020 Sam Lantinga <slouken@libsdl.org> 4 5 This software is provided 'as-is', without any express or implied 6 warranty. In no event will the authors be held liable for any damages 7 arising from the use of this software. 8 9 Permission is granted to anyone to use this software for any purpose, 10 including commercial applications, and to alter it and redistribute it 11 freely, subject to the following restrictions: 12 13 1. The origin of this software must not be misrepresented; you must not 14 claim that you wrote the original software. If you use this software 15 in a product, an acknowledgment in the product documentation would be 16 appreciated but is not required. 17 2. Altered source versions must be plainly marked as such, and must not be 18 misrepresented as being the original software. 19 3. This notice may not be removed or altered from any source distribution. 20 */ 21 22 /** 23 * \file SDL_atomic.h 24 * 25 * Atomic operations. 26 * 27 * IMPORTANT: 28 * If you are not an expert in concurrent lockless programming, you should 29 * only be using the atomic lock and reference counting functions in this 30 * file. In all other cases you should be protecting your data structures 31 * with full mutexes. 32 * 33 * The list of "safe" functions to use are: 34 * SDL_AtomicLock() 35 * SDL_AtomicUnlock() 36 * SDL_AtomicIncRef() 37 * SDL_AtomicDecRef() 38 * 39 * Seriously, here be dragons! 40 * ^^^^^^^^^^^^^^^^^^^^^^^^^^^ 41 * 42 * You can find out a little more about lockless programming and the 43 * subtle issues that can arise here: 44 * http://msdn.microsoft.com/en-us/library/ee418650%28v=vs.85%29.aspx 45 * 46 * There's also lots of good information here: 47 * http://www.1024cores.net/home/lock-free-algorithms 48 * http://preshing.com/ 49 * 50 * These operations may or may not actually be implemented using 51 * processor specific atomic operations. When possible they are 52 * implemented as true processor specific atomic operations. When that 53 * is not possible the are implemented using locks that *do* use the 54 * available atomic operations. 55 * 56 * All of the atomic operations that modify memory are full memory barriers. 57 */ 58 59 #ifndef SDL_atomic_h_ 60 #define SDL_atomic_h_ 61 62 #include "SDL_stdinc.h" 63 #include "SDL_platform.h" 64 65 #include "begin_code.h" 66 67 /* Set up for C function definitions, even when using C++ */ 68 #ifdef __cplusplus 69 extern "C" { 70 #endif 71 72 /** 73 * \name SDL AtomicLock 74 * 75 * The atomic locks are efficient spinlocks using CPU instructions, 76 * but are vulnerable to starvation and can spin forever if a thread 77 * holding a lock has been terminated. For this reason you should 78 * minimize the code executed inside an atomic lock and never do 79 * expensive things like API or system calls while holding them. 80 * 81 * The atomic locks are not safe to lock recursively. 82 * 83 * Porting Note: 84 * The spin lock functions and type are required and can not be 85 * emulated because they are used in the atomic emulation code. 86 */ 87 /* @{ */ 88 89 typedef int SDL_SpinLock; 90 91 /** 92 * \brief Try to lock a spin lock by setting it to a non-zero value. 93 * 94 * \param lock Points to the lock. 95 * 96 * \return SDL_TRUE if the lock succeeded, SDL_FALSE if the lock is already held. 97 */ 98 extern DECLSPEC SDL_bool SDLCALL SDL_AtomicTryLock(SDL_SpinLock *lock); 99 100 /** 101 * \brief Lock a spin lock by setting it to a non-zero value. 102 * 103 * \param lock Points to the lock. 104 */ 105 extern DECLSPEC void SDLCALL SDL_AtomicLock(SDL_SpinLock *lock); 106 107 /** 108 * \brief Unlock a spin lock by setting it to 0. Always returns immediately 109 * 110 * \param lock Points to the lock. 111 */ 112 extern DECLSPEC void SDLCALL SDL_AtomicUnlock(SDL_SpinLock *lock); 113 114 /* @} *//* SDL AtomicLock */ 115 116 117 /** 118 * The compiler barrier prevents the compiler from reordering 119 * reads and writes to globally visible variables across the call. 120 */ 121 #if defined(_MSC_VER) && (_MSC_VER > 1200) && !defined(__clang__) 122 void _ReadWriteBarrier(void); 123 #pragma intrinsic(_ReadWriteBarrier) 124 #define SDL_CompilerBarrier() _ReadWriteBarrier() 125 #elif (defined(__GNUC__) && !defined(__EMSCRIPTEN__)) || (defined(__SUNPRO_C) && (__SUNPRO_C >= 0x5120)) 126 /* This is correct for all CPUs when using GCC or Solaris Studio 12.1+. */ 127 #define SDL_CompilerBarrier() __asm__ __volatile__ ("" : : : "memory") 128 #elif defined(__WATCOMC__) 129 extern _inline void SDL_CompilerBarrier (void); 130 #pragma aux SDL_CompilerBarrier = "" parm [] modify exact []; 131 #else 132 #define SDL_CompilerBarrier() \ 133 { SDL_SpinLock _tmp = 0; SDL_AtomicLock(&_tmp); SDL_AtomicUnlock(&_tmp); } 134 #endif 135 136 /** 137 * Memory barriers are designed to prevent reads and writes from being 138 * reordered by the compiler and being seen out of order on multi-core CPUs. 139 * 140 * A typical pattern would be for thread A to write some data and a flag, 141 * and for thread B to read the flag and get the data. In this case you 142 * would insert a release barrier between writing the data and the flag, 143 * guaranteeing that the data write completes no later than the flag is 144 * written, and you would insert an acquire barrier between reading the 145 * flag and reading the data, to ensure that all the reads associated 146 * with the flag have completed. 147 * 148 * In this pattern you should always see a release barrier paired with 149 * an acquire barrier and you should gate the data reads/writes with a 150 * single flag variable. 151 * 152 * For more information on these semantics, take a look at the blog post: 153 * http://preshing.com/20120913/acquire-and-release-semantics 154 */ 155 extern DECLSPEC void SDLCALL SDL_MemoryBarrierReleaseFunction(void); 156 extern DECLSPEC void SDLCALL SDL_MemoryBarrierAcquireFunction(void); 157 158 #if defined(__GNUC__) && (defined(__powerpc__) || defined(__ppc__)) 159 #define SDL_MemoryBarrierRelease() __asm__ __volatile__ ("lwsync" : : : "memory") 160 #define SDL_MemoryBarrierAcquire() __asm__ __volatile__ ("lwsync" : : : "memory") 161 #elif defined(__GNUC__) && defined(__aarch64__) 162 #define SDL_MemoryBarrierRelease() __asm__ __volatile__ ("dmb ish" : : : "memory") 163 #define SDL_MemoryBarrierAcquire() __asm__ __volatile__ ("dmb ish" : : : "memory") 164 #elif defined(__GNUC__) && defined(__arm__) 165 #if 0 /* defined(__LINUX__) || defined(__ANDROID__) */ 166 /* Information from: 167 https://chromium.googlesource.com/chromium/chromium/+/trunk/base/atomicops_internals_arm_gcc.h#19 168 169 The Linux kernel provides a helper function which provides the right code for a memory barrier, 170 hard-coded at address 0xffff0fa0 171 */ 172 typedef void (*SDL_KernelMemoryBarrierFunc)(); 173 #define SDL_MemoryBarrierRelease() ((SDL_KernelMemoryBarrierFunc)0xffff0fa0)() 174 #define SDL_MemoryBarrierAcquire() ((SDL_KernelMemoryBarrierFunc)0xffff0fa0)() 175 #elif 0 /* defined(__QNXNTO__) */ 176 #include <sys/cpuinline.h> 177 178 #define SDL_MemoryBarrierRelease() __cpu_membarrier() 179 #define SDL_MemoryBarrierAcquire() __cpu_membarrier() 180 #else 181 #if defined(__ARM_ARCH_7__) || defined(__ARM_ARCH_7A__) || defined(__ARM_ARCH_7EM__) || defined(__ARM_ARCH_7R__) || defined(__ARM_ARCH_7M__) || defined(__ARM_ARCH_7S__) || defined(__ARM_ARCH_8A__) 182 #define SDL_MemoryBarrierRelease() __asm__ __volatile__ ("dmb ish" : : : "memory") 183 #define SDL_MemoryBarrierAcquire() __asm__ __volatile__ ("dmb ish" : : : "memory") 184 #elif defined(__ARM_ARCH_6__) || defined(__ARM_ARCH_6J__) || defined(__ARM_ARCH_6K__) || defined(__ARM_ARCH_6T2__) || defined(__ARM_ARCH_6Z__) || defined(__ARM_ARCH_6ZK__) || defined(__ARM_ARCH_5TE__) 185 #ifdef __thumb__ 186 /* The mcr instruction isn't available in thumb mode, use real functions */ 187 #define SDL_MEMORY_BARRIER_USES_FUNCTION 188 #define SDL_MemoryBarrierRelease() SDL_MemoryBarrierReleaseFunction() 189 #define SDL_MemoryBarrierAcquire() SDL_MemoryBarrierAcquireFunction() 190 #else 191 #define SDL_MemoryBarrierRelease() __asm__ __volatile__ ("mcr p15, 0, %0, c7, c10, 5" : : "r"(0) : "memory") 192 #define SDL_MemoryBarrierAcquire() __asm__ __volatile__ ("mcr p15, 0, %0, c7, c10, 5" : : "r"(0) : "memory") 193 #endif /* __thumb__ */ 194 #else 195 #define SDL_MemoryBarrierRelease() __asm__ __volatile__ ("" : : : "memory") 196 #define SDL_MemoryBarrierAcquire() __asm__ __volatile__ ("" : : : "memory") 197 #endif /* __LINUX__ || __ANDROID__ */ 198 #endif /* __GNUC__ && __arm__ */ 199 #else 200 #if (defined(__SUNPRO_C) && (__SUNPRO_C >= 0x5120)) 201 /* This is correct for all CPUs on Solaris when using Solaris Studio 12.1+. */ 202 #include <mbarrier.h> 203 #define SDL_MemoryBarrierRelease() __machine_rel_barrier() 204 #define SDL_MemoryBarrierAcquire() __machine_acq_barrier() 205 #else 206 /* This is correct for the x86 and x64 CPUs, and we'll expand this over time. */ 207 #define SDL_MemoryBarrierRelease() SDL_CompilerBarrier() 208 #define SDL_MemoryBarrierAcquire() SDL_CompilerBarrier() 209 #endif 210 #endif 211 212 /** 213 * \brief A type representing an atomic integer value. It is a struct 214 * so people don't accidentally use numeric operations on it. 215 */ 216 typedef struct { int value; } SDL_atomic_t; 217 218 /** 219 * \brief Set an atomic variable to a new value if it is currently an old value. 220 * 221 * \return SDL_TRUE if the atomic variable was set, SDL_FALSE otherwise. 222 * 223 * \note If you don't know what this function is for, you shouldn't use it! 224 */ 225 extern DECLSPEC SDL_bool SDLCALL SDL_AtomicCAS(SDL_atomic_t *a, int oldval, int newval); 226 227 /** 228 * \brief Set an atomic variable to a value. 229 * 230 * \return The previous value of the atomic variable. 231 */ 232 extern DECLSPEC int SDLCALL SDL_AtomicSet(SDL_atomic_t *a, int v); 233 234 /** 235 * \brief Get the value of an atomic variable 236 */ 237 extern DECLSPEC int SDLCALL SDL_AtomicGet(SDL_atomic_t *a); 238 239 /** 240 * \brief Add to an atomic variable. 241 * 242 * \return The previous value of the atomic variable. 243 * 244 * \note This same style can be used for any number operation 245 */ 246 extern DECLSPEC int SDLCALL SDL_AtomicAdd(SDL_atomic_t *a, int v); 247 248 /** 249 * \brief Increment an atomic variable used as a reference count. 250 */ 251 #ifndef SDL_AtomicIncRef 252 #define SDL_AtomicIncRef(a) SDL_AtomicAdd(a, 1) 253 #endif 254 255 /** 256 * \brief Decrement an atomic variable used as a reference count. 257 * 258 * \return SDL_TRUE if the variable reached zero after decrementing, 259 * SDL_FALSE otherwise 260 */ 261 #ifndef SDL_AtomicDecRef 262 #define SDL_AtomicDecRef(a) (SDL_AtomicAdd(a, -1) == 1) 263 #endif 264 265 /** 266 * \brief Set a pointer to a new value if it is currently an old value. 267 * 268 * \return SDL_TRUE if the pointer was set, SDL_FALSE otherwise. 269 * 270 * \note If you don't know what this function is for, you shouldn't use it! 271 */ 272 extern DECLSPEC SDL_bool SDLCALL SDL_AtomicCASPtr(void **a, void *oldval, void *newval); 273 274 /** 275 * \brief Set a pointer to a value atomically. 276 * 277 * \return The previous value of the pointer. 278 */ 279 extern DECLSPEC void* SDLCALL SDL_AtomicSetPtr(void **a, void* v); 280 281 /** 282 * \brief Get the value of a pointer atomically. 283 */ 284 extern DECLSPEC void* SDLCALL SDL_AtomicGetPtr(void **a); 285 286 /* Ends C function definitions when using C++ */ 287 #ifdef __cplusplus 288 } 289 #endif 290 291 #include "close_code.h" 292 293 #endif /* SDL_atomic_h_ */ 294 295 /* vi: set ts=4 sw=4 expandtab: */ 296