| 1 | /* |
| 2 | Simple DirectMedia Layer |
| 3 | Copyright (C) 1997-2025 Sam Lantinga <slouken@libsdl.org> |
| 4 | |
| 5 | This software is provided 'as-is', without any express or implied |
| 6 | warranty. In no event will the authors be held liable for any damages |
| 7 | arising from the use of this software. |
| 8 | |
| 9 | Permission is granted to anyone to use this software for any purpose, |
| 10 | including commercial applications, and to alter it and redistribute it |
| 11 | freely, subject to the following restrictions: |
| 12 | |
| 13 | 1. The origin of this software must not be misrepresented; you must not |
| 14 | claim that you wrote the original software. If you use this software |
| 15 | in a product, an acknowledgment in the product documentation would be |
| 16 | appreciated but is not required. |
| 17 | 2. Altered source versions must be plainly marked as such, and must not be |
| 18 | misrepresented as being the original software. |
| 19 | 3. This notice may not be removed or altered from any source distribution. |
| 20 | */ |
| 21 | #include "SDL_internal.h" |
| 22 | |
| 23 | #if defined(_MSC_VER) && (_MSC_VER >= 1900) |
| 24 | #include <intrin.h> |
| 25 | #define HAVE_MSC_ATOMICS 1 |
| 26 | #endif |
| 27 | |
| 28 | #ifdef SDL_PLATFORM_MACOS // !!! FIXME: should we favor gcc atomics? |
| 29 | #include <libkern/OSAtomic.h> |
| 30 | #endif |
| 31 | |
| 32 | #if !defined(HAVE_GCC_ATOMICS) && defined(SDL_PLATFORM_SOLARIS) |
| 33 | #include <atomic.h> |
| 34 | #endif |
| 35 | |
// The __atomic_load_n() intrinsic showed up at different times in different
// compilers, so its availability is probed separately from HAVE_GCC_ATOMICS.
#if defined(__clang__)
/* !!! FIXME: this advertises as available in the NDK but uses an external symbol we don't have.
   It might be in a later NDK or we might need an extra library? --ryan. */
#if (__has_builtin(__atomic_load_n) || defined(HAVE_GCC_ATOMICS)) && !defined(SDL_PLATFORM_ANDROID)
#define HAVE_ATOMIC_LOAD_N 1
#endif
#elif defined(__GNUC__) && (__GNUC__ >= 5)
#define HAVE_ATOMIC_LOAD_N 1
#endif
| 50 | |
/* *INDENT-OFF* */ // clang-format off
#if defined(__WATCOMC__) && defined(__386__)
// The helpers below move their operands through 32-bit registers, so they are
// only usable when int is exactly four bytes wide.
SDL_COMPILE_TIME_ASSERT(intsize, 4==sizeof(int));
#define HAVE_WATCOM_ATOMICS

// Atomic exchange: stores v into *a and returns the value *a held before.
// a is passed in ECX and v in EAX; XCHG leaves the old memory contents in
// EAX, which is also the return register.
extern __inline int _SDL_xchg_watcom(volatile int *a, int v);
#pragma aux _SDL_xchg_watcom = \
    "lock xchg [ecx], eax" \
    parm [ecx] [eax] \
    value [eax] \
    modify exact [eax];

// Atomic compare-and-swap: a is passed in EDX, newval in ECX, oldval in EAX.
// CMPXCHG compares EAX with *a and stores ECX into *a when they match,
// setting the zero flag; SETZ turns that flag into the 0/1 result in AL.
extern __inline unsigned char _SDL_cmpxchg_watcom(volatile int *a, int newval, int oldval);
#pragma aux _SDL_cmpxchg_watcom = \
    "lock cmpxchg [edx], ecx" \
    "setz al" \
    parm [edx] [ecx] [eax] \
    value [al] \
    modify exact [eax];

// Atomic fetch-and-add: adds v to *a and returns the value *a held before
// the addition. a is passed in ECX and v in EAX; XADD leaves the old memory
// contents in EAX.
extern __inline int _SDL_xadd_watcom(volatile int *a, int v);
#pragma aux _SDL_xadd_watcom = \
    "lock xadd [ecx], eax" \
    parm [ecx] [eax] \
    value [eax] \
    modify exact [eax];

#endif // __WATCOMC__ && __386__
/* *INDENT-ON* */ // clang-format on
| 79 | |
/*
  If any of the operations are not provided then we must emulate some
  of them. That means we need a nice implementation of spin locks
  that avoids the "one big lock" problem. We use a vector of spin
  locks and pick which one to use based on the address of the operand
  of the function.

  To generate the index of the lock we first shift by 3 bits to get
  rid of the zero bits that result from 32 and 64 bit alignment of
  data. We then mask off all but 5 bits and use those 5 bits as an
  index into the table.

  Picking the lock this way ensures that accesses to the same data at
  the same time will go to the same lock. OTOH, accesses to different
  data have only a 1/32 chance of hitting the same lock. That should
  pretty much eliminate the chance of several atomic operations on
  different data waiting on the same "big lock". If it doesn't,
  then the table of locks can be expanded to a new size so long as
  the new size is a power of two.

  Contributed by Bob Pendleton, bob@pendleton.com
*/
| 102 | |
| 103 | #if !defined(HAVE_MSC_ATOMICS) && !defined(HAVE_GCC_ATOMICS) && !defined(SDL_PLATFORM_MACOS) && !defined(SDL_PLATFORM_SOLARIS) && !defined(HAVE_WATCOM_ATOMICS) |
| 104 | #define EMULATE_CAS 1 |
| 105 | #endif |
| 106 | |
| 107 | #ifdef EMULATE_CAS |
| 108 | static SDL_SpinLock locks[32]; |
| 109 | |
| 110 | static SDL_INLINE void enterLock(void *a) |
| 111 | { |
| 112 | uintptr_t index = ((((uintptr_t)a) >> 3) & 0x1f); |
| 113 | |
| 114 | SDL_LockSpinlock(&locks[index]); |
| 115 | } |
| 116 | |
| 117 | static SDL_INLINE void leaveLock(void *a) |
| 118 | { |
| 119 | uintptr_t index = ((((uintptr_t)a) >> 3) & 0x1f); |
| 120 | |
| 121 | SDL_UnlockSpinlock(&locks[index]); |
| 122 | } |
| 123 | #endif |
| 124 | |
| 125 | bool SDL_CompareAndSwapAtomicInt(SDL_AtomicInt *a, int oldval, int newval) |
| 126 | { |
| 127 | #ifdef HAVE_MSC_ATOMICS |
| 128 | SDL_COMPILE_TIME_ASSERT(atomic_cas, sizeof(long) == sizeof(a->value)); |
| 129 | return _InterlockedCompareExchange((long *)&a->value, (long)newval, (long)oldval) == (long)oldval; |
| 130 | #elif defined(HAVE_WATCOM_ATOMICS) |
| 131 | return _SDL_cmpxchg_watcom((volatile int *)&a->value, newval, oldval); |
| 132 | #elif defined(HAVE_GCC_ATOMICS) |
| 133 | return __sync_bool_compare_and_swap(&a->value, oldval, newval); |
| 134 | #elif defined(SDL_PLATFORM_MACOS) // this is deprecated in 10.12 sdk; favor gcc atomics. |
| 135 | return OSAtomicCompareAndSwap32Barrier(oldval, newval, &a->value); |
| 136 | #elif defined(SDL_PLATFORM_SOLARIS) |
| 137 | SDL_COMPILE_TIME_ASSERT(atomic_cas, sizeof(uint_t) == sizeof(a->value)); |
| 138 | return ((int)atomic_cas_uint((volatile uint_t *)&a->value, (uint_t)oldval, (uint_t)newval) == oldval); |
| 139 | #elif defined(EMULATE_CAS) |
| 140 | bool result = false; |
| 141 | |
| 142 | enterLock(a); |
| 143 | if (a->value == oldval) { |
| 144 | a->value = newval; |
| 145 | result = true; |
| 146 | } |
| 147 | leaveLock(a); |
| 148 | |
| 149 | return result; |
| 150 | #else |
| 151 | #error Please define your platform. |
| 152 | #endif |
| 153 | } |
| 154 | |
| 155 | bool SDL_CompareAndSwapAtomicU32(SDL_AtomicU32 *a, Uint32 oldval, Uint32 newval) |
| 156 | { |
| 157 | #ifdef HAVE_MSC_ATOMICS |
| 158 | SDL_COMPILE_TIME_ASSERT(atomic_cas, sizeof(long) == sizeof(a->value)); |
| 159 | return _InterlockedCompareExchange((long *)&a->value, (long)newval, (long)oldval) == (long)oldval; |
| 160 | #elif defined(HAVE_WATCOM_ATOMICS) |
| 161 | SDL_COMPILE_TIME_ASSERT(atomic_cas, sizeof(int) == sizeof(a->value)); |
| 162 | return _SDL_cmpxchg_watcom((volatile int *)&a->value, (int)newval, (int)oldval); |
| 163 | #elif defined(HAVE_GCC_ATOMICS) |
| 164 | return __sync_bool_compare_and_swap(&a->value, oldval, newval); |
| 165 | #elif defined(SDL_PLATFORM_MACOS) // this is deprecated in 10.12 sdk; favor gcc atomics. |
| 166 | return OSAtomicCompareAndSwap32Barrier((int32_t)oldval, (int32_t)newval, (int32_t*)&a->value); |
| 167 | #elif defined(SDL_PLATFORM_SOLARIS) |
| 168 | SDL_COMPILE_TIME_ASSERT(atomic_cas, sizeof(uint_t) == sizeof(a->value)); |
| 169 | return ((Uint32)atomic_cas_uint((volatile uint_t *)&a->value, (uint_t)oldval, (uint_t)newval) == oldval); |
| 170 | #elif defined(EMULATE_CAS) |
| 171 | bool result = false; |
| 172 | |
| 173 | enterLock(a); |
| 174 | if (a->value == oldval) { |
| 175 | a->value = newval; |
| 176 | result = true; |
| 177 | } |
| 178 | leaveLock(a); |
| 179 | |
| 180 | return result; |
| 181 | #else |
| 182 | #error Please define your platform. |
| 183 | #endif |
| 184 | } |
| 185 | |
| 186 | bool SDL_CompareAndSwapAtomicPointer(void **a, void *oldval, void *newval) |
| 187 | { |
| 188 | #ifdef HAVE_MSC_ATOMICS |
| 189 | return _InterlockedCompareExchangePointer(a, newval, oldval) == oldval; |
| 190 | #elif defined(HAVE_WATCOM_ATOMICS) |
| 191 | return _SDL_cmpxchg_watcom((int *)a, (long)newval, (long)oldval); |
| 192 | #elif defined(HAVE_GCC_ATOMICS) |
| 193 | return __sync_bool_compare_and_swap(a, oldval, newval); |
| 194 | #elif defined(SDL_PLATFORM_MACOS) && defined(__LP64__) // this is deprecated in 10.12 sdk; favor gcc atomics. |
| 195 | return OSAtomicCompareAndSwap64Barrier((int64_t)oldval, (int64_t)newval, (int64_t *)a); |
| 196 | #elif defined(SDL_PLATFORM_MACOS) && !defined(__LP64__) // this is deprecated in 10.12 sdk; favor gcc atomics. |
| 197 | return OSAtomicCompareAndSwap32Barrier((int32_t)oldval, (int32_t)newval, (int32_t *)a); |
| 198 | #elif defined(SDL_PLATFORM_SOLARIS) |
| 199 | return (atomic_cas_ptr(a, oldval, newval) == oldval); |
| 200 | #elif defined(EMULATE_CAS) |
| 201 | bool result = false; |
| 202 | |
| 203 | enterLock(a); |
| 204 | if (*a == oldval) { |
| 205 | *a = newval; |
| 206 | result = true; |
| 207 | } |
| 208 | leaveLock(a); |
| 209 | |
| 210 | return result; |
| 211 | #else |
| 212 | #error Please define your platform. |
| 213 | #endif |
| 214 | } |
| 215 | |
| 216 | int SDL_SetAtomicInt(SDL_AtomicInt *a, int v) |
| 217 | { |
| 218 | #ifdef HAVE_MSC_ATOMICS |
| 219 | SDL_COMPILE_TIME_ASSERT(atomic_set, sizeof(long) == sizeof(a->value)); |
| 220 | return _InterlockedExchange((long *)&a->value, v); |
| 221 | #elif defined(HAVE_WATCOM_ATOMICS) |
| 222 | return _SDL_xchg_watcom(&a->value, v); |
| 223 | #elif defined(HAVE_GCC_ATOMICS) |
| 224 | return __sync_lock_test_and_set(&a->value, v); |
| 225 | #elif defined(SDL_PLATFORM_SOLARIS) |
| 226 | SDL_COMPILE_TIME_ASSERT(atomic_set, sizeof(uint_t) == sizeof(a->value)); |
| 227 | return (int)atomic_swap_uint((volatile uint_t *)&a->value, v); |
| 228 | #else |
| 229 | int value; |
| 230 | do { |
| 231 | value = a->value; |
| 232 | } while (!SDL_CompareAndSwapAtomicInt(a, value, v)); |
| 233 | return value; |
| 234 | #endif |
| 235 | } |
| 236 | |
| 237 | Uint32 SDL_SetAtomicU32(SDL_AtomicU32 *a, Uint32 v) |
| 238 | { |
| 239 | #ifdef HAVE_MSC_ATOMICS |
| 240 | SDL_COMPILE_TIME_ASSERT(atomic_set, sizeof(long) == sizeof(a->value)); |
| 241 | return _InterlockedExchange((long *)&a->value, v); |
| 242 | #elif defined(HAVE_WATCOM_ATOMICS) |
| 243 | return _SDL_xchg_watcom(&a->value, v); |
| 244 | #elif defined(HAVE_GCC_ATOMICS) |
| 245 | return __sync_lock_test_and_set(&a->value, v); |
| 246 | #elif defined(SDL_PLATFORM_SOLARIS) |
| 247 | SDL_COMPILE_TIME_ASSERT(atomic_set, sizeof(uint_t) == sizeof(a->value)); |
| 248 | return (Uint32)atomic_swap_uint((volatile uint_t *)&a->value, v); |
| 249 | #else |
| 250 | Uint32 value; |
| 251 | do { |
| 252 | value = a->value; |
| 253 | } while (!SDL_CompareAndSwapAtomicU32(a, value, v)); |
| 254 | return value; |
| 255 | #endif |
| 256 | } |
| 257 | |
/*
 * Atomically store v into *a.
 *
 * a  address of the pointer to update.
 * v  pointer value to store.
 *
 * Returns the pointer *a held immediately before the store.
 */
void *SDL_SetAtomicPointer(void **a, void *v)
{
#ifdef HAVE_MSC_ATOMICS
    return _InterlockedExchangePointer(a, v);
#elif defined(HAVE_WATCOM_ATOMICS)
    return (void *)_SDL_xchg_watcom((int *)a, (long)v);
#elif defined(HAVE_GCC_ATOMICS)
    /* GCC documents __sync_lock_test_and_set() as an acquire barrier only,
       so earlier stores (for example the initialisation of the object being
       published through this pointer) could otherwise be reordered after
       the exchange. The explicit fence supplies the missing release half. */
    __sync_synchronize();
    return __sync_lock_test_and_set(a, v);
#elif defined(SDL_PLATFORM_SOLARIS)
    return atomic_swap_ptr(a, v);
#else
    // No native exchange: retry a compare-and-swap until no other writer intervenes.
    void *value;
    do {
        value = *a;
    } while (!SDL_CompareAndSwapAtomicPointer(a, value, v));
    return value;
#endif
}
| 276 | |
| 277 | int SDL_AddAtomicInt(SDL_AtomicInt *a, int v) |
| 278 | { |
| 279 | #ifdef HAVE_MSC_ATOMICS |
| 280 | SDL_COMPILE_TIME_ASSERT(atomic_add, sizeof(long) == sizeof(a->value)); |
| 281 | return _InterlockedExchangeAdd((long *)&a->value, v); |
| 282 | #elif defined(HAVE_WATCOM_ATOMICS) |
| 283 | SDL_COMPILE_TIME_ASSERT(atomic_add, sizeof(int) == sizeof(a->value)); |
| 284 | return _SDL_xadd_watcom((volatile int *)&a->value, v); |
| 285 | #elif defined(HAVE_GCC_ATOMICS) |
| 286 | return __sync_fetch_and_add(&a->value, v); |
| 287 | #elif defined(SDL_PLATFORM_SOLARIS) |
| 288 | int pv = a->value; |
| 289 | membar_consumer(); |
| 290 | atomic_add_int((volatile uint_t *)&a->value, v); |
| 291 | return pv; |
| 292 | #else |
| 293 | int value; |
| 294 | do { |
| 295 | value = a->value; |
| 296 | } while (!SDL_CompareAndSwapAtomicInt(a, value, (value + v))); |
| 297 | return value; |
| 298 | #endif |
| 299 | } |
| 300 | |
| 301 | int SDL_GetAtomicInt(SDL_AtomicInt *a) |
| 302 | { |
| 303 | #ifdef HAVE_ATOMIC_LOAD_N |
| 304 | return __atomic_load_n(&a->value, __ATOMIC_SEQ_CST); |
| 305 | #elif defined(HAVE_MSC_ATOMICS) |
| 306 | SDL_COMPILE_TIME_ASSERT(atomic_get, sizeof(long) == sizeof(a->value)); |
| 307 | return _InterlockedOr((long *)&a->value, 0); |
| 308 | #elif defined(HAVE_WATCOM_ATOMICS) |
| 309 | return _SDL_xadd_watcom(&a->value, 0); |
| 310 | #elif defined(HAVE_GCC_ATOMICS) |
| 311 | return __sync_or_and_fetch(&a->value, 0); |
| 312 | #elif defined(SDL_PLATFORM_MACOS) // this is deprecated in 10.12 sdk; favor gcc atomics. |
| 313 | return sizeof(a->value) == sizeof(uint32_t) ? OSAtomicOr32Barrier(0, (volatile uint32_t *)&a->value) : OSAtomicAdd64Barrier(0, (volatile int64_t *)&a->value); |
| 314 | #elif defined(SDL_PLATFORM_SOLARIS) |
| 315 | return atomic_or_uint_nv((volatile uint_t *)&a->value, 0); |
| 316 | #else |
| 317 | int value; |
| 318 | do { |
| 319 | value = a->value; |
| 320 | } while (!SDL_CompareAndSwapAtomicInt(a, value, value)); |
| 321 | return value; |
| 322 | #endif |
| 323 | } |
| 324 | |
| 325 | Uint32 SDL_GetAtomicU32(SDL_AtomicU32 *a) |
| 326 | { |
| 327 | #ifdef HAVE_ATOMIC_LOAD_N |
| 328 | return __atomic_load_n(&a->value, __ATOMIC_SEQ_CST); |
| 329 | #elif defined(HAVE_MSC_ATOMICS) |
| 330 | SDL_COMPILE_TIME_ASSERT(atomic_get, sizeof(long) == sizeof(a->value)); |
| 331 | return (Uint32)_InterlockedOr((long *)&a->value, 0); |
| 332 | #elif defined(HAVE_WATCOM_ATOMICS) |
| 333 | SDL_COMPILE_TIME_ASSERT(atomic_get, sizeof(int) == sizeof(a->value)); |
| 334 | return (Uint32)_SDL_xadd_watcom((volatile int *)&a->value, 0); |
| 335 | #elif defined(HAVE_GCC_ATOMICS) |
| 336 | return __sync_or_and_fetch(&a->value, 0); |
| 337 | #elif defined(SDL_PLATFORM_MACOS) // this is deprecated in 10.12 sdk; favor gcc atomics. |
| 338 | return OSAtomicOr32Barrier(0, (volatile uint32_t *)&a->value); |
| 339 | #elif defined(SDL_PLATFORM_SOLARIS) |
| 340 | SDL_COMPILE_TIME_ASSERT(atomic_get, sizeof(uint_t) == sizeof(a->value)); |
| 341 | return (Uint32)atomic_or_uint_nv((volatile uint_t *)&a->value, 0); |
| 342 | #else |
| 343 | Uint32 value; |
| 344 | do { |
| 345 | value = a->value; |
| 346 | } while (!SDL_CompareAndSwapAtomicU32(a, value, value)); |
| 347 | return value; |
| 348 | #endif |
| 349 | } |
| 350 | |
/*
 * Atomically read *a.
 *
 * a  address of the pointer to read.
 *
 * Returns the current pointer value. Backends without a dedicated atomic
 * load obtain it from a compare-and-swap that cannot change the stored
 * value (NULL for NULL, or the sampled value for itself).
 */
void *SDL_GetAtomicPointer(void **a)
{
#if defined(HAVE_ATOMIC_LOAD_N)
    return __atomic_load_n(a, __ATOMIC_SEQ_CST);
#elif defined(HAVE_MSC_ATOMICS)
    return _InterlockedCompareExchangePointer(a, NULL, NULL);
#elif defined(HAVE_GCC_ATOMICS)
    return __sync_val_compare_and_swap(a, (void *)0, (void *)0);
#elif defined(SDL_PLATFORM_SOLARIS)
    return atomic_cas_ptr(a, (void *)0, (void *)0);
#else
    // Keep sampling until a compare-and-swap confirms the sample was current.
    for (;;) {
        void *const snapshot = *a;
        if (SDL_CompareAndSwapAtomicPointer(a, snapshot, snapshot)) {
            return snapshot;
        }
    }
#endif
}
| 369 | |
// Refuse to build this file when the barrier macros are in "uses function" mode.
// NOTE(review): presumably SDL_MEMORY_BARRIER_USES_FUNCTION means the
// SDL_MemoryBarrier*() macros forward to the functions defined below, in
// which case those definitions would end up calling themselves; confirm
// against the header that defines the macro.
#ifdef SDL_MEMORY_BARRIER_USES_FUNCTION
#error This file should be built in arm mode so the mcr instruction is available for memory barriers
#endif

// Out-of-line entry point that performs SDL_MemoryBarrierRelease().
void SDL_MemoryBarrierReleaseFunction(void)
{
    SDL_MemoryBarrierRelease();
}
| 378 | |
// Out-of-line entry point that performs SDL_MemoryBarrierAcquire().
void SDL_MemoryBarrierAcquireFunction(void)
{
    SDL_MemoryBarrierAcquire();
}
| 383 | |