Mercurial > sdl-ios-xcode
view src/atomic/linux/SDL_atomic.c @ 3295:4ff84e8939c1
Whoops, need both the header and the library!
author | Sam Lantinga <slouken@libsdl.org> |
---|---|
date | Mon, 21 Sep 2009 11:31:28 +0000 |
parents | 72b542f34739 |
children | 6fe620d7ce92 |
line wrap: on
line source
/* SDL - Simple DirectMedia Layer Copyright (C) 1997-2009 Sam Lantinga This library is free software; you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. This library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details. You should have received a copy of the GNU Lesser General Public License along with this library; if not, write to the Free Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA Sam Lantinga slouken@libsdl.org Contributed by Bob Pendleton, bob@pendleton.com */ #include "SDL_stdinc.h" #include "SDL_atomic.h" #include "SDL_error.h" /* This file provides 32, and 64 bit atomic operations. If the operations are provided by the native hardware and operating system they are used. If they are not then the operations are emulated using the SDL spin lock operations. If spin lock can not be implemented then these functions must fail. */ /* LINUX/GCC VERSION. This version of the code assumes support of the atomic builtins as documented at gcc.gnu.org/onlinedocs/gcc/Atomic-Builtins.html This code should work on any modern x86 or other processor supported by GCC. Some processors will only support some of these operations so #ifdefs will have to be added as incompatibilities are discovered */ /* Native spinlock routines. */ void SDL_AtomicLock(SDL_SpinLock *lock) { while (0 != __sync_lock_test_and_set(lock, 1)) { } } void SDL_AtomicUnlock(SDL_SpinLock *lock) { __sync_lock_test_and_set(lock, 0); } /* Note that platform specific versions can be built from this version by changing the #undefs to #defines and adding platform specific code. */ #define nativeTestThenSet32 #define nativeClear32 #define nativeFetchThenIncrement32 #define nativeFetchThenDecrement32 #define nativeFetchThenAdd32 #define nativeFetchThenSubtract32 #define nativeIncrementThenFetch32 #define nativeDecrementThenFetch32 #define nativeAddThenFetch32 #define nativeSubtractThenFetch32 #define nativeTestThenSet64 #define nativeClear64 #define nativeFetchThenIncrement64 #define nativeFetchThenDecrement64 #define nativeFetchThenAdd64 #define nativeFetchThenSubtract64 #define nativeIncrementThenFetch64 #define nativeDecrementThenFetch64 #define nativeAddThenFetch64 #define nativeSubtractThenFetch64 /* If any of the operations are not provided then we must emulate some of them. That means we need a nice implementation of spin locks that avoids the "one big lock" problem. We use a vector of spin locks and pick which one to use based on the address of the operand of the function. To generate the index of the lock we first shift by 3 bits to get rid on the zero bits that result from 32 and 64 bit allignment of data. We then mask off all but 5 bits and use those 5 bits as an index into the table. Picking the lock this way insures that accesses to the same data at the same time will go to the same lock. OTOH, accesses to different data have only a 1/32 chance of hitting the same lock. That should pretty much eliminate the chances of several atomic operations on different data from waiting on the same "big lock". If it isn't then the table of locks can be expanded to a new size so long as the new size if a power of two. */ static SDL_SpinLock locks[32] = { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, }; static __inline__ void privateWaitLock(volatile void *ptr) { #if SIZEOF_VOIDP == 4 Uint32 index = ((((Uint32)ptr) >> 3) & 0x1f); #elif SIZEOF_VOIDP == 8 Uint64 index = ((((Uint64)ptr) >> 3) & 0x1f); #endif SDL_AtomicLock(&locks[index]); } static __inline__ void privateUnlock(volatile void *ptr) { #if SIZEOF_VOIDP == 4 Uint32 index = ((((Uint32)ptr) >> 3) & 0x1f); #elif SIZEOF_VOIDP == 8 Uint64 index = ((((Uint64)ptr) >> 3) & 0x1f); #endif SDL_AtomicUnlock(&locks[index]); } /* 32 bit atomic operations */ SDL_bool SDL_AtomicTestThenSet32(volatile Uint32 * ptr) { #ifdef nativeTestThenSet32 return 0 == __sync_lock_test_and_set(ptr, 1); #else SDL_bool result = SDL_FALSE; privateWaitLock(ptr); result = (*ptr == 0); if (result) { *ptr = 1; } privateUnlock(ptr); return result; #endif } void SDL_AtomicClear32(volatile Uint32 * ptr) { #ifdef nativeClear32 __sync_lock_test_and_set(ptr, 0); return; #else privateWaitLock(ptr); *ptr = 0; privateUnlock(ptr); return; #endif } Uint32 SDL_AtomicFetchThenIncrement32(volatile Uint32 * ptr) { #ifdef nativeFetchThenIncrement32 return __sync_fetch_and_add(ptr, 1); #else Uint32 tmp = 0; privateWaitLock(ptr); tmp = *ptr; (*ptr)+= 1; privateUnlock(ptr); return tmp; #endif } Uint32 SDL_AtomicFetchThenDecrement32(volatile Uint32 * ptr) { #ifdef nativeFetchThenDecrement32 return __sync_fetch_and_sub(ptr, 1); #else Uint32 tmp = 0; privateWaitLock(ptr); tmp = *ptr; (*ptr) -= 1; privateUnlock(ptr); return tmp; #endif } Uint32 SDL_AtomicFetchThenAdd32(volatile Uint32 * ptr, Uint32 value) { #ifdef nativeFetchThenAdd32 return __sync_fetch_and_add(ptr, value); #else Uint32 tmp = 0; privateWaitLock(ptr); tmp = *ptr; (*ptr)+= value; privateUnlock(ptr); return tmp; #endif } Uint32 SDL_AtomicFetchThenSubtract32(volatile Uint32 * ptr, Uint32 value) { #ifdef nativeFetchThenSubtract32 return __sync_fetch_and_sub(ptr, value); #else Uint32 tmp = 0; privateWaitLock(ptr); tmp = *ptr; (*ptr)-= value; privateUnlock(ptr); return tmp; #endif } Uint32 SDL_AtomicIncrementThenFetch32(volatile Uint32 * ptr) { #ifdef nativeIncrementThenFetch32 return __sync_add_and_fetch(ptr, 1); #else Uint32 tmp = 0; privateWaitLock(ptr); (*ptr)+= 1; tmp = *ptr; privateUnlock(ptr); return tmp; #endif } Uint32 SDL_AtomicDecrementThenFetch32(volatile Uint32 * ptr) { #ifdef nativeDecrementThenFetch32 return __sync_sub_and_fetch(ptr, 1); #else Uint32 tmp = 0; privateWaitLock(ptr); (*ptr)-= 1; tmp = *ptr; privateUnlock(ptr); return tmp; #endif } Uint32 SDL_AtomicAddThenFetch32(volatile Uint32 * ptr, Uint32 value) { #ifdef nativeAddThenFetch32 return __sync_add_and_fetch(ptr, value); #else Uint32 tmp = 0; privateWaitLock(ptr); (*ptr)+= value; tmp = *ptr; privateUnlock(ptr); return tmp; #endif } Uint32 SDL_AtomicSubtractThenFetch32(volatile Uint32 * ptr, Uint32 value) { #ifdef nativeSubtractThenFetch32 return __sync_sub_and_fetch(ptr, value); #else Uint32 tmp = 0; privateWaitLock(ptr); (*ptr)-= value; tmp = *ptr; privateUnlock(ptr); return tmp; #endif } /* 64 bit atomic operations */ #ifdef SDL_HAS_64BIT_TYPE SDL_bool SDL_AtomicTestThenSet64(volatile Uint64 * ptr) { #ifdef nativeTestThenSet64 return 0 == __sync_lock_test_and_set(ptr, 1); #else SDL_bool result = SDL_FALSE; privateWaitLock(ptr); result = (*ptr == 0); if (result) { *ptr = 1; } privateUnlock(ptr); return result; #endif } void SDL_AtomicClear64(volatile Uint64 * ptr) { #ifdef nativeClear64 __sync_lock_test_and_set(ptr, 0); return; #else privateWaitLock(ptr); *ptr = 0; privateUnlock(ptr); return; #endif } Uint64 SDL_AtomicFetchThenIncrement64(volatile Uint64 * ptr) { #ifdef nativeFetchThenIncrement64 return __sync_fetch_and_add(ptr, 1); #else Uint64 tmp = 0; privateWaitLock(ptr); tmp = *ptr; (*ptr)+= 1; privateUnlock(ptr); return tmp; #endif } Uint64 SDL_AtomicFetchThenDecrement64(volatile Uint64 * ptr) { #ifdef nativeFetchThenDecrement64 return __sync_fetch_and_sub(ptr, 1); #else Uint64 tmp = 0; privateWaitLock(ptr); tmp = *ptr; (*ptr) -= 1; privateUnlock(ptr); return tmp; #endif } Uint64 SDL_AtomicFetchThenAdd64(volatile Uint64 * ptr, Uint64 value) { #ifdef nativeFetchThenAdd64 return __sync_fetch_and_add(ptr, value); #else Uint64 tmp = 0; privateWaitLock(ptr); tmp = *ptr; (*ptr)+= value; privateUnlock(ptr); return tmp; #endif } Uint64 SDL_AtomicFetchThenSubtract64(volatile Uint64 * ptr, Uint64 value) { #ifdef nativeFetchThenSubtract64 return __sync_fetch_and_sub(ptr, value); #else Uint64 tmp = 0; privateWaitLock(ptr); tmp = *ptr; (*ptr)-= value; privateUnlock(ptr); return tmp; #endif } Uint64 SDL_AtomicIncrementThenFetch64(volatile Uint64 * ptr) { #ifdef nativeIncrementThenFetch64 return __sync_add_and_fetch(ptr, 1); #else Uint64 tmp = 0; privateWaitLock(ptr); (*ptr)+= 1; tmp = *ptr; privateUnlock(ptr); return tmp; #endif } Uint64 SDL_AtomicDecrementThenFetch64(volatile Uint64 * ptr) { #ifdef nativeDecrementThenFetch64 return __sync_sub_and_fetch(ptr, 1); #else Uint64 tmp = 0; privateWaitLock(ptr); (*ptr)-= 1; tmp = *ptr; privateUnlock(ptr); return tmp; #endif } Uint64 SDL_AtomicAddThenFetch64(volatile Uint64 * ptr, Uint64 value) { #ifdef nativeAddThenFetch64 return __sync_add_and_fetch(ptr, value); #else Uint64 tmp = 0; privateWaitLock(ptr); (*ptr)+= value; tmp = *ptr; privateUnlock(ptr); return tmp; #endif } Uint64 SDL_AtomicSubtractThenFetch64(volatile Uint64 * ptr, Uint64 value) { #ifdef nativeSubtractThenFetch64 return __sync_sub_and_fetch(ptr, value); #else Uint64 tmp = 0; privateWaitLock(ptr); (*ptr)-= value; tmp = *ptr; privateUnlock(ptr); return tmp; #endif } #endif /* SDL_HAS_64BIT_TYPE */