[fe065c3] | 1 | #include <stdio.h> |
---|
| 2 | #include <stdint.h> // uintptr_t |
---|
| 3 | |
---|
| 4 | #include "bench.h" |
---|
| 5 | |
---|
[525b5ef] | 6 | // Does a "lock xchg" on entry but a simple "mov" on exit => cheaper as 0 contention. While it has much more code, the |
---|
| 7 | // bulk is never run. |
---|
| 8 | |
---|
[fe065c3] | 9 | #define CALIGN __attribute__(( aligned (CACHE_ALIGN) )) |
---|
| 10 | #define CACHE_ALIGN 128 |
---|
[7f5683e] | 11 | #if defined( __i386 ) || defined( __x86_64 ) |
---|
| 12 | #define Pause() __asm__ __volatile__ ( "pause" : : : ) |
---|
| 13 | #elif defined( __ARM_ARCH ) |
---|
| 14 | #define Pause() __asm__ __volatile__ ( "YIELD" : : : ) |
---|
| 15 | #else |
---|
| 16 | #error unsupported architecture |
---|
| 17 | #endif |
---|
[fe065c3] | 18 | |
---|
| 19 | typedef uintptr_t TYPE; // addressable word-size |
---|
| 20 | static volatile TYPE lock __attribute__(( aligned (128) )); // Intel recommendation |
---|
| 21 | static TYPE PAD CALIGN __attribute__(( unused )); // protect further false sharing |
---|
| 22 | |
---|
| 23 | static inline void spin_lock( volatile TYPE *lock ) { |
---|
| 24 | enum { SPIN_START = 4, SPIN_END = 64 * 1024, }; |
---|
| 25 | unsigned int spin = SPIN_START; |
---|
| 26 | |
---|
| 27 | for ( unsigned int i = 1;; i += 1 ) { |
---|
| 28 | if ( *lock == 0 && __atomic_test_and_set( lock, __ATOMIC_ACQUIRE ) == 0 ) break; |
---|
| 29 | for ( volatile unsigned int s = 0; s < spin; s += 1 ) Pause(); // exponential spin |
---|
| 30 | //spin += spin; // powers of 2 |
---|
| 31 | if ( i % 64 == 0 ) spin += spin; // slowly increase by powers of 2 |
---|
| 32 | if ( spin > SPIN_END ) spin = SPIN_START; // prevent overflow |
---|
| 33 | } // for |
---|
| 34 | } // spin_lock |
---|
| 35 | |
---|
| 36 | static inline void spin_unlock( volatile TYPE *lock ) { |
---|
| 37 | __atomic_clear( lock, __ATOMIC_RELEASE ); |
---|
| 38 | } // spin_unlock |
---|
| 39 | |
---|
| 40 | void __attribute__((noinline)) do_call() { |
---|
| 41 | spin_lock( &lock ); |
---|
| 42 | // asm volatile (""); |
---|
| 43 | spin_unlock( &lock ); |
---|
| 44 | } |
---|
| 45 | |
---|
[b4107c8] | 46 | int main( int argc, char * argv[] ) { |
---|
| 47 | BENCH_START() |
---|
[fe065c3] | 48 | BENCH( |
---|
[b4107c8] | 49 | for (size_t i = 0; i < times; i++) { |
---|
[fe065c3] | 50 | do_call(); |
---|
| 51 | }, |
---|
| 52 | result |
---|
[b4107c8] | 53 | ) |
---|
| 54 | printf( "%g\n", result ); |
---|
[fe065c3] | 55 | } |
---|
| 56 | |
---|
| 57 | // Local Variables: // |
---|
| 58 | // tab-width: 4 // |
---|
| 59 | // End: // |
---|