| [fe065c3] | 1 | #include <stdio.h> | 
|---|
|  | 2 | #include <stdint.h>                                                                             // uintptr_t | 
|---|
|  | 3 |  | 
|---|
|  | 4 | #include "bench.h" | 
|---|
|  | 5 |  | 
|---|
| [525b5ef] | 6 | // Does a "lock xchg" on entry but a simple "mov" on exit => cheaper when there is no contention. While it has much | 
|---|
|  | 7 | // more code, the bulk of it is never run. | 
|---|
|  | 8 |  | 
|---|
// Alignment (in bytes) applied to the lock word and its padding.
#define CACHE_ALIGN 128
#define CALIGN __attribute__(( aligned (CACHE_ALIGN) ))

// Pause(): architecture-specific spin-wait hint issued inside busy-wait loops.
#if defined( __ARM_ARCH )
	#define Pause() __asm__ __volatile__ ( "YIELD" : : : )
#elif defined( __i386 ) || defined( __x86_64 )
	#define Pause() __asm__ __volatile__ ( "pause" : : : )
#else
	#error unsupported architecture
#endif

typedef uintptr_t TYPE;								// addressable word-size

// The benchmarked lock word: 0 when free, non-zero when held.
static volatile TYPE lock CALIGN;					// 128-byte alignment: Intel recommendation
// Aligned filler declared right after the lock; intended to protect against further false sharing.
static TYPE PAD CALIGN __attribute__(( unused ));
|---|
|  | 22 |  | 
|---|
|  | 23 | static inline void spin_lock( volatile TYPE *lock ) { | 
|---|
|  | 24 | enum { SPIN_START = 4, SPIN_END = 64 * 1024, }; | 
|---|
|  | 25 | unsigned int spin = SPIN_START; | 
|---|
|  | 26 |  | 
|---|
|  | 27 | for ( unsigned int i = 1;; i += 1 ) { | 
|---|
|  | 28 | if ( *lock == 0 && __atomic_test_and_set( lock, __ATOMIC_ACQUIRE ) == 0 ) break; | 
|---|
|  | 29 | for ( volatile unsigned int s = 0; s < spin; s += 1 ) Pause(); // exponential spin | 
|---|
|  | 30 | //spin += spin;                                                                 // powers of 2 | 
|---|
|  | 31 | if ( i % 64 == 0 ) spin += spin;                                // slowly increase by powers of 2 | 
|---|
|  | 32 | if ( spin > SPIN_END ) spin = SPIN_START;               // prevent overflow | 
|---|
|  | 33 | } // for | 
|---|
|  | 34 | } // spin_lock | 
|---|
|  | 35 |  | 
|---|
|  | 36 | static inline void spin_unlock( volatile TYPE *lock ) { | 
|---|
|  | 37 | __atomic_clear( lock, __ATOMIC_RELEASE ); | 
|---|
|  | 38 | } // spin_unlock | 
|---|
|  | 39 |  | 
|---|
|  | 40 | void __attribute__((noinline)) do_call() { | 
|---|
|  | 41 | spin_lock( &lock ); | 
|---|
|  | 42 | //      asm volatile (""); | 
|---|
|  | 43 | spin_unlock( &lock ); | 
|---|
|  | 44 | } | 
|---|
|  | 45 |  | 
|---|
| [b4107c8] | 46 | int main( int argc, char * argv[] ) { | 
|---|
|  | 47 | BENCH_START() | 
|---|
| [fe065c3] | 48 | BENCH( | 
|---|
| [b4107c8] | 49 | for (size_t i = 0; i < times; i++) { | 
|---|
| [fe065c3] | 50 | do_call(); | 
|---|
|  | 51 | }, | 
|---|
|  | 52 | result | 
|---|
| [b4107c8] | 53 | ) | 
|---|
|  | 54 | printf( "%g\n", result ); | 
|---|
| [fe065c3] | 55 | } | 
|---|
|  | 56 |  | 
|---|
|  | 57 | // Local Variables: // | 
|---|
|  | 58 | // tab-width: 4 // | 
|---|
|  | 59 | // End: // | 
|---|