| [ea7d2b0] | 1 | // | 
|---|
|  | 2 | // Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo | 
|---|
|  | 3 | // | 
|---|
|  | 4 | // The contents of this file are covered under the licence agreement in the | 
|---|
|  | 5 | // file "LICENCE" distributed with Cforall. | 
|---|
|  | 6 | // | 
|---|
| [73abe95] | 7 | // bits/locks.hfa -- Fast internal locks. | 
|---|
| [ea7d2b0] | 8 | // | 
|---|
|  | 9 | // Author           : Thierry Delisle | 
|---|
|  | 10 | // Created On       : Tue Oct 31 15:14:38 2017 | 
|---|
| [b158d8f] | 11 | // Last Modified By : Peter A. Buhr | 
|---|
| [e3fea42] | 12 | // Last Modified On : Tue Feb  4 13:03:19 2020 | 
|---|
|  | 13 | // Update Count     : 11 | 
|---|
| [ea7d2b0] | 14 | // | 
|---|
|  | 15 |  | 
|---|
|  | 16 | #pragma once | 
|---|
|  | 17 |  | 
|---|
| [73abe95] | 18 | #include "bits/debug.hfa" | 
|---|
|  | 19 | #include "bits/defs.hfa" | 
|---|
| [ea8b2f7] | 20 | #include <assert.h> | 
|---|
|  | 21 |  | 
|---|
|  | 22 | #ifdef __cforall | 
|---|
|  | 23 | extern "C" { | 
|---|
|  | 24 | #include <pthread.h> | 
|---|
|  | 25 | } | 
|---|
|  | 26 | #endif | 
|---|
| [ea7d2b0] | 27 |  | 
|---|
// Pause(): hint executed inside busy-wait loops to prevent excess processor bus usage.
// Expands to a single inline-assembly statement selected by target architecture;
// compilation fails on architectures without an entry.
#if defined( __sparc )
	#define Pause() __asm__ __volatile__ ( "rd %ccr,%g0" )
#elif defined( __i386 ) || defined( __x86_64 )
	#define Pause() __asm__ __volatile__ ( "pause" : : : )
#elif defined( __ARM_ARCH )
	#if __ARM_ARCH >= 7
		// YIELD is the architectural spin-wait hint; a plain NOP gives the core no hint at all
		#define Pause() __asm__ __volatile__ ( "yield" : : : )
	#else
		// older cores: the assembler may reject YIELD, fall back to NOP
		#define Pause() __asm__ __volatile__ ( "nop" : : : )
	#endif
#else
	#error unsupported architecture
#endif
|---|
|  | 38 |  | 
|---|
// Spinlock state: a single test-and-set flag, plus bookkeeping fields in debug builds.
struct __spinlock_t {
	// Lock flag: zero when free, set through __atomic_test_and_set while held.
	// NOTE(review): an earlier comment here read "Wrap in struct to prevent false sharing
	// with debug info"; no wrapper struct is present in this definition -- confirm intent.
	volatile bool lock;
	#ifdef __CFA_DEBUG__
		// previous function to acquire the lock
		const char * prev_name;
		// previous thread to acquire the lock
		void * prev_thrd;
	#endif
};
|---|
| [ea7d2b0] | 49 |  | 
|---|
| [0cf5b79] | 50 | #ifdef __cforall | 
|---|
extern "C" {
	// Interrupt control, defined elsewhere; the spinlock routines call these around the critical section.
	extern void disable_interrupts() OPTIONAL_THREAD;
	extern void enable_interrupts_noPoll() OPTIONAL_THREAD;

	// Hook invoked right after a spinlock is acquired.
	// Without __CFA_DEBUG__ the call expands to nothing.
	#ifndef __CFA_DEBUG__
		#define __cfaabi_dbg_record_lock(x, y)
	#else
		void __cfaabi_dbg_record_lock(__spinlock_t & this, const char prev_name[]);
	#endif
}
|---|
|  | 61 |  | 
|---|
// Constructor: a new spinlock starts out released.
static inline void ?{}( __spinlock_t & this ) {
	this.lock = false;
}
|---|
|  | 65 |  | 
|---|
// Attempt to take the spinlock without spinning.
// Returns true when the lock was acquired, false if it was already held.
// Interrupts are disabled before the attempt; they stay disabled on success
// (unlock() re-enables them) and are re-enabled here on failure.
static inline bool try_lock  ( __spinlock_t & this __cfaabi_dbg_ctx_param2 ) {
	disable_interrupts();

	// plain read first, atomic test-and-set only if the flag looks free
	if ( this.lock != 0 || __atomic_test_and_set( &this.lock, __ATOMIC_ACQUIRE ) != 0 ) {
		enable_interrupts_noPoll();
		return false;
	}

	__cfaabi_dbg_record_lock( this, caller );
	return true;
}
|---|
|  | 77 |  | 
|---|
// Take the spinlock, busy-waiting until it becomes available.
// Interrupts are disabled before spinning and remain disabled on return.
// Unless NOEXPBACK is defined, failed attempts are separated by a run of Pause()
// calls whose length doubles every 64 attempts and restarts at SPIN_START once
// it exceeds SPIN_END.
static inline void lock( __spinlock_t & this __cfaabi_dbg_ctx_param2 ) {
	#ifndef NOEXPBACK
		enum { SPIN_START = 4, SPIN_END = 64 * 1024, };
		unsigned int spin = SPIN_START;
	#endif

	disable_interrupts();

	// plain read first, atomic test-and-set only if the flag looks free
	unsigned int attempt = 1;
	while ( this.lock != 0 || __atomic_test_and_set( &this.lock, __ATOMIC_ACQUIRE ) != 0 ) {
		#ifndef NOEXPBACK
			// exponential spin
			for ( volatile unsigned int s = 0; s < spin; s += 1 ) Pause();

			// slowly increase by powers of 2
			if ( attempt % 64 == 0 ) spin += spin;

			// prevent overflow
			if ( spin > SPIN_END ) spin = SPIN_START;
		#else
			Pause();
		#endif
		attempt += 1;
	}

	__cfaabi_dbg_record_lock( this, caller );
}
|---|
|  | 103 |  | 
|---|
// Release the spinlock: clear the flag with release ordering, then re-enable
// the interrupts that lock()/try_lock() disabled.
static inline void unlock( __spinlock_t & this ) {
	__atomic_clear( &this.lock, __ATOMIC_RELEASE );
	enable_interrupts_noPoll();
}
|---|
| [ea8b2f7] | 108 |  | 
|---|
|  | 109 |  | 
|---|
// Declared only when __CFA_WITH_VERIFY__ is defined; referenced inside verify()
// by wait( __bin_sem_t & ).
#if defined( __CFA_WITH_VERIFY__ )
	extern bool __cfaabi_dbg_in_kernel();
#endif
|---|
|  | 113 |  | 
|---|
extern "C" {
	char * strerror(int);
}

// CHECKED(x): evaluate x exactly once; if the resulting int is non-zero, abort with a
// message naming the failed operation, the error number and its strerror() text.
// Wrapped in do/while(0) so it behaves as a single statement (safe in unbraced if/else),
// with the argument parenthesized and a distinct local name so an `err` variable in the
// caller cannot be captured.
#define CHECKED(x) do { int __checked_err = (x); if( __checked_err != 0 ) abort("KERNEL ERROR: Operation \"" #x "\" return error %d - %s\n", __checked_err, strerror(__checked_err)); } while( 0 )
|---|
| [c66f6cb] | 118 |  | 
|---|
// Binary semaphore built from a pthread mutex / condition-variable pair.
struct __bin_sem_t {
	pthread_mutex_t lock;	// held while val is read or modified
	pthread_cond_t  cond;	// signalled by post() when val is raised
	int             val;	// starts at 0; post() raises it only while below 1, wait() lowers it by 1
};
|---|
|  | 124 |  | 
|---|
// Constructor: initialise the mutex (error-checking type) and condition variable,
// and start with the semaphore value at 0.
// Every pthread call is checked; a non-zero result aborts through CHECKED.
static inline void ?{}(__bin_sem_t & this) with( this ) {
	// Create the mutex with error checking
	pthread_mutexattr_t mattr;
	CHECKED( pthread_mutexattr_init( &mattr ) );
	CHECKED( pthread_mutexattr_settype( &mattr, PTHREAD_MUTEX_ERRORCHECK_NP ) );
	CHECKED( pthread_mutex_init( &lock, &mattr ) );
	// the attribute object is no longer needed once the mutex exists
	CHECKED( pthread_mutexattr_destroy( &mattr ) );

	CHECKED( pthread_cond_init( &cond, (const pthread_condattr_t *)0p ) );  // workaround trac#208: cast should not be required
	val = 0;
}
|---|
|  | 135 |  | 
|---|
// Destructor: tear down the mutex, then the condition variable.
// A non-zero result from either call aborts through CHECKED.
static inline void ^?{}(__bin_sem_t & this) with( this ) {
	CHECKED( pthread_mutex_destroy( &lock ) );
	CHECKED( pthread_cond_destroy( &cond ) );
}
|---|
|  | 140 |  | 
|---|
// Block until the semaphore value is at least 1, then decrement it.
// Every pthread call is checked, including pthread_cond_wait: if the wait itself
// failed, an unchecked loop would spin forever with val still below 1.
static inline void wait(__bin_sem_t & this) with( this ) {
	verify(__cfaabi_dbg_in_kernel());
	CHECKED( pthread_mutex_lock(&lock) );
		// re-test after every wakeup; only proceed once val has actually been raised
		while(val < 1) {
			CHECKED( pthread_cond_wait(&cond, &lock) );
		}
		val -= 1;
	CHECKED( pthread_mutex_unlock(&lock) );
}
|---|
|  | 150 |  | 
|---|
// Raise the semaphore value to 1 if it is currently below 1 and signal the condition variable.
// Returns true when the value was raised (and a signal sent), false when it was already
// at 1 and nothing changed.
// Every pthread call is checked, including pthread_cond_signal.
static inline bool post(__bin_sem_t & this) with( this ) {
	bool needs_signal = false;

	CHECKED( pthread_mutex_lock(&lock) );
		if(val < 1) {
			val += 1;
			CHECKED( pthread_cond_signal(&cond) );
			needs_signal = true;
		}
	CHECKED( pthread_mutex_unlock(&lock) );

	return needs_signal;
}
|---|
| [c66f6cb] | 164 |  | 
|---|
|  | 165 | #undef CHECKED | 
|---|
| [e0f93e0] | 166 |  | 
|---|
// Forward declarations used by single_sem; the definitions live outside this header.
struct $thread;

extern void park( __cfaabi_dbg_ctx_param );
extern void unpark( struct $thread * this __cfaabi_dbg_ctx_param2 );

static inline struct $thread * active_thread ();
|---|
|  | 171 |  | 
|---|
// Semaphore which only supports a single thread.
// ptr takes one of three values: 0p (nothing pending), 1p (a post is pending),
// or the address of the thread parked in wait().
struct single_sem {
	struct $thread * volatile ptr;
};
|---|
|  | 176 |  | 
|---|
static inline {
	// Constructor: no post pending, no thread waiting.
	void  ?{}(single_sem & this) {
		this.ptr = 0p;
	}

	// Destructor: nothing to release.
	void ^?{}(single_sem & this) {}

	// Wait on the semaphore.
	// Returns false if a post was already pending (it is consumed and park() is not called);
	// returns true if this thread registered itself in ptr and went through park().
	// Each compare-and-swap that loses a race restarts from a fresh read of ptr.
	bool wait(single_sem & this) {
		for() {
			struct $thread * observed = this.ptr;

			if(observed != 1p) {
				// no post pending: publish the current thread, then park
				/* paranoid */ verify( observed == 0p );
				if(__atomic_compare_exchange_n(&this.ptr, &observed, active_thread(), false, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST)) {
					park( __cfaabi_dbg_ctx );
					return true;
				}
				continue;
			}

			// post pending: consume it
			if(__atomic_compare_exchange_n(&this.ptr, &observed, 0p, false, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST)) {
				return false;
			}
		}
	}

	// Post to the semaphore.
	// Returns true only when a registered waiter was found and handed to unpark();
	// returns false when a post was already pending or when this call recorded a new one.
	// Each compare-and-swap that loses a race restarts from a fresh read of ptr.
	bool post(single_sem & this) {
		for() {
			struct $thread * observed = this.ptr;

			// a post is already pending: nothing to add
			if(observed == 1p) return false;

			if(observed != 0p) {
				// a thread is registered: clear the slot and wake it
				if(__atomic_compare_exchange_n(&this.ptr, &observed, 0p, false, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST)) {
					unpark( observed __cfaabi_dbg_ctx2 );
					return true;
				}
				continue;
			}

			// nobody waiting: record the post for a later wait()
			if(__atomic_compare_exchange_n(&this.ptr, &observed, 1p, false, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST)) {
				return false;
			}
		}
	}
}
|---|
| [b158d8f] | 221 | #endif | 
|---|