Timestamp: Aug 31, 2023, 11:31:15 PM (2 years ago)
Author: JiadaL <j82liang@…>
Branches: master
Children: 950c58e
Parents: 92355883 (diff), 686912c (diff)
Note: this is a merge changeset; the changes displayed below correspond to the merge itself.
Use the (diff) links above to see all the changes relative to each parent.
Message: Resolve conflict
Location: libcfa/src/concurrency
Files: 17 edited

Legend:

Hunks are shown in unified-diff form: '-' lines were removed (r92355883), '+' lines were added
(r2a301ff), and lines prefixed with a space are unchanged context. Most of this merge re-indents
code from spaces to tabs; such whitespace-only changes are shown once, as context, rather than as
removed/added pairs.
  • libcfa/src/concurrency/actor.hfa

--- libcfa/src/concurrency/actor.hfa	(r92355883)
+++ libcfa/src/concurrency/actor.hfa	(r2a301ff)
@@ -39,4 +39,9 @@
 // #define ACTOR_STATS
 
+// used to run and only track missed queue gulps
+#ifdef ACTOR_STATS
+#define ACTOR_STATS_QUEUE_MISSED
+#endif
+
 // forward decls
 struct actor;
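
Note on the new flag: ACTOR_STATS_QUEUE_MISSED decouples the missed-gulp counter from the rest of the
statistics machinery. Defining ACTOR_STATS implies it, so the full report still includes missed gulps;
defining only ACTOR_STATS_QUEUE_MISSED compiles in just the work_queue missed field and the bare count
printed at executor teardown (the #ifndef ACTOR_STATS branch further down). Schematically:

    // ACTOR_STATS defined            => ACTOR_STATS_QUEUE_MISSED also defined; full formatted report
    // ACTOR_STATS_QUEUE_MISSED only  => only work_queue.missed and printf("\t%lu", misses) compiled in
    // neither defined                => no statistics code compiled in

Note that in this revision the missed++ in transfer() and the missed = 0 initialization appear to remain
guarded by ACTOR_STATS, so the counter only advances when full statistics are enabled.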
     
@@ -48,22 +53,22 @@
 typedef allocation (*__receive_fn)(actor &, message &, actor **, message **);
 struct request {
 	actor * receiver;
 	message * msg;
 	__receive_fn fn;
 };
 
 struct a_msg {
 	int m;
 };
 static inline void ?{}( request & this ) {}
 static inline void ?{}( request & this, actor * receiver, message * msg, __receive_fn fn ) {
 	this.receiver = receiver;
 	this.msg = msg;
 	this.fn = fn;
 }
 static inline void ?{}( request & this, request & copy ) {
 	this.receiver = copy.receiver;
 	this.msg = copy.msg;
 	this.fn = copy.fn;
 }
 
     
@@ -71,30 +76,30 @@
 // assumes gulping behaviour (once a remove occurs, removes happen until empty before next insert)
 struct copy_queue {
 	request * buffer;
 	size_t count, buffer_size, index, utilized, last_size;
 };
 static inline void ?{}( copy_queue & this ) {}
 static inline void ?{}( copy_queue & this, size_t buf_size ) with(this) {
 	buffer_size = buf_size;
 	buffer = aalloc( buffer_size );
 	count = 0;
 	utilized = 0;
 	index = 0;
 	last_size = 0;
 }
 static inline void ^?{}( copy_queue & this ) with(this) {
 	DEBUG_ABORT( count != 0, "Actor system terminated with messages sent but not received\n" );
 	adelete(buffer);
 }
 
 static inline void insert( copy_queue & this, request & elem ) with(this) {
 	if ( count >= buffer_size ) { // increase arr size
 		last_size = buffer_size;
 		buffer_size = 2 * buffer_size;
 		buffer = realloc( buffer, sizeof( request ) * buffer_size );
 		/* paranoid */ verify( buffer );
 	}
 	memcpy( &buffer[count], &elem, sizeof(request) );
 	count++;
 }
 
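
For orientation, the copy_queue above is a growable array of requests with gulp semantics: inserts double
the buffer when full, and once draining starts it must run to empty before the next insert. A minimal
usage sketch, assuming CFA constructor-call initialization (this is an internal API, not normally called
from user code):

    copy_queue q = { 4 };			// sizing ctor: room for 4 requests
    request r;					// default request
    for ( i; 10 ) insert( q, r );		// buffer doubles 4 -> 8 -> 16 as count hits capacity
    while ( q.count > 0 ) remove( q );		// gulped: removes run until empty before any new insert
    						// the dtor (in debug) aborts if requests remain unreceived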
     
@@ -102,20 +107,20 @@
 // it is not supported to call insert() before the array is fully empty
 static inline request & remove( copy_queue & this ) with(this) {
 	if ( count > 0 ) {
 		count--;
 		size_t old_idx = index;
 		index = count == 0 ? 0 : index + 1;
 		return buffer[old_idx];
 	}
 	request * ret = 0p;
 	return *0p;
 }
 
 // try to reclaim some memory if less than half of buffer is utilized
 static inline void reclaim( copy_queue & this ) with(this) {
 	if ( utilized >= last_size || buffer_size <= 4 ) { utilized = 0; return; }
 	utilized = 0;
 	buffer_size--;
 	buffer = realloc( buffer, sizeof( request ) * buffer_size ); // try to reclaim some memory
 }
 
     
@@ -123,22 +128,24 @@
 
 struct work_queue {
 	__spinlock_t mutex_lock;
 	copy_queue * owned_queue;			// copy queue allocated and cleaned up by this work_queue
 	copy_queue * c_queue;				// current queue
 	volatile bool being_processed;			// flag to prevent concurrent processing
 	#ifdef ACTOR_STATS
 	unsigned int id;
-	size_t missed;					// transfers skipped due to being_processed flag being up
 	#endif
+	#ifdef ACTOR_STATS_QUEUE_MISSED
+	size_t missed;					// transfers skipped due to being_processed flag being up
+	#endif
 }; // work_queue
 static inline void ?{}( work_queue & this, size_t buf_size, unsigned int i ) with(this) {
 	owned_queue = alloc();				// allocated separately to avoid false sharing
 	(*owned_queue){ buf_size };
 	c_queue = owned_queue;
 	being_processed = false;
 	#ifdef ACTOR_STATS
 	id = i;
 	missed = 0;
 	#endif
 }
 
     
@@ -147,55 +154,55 @@
 
 static inline void insert( work_queue & this, request & elem ) with(this) {
 	lock( mutex_lock __cfaabi_dbg_ctx2 );
 	insert( *c_queue, elem );
 	unlock( mutex_lock );
 } // insert
 
 static inline void transfer( work_queue & this, copy_queue ** transfer_to ) with(this) {
 	lock( mutex_lock __cfaabi_dbg_ctx2 );
 	#ifdef __STEAL
 
 	// check if queue is being processed elsewhere
 	if ( unlikely( being_processed ) ) {
 		#ifdef ACTOR_STATS
 		missed++;
 		#endif
 		unlock( mutex_lock );
 		return;
 	}
 
 	being_processed = c_queue->count != 0;
 	#endif // __STEAL
 
 	c_queue->utilized = c_queue->count;
 
 	// swap copy queue ptrs
 	copy_queue * temp = *transfer_to;
 	*transfer_to = c_queue;
 	c_queue = temp;
 	unlock( mutex_lock );
 } // transfer
 
 // needed since some info needs to persist past worker lifetimes
 struct worker_info {
 	volatile unsigned long long stamp;
 	#ifdef ACTOR_STATS
 	size_t stolen_from, try_steal, stolen, empty_stolen, failed_swaps, msgs_stolen;
 	unsigned long long processed;
 	size_t gulps;
 	#endif
 };
 static inline void ?{}( worker_info & this ) {
 	#ifdef ACTOR_STATS
 	this.stolen_from = 0;
 	this.try_steal = 0;				// attempts to steal
 	this.stolen = 0;				// successful steals
 	this.processed = 0;				// requests processed
 	this.gulps = 0;					// number of gulps
 	this.failed_swaps = 0;				// steal swap failures
 	this.empty_stolen = 0;				// queues empty after steal
 	this.msgs_stolen = 0;				// number of messages stolen
 	#endif
 	this.stamp = rdtscl();
 }
 
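
The transfer() above implements the "gulp": under the queue's spinlock it swaps the producer-side buffer
with the caller's empty one, so the worker drains an entire batch without holding the lock. A schematic of
the caller side (my_empty_queue is a hypothetical worker-local buffer; is_empty is defined elsewhere in
actor.hfa):

    copy_queue * mine = &my_empty_queue;	// worker's empty buffer
    transfer( wq, &mine );			// swap: wq keeps the empty buffer, mine now holds the batch
    while ( ! is_empty( *mine ) ) {
    	request & r = remove( *mine );		// drain lock-free; no inserts happen to this buffer
    	deliver_request( r );
    }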
     
@@ -205,9 +212,9 @@
 // #endif
 thread worker {
 	work_queue ** request_queues;
 	copy_queue * current_queue;
 	executor * executor_;
 	unsigned int start, range;
 	int id;
 };
 
     
@@ -215,29 +222,29 @@
 // aggregate counters for statistics
 size_t __total_tries = 0, __total_stolen = 0, __total_workers, __all_gulps = 0, __total_empty_stolen = 0,
 	__total_failed_swaps = 0, __all_processed = 0, __num_actors_stats = 0, __all_msgs_stolen = 0;
 #endif
 static inline void ?{}( worker & this, cluster & clu, work_queue ** request_queues, copy_queue * current_queue, executor * executor_,
 	unsigned int start, unsigned int range, int id ) {
 	((thread &)this){ clu };
 	this.request_queues = request_queues;		// array of all queues
 	this.current_queue = current_queue;		// currently gulped queue (start with empty queue to use in swap later)
 	this.executor_ = executor_;			// pointer to current executor
 	this.start = start;				// start of worker's subrange of request_queues
 	this.range = range;				// size of worker's subrange of request_queues
 	this.id = id;					// worker's id and index in array of workers
 }
 
 static bool no_steal = false;
 struct executor {
 	cluster * cluster;				// if workers execute on separate cluster
 	processor ** processors;			// array of virtual processors adding parallelism for workers
 	work_queue * request_queues;			// master array of work request queues
 	copy_queue * local_queues;			// array of all worker local queues to avoid deletion race
 	work_queue ** worker_req_queues;		// secondary array of work queues to allow for swapping
 	worker ** workers;				// array of workers executing work requests
 	worker_info * w_infos;				// array of info about each worker
 	unsigned int nprocessors, nworkers, nrqueues;	// number of processors/threads/request queues
 	bool seperate_clus;				// use same or separate cluster for executor
 	volatile bool is_shutdown;			// flag to communicate shutdown to worker threads
 }; // executor
 
     
@@ -246,79 +253,79 @@
 // #endif
 static inline void ^?{}( worker & mutex this ) with(this) {
 	#ifdef ACTOR_STATS
 	__atomic_add_fetch(&__all_gulps, executor_->w_infos[id].gulps,__ATOMIC_SEQ_CST);
 	__atomic_add_fetch(&__all_processed, executor_->w_infos[id].processed,__ATOMIC_SEQ_CST);
 	__atomic_add_fetch(&__all_msgs_stolen, executor_->w_infos[id].msgs_stolen,__ATOMIC_SEQ_CST);
 	__atomic_add_fetch(&__total_tries, executor_->w_infos[id].try_steal, __ATOMIC_SEQ_CST);
 	__atomic_add_fetch(&__total_stolen, executor_->w_infos[id].stolen, __ATOMIC_SEQ_CST);
 	__atomic_add_fetch(&__total_failed_swaps, executor_->w_infos[id].failed_swaps, __ATOMIC_SEQ_CST);
 	__atomic_add_fetch(&__total_empty_stolen, executor_->w_infos[id].empty_stolen, __ATOMIC_SEQ_CST);
 
 	// per worker steal stats (uncomment alongside the lock above this routine to print)
 	// lock( out_lock __cfaabi_dbg_ctx2 );
 	// printf("Worker id: %d, processed: %llu messages, attempted %lu, stole: %lu, stolen from: %lu\n", id, processed, try_steal, stolen, __atomic_add_fetch(&executor_->w_infos[id].stolen_from, 0, __ATOMIC_SEQ_CST) );
 	// int count = 0;
 	// int count2 = 0;
 	// for ( i; range ) {
 	//	if ( replaced_queue[start + i] > 0 ){
 	//		count++;
 	//		// printf("%d: %u, ",i, replaced_queue[i]);
 	//	}
 	//	if (__atomic_add_fetch(&stolen_arr[start + i],0,__ATOMIC_SEQ_CST) > 0)
 	//		count2++;
 	// }
 	// printf("swapped with: %d of %u indices\n", count, executor_->nrqueues / executor_->nworkers );
 	// printf("%d of %u indices were stolen\n", count2, executor_->nrqueues / executor_->nworkers );
 	// unlock( out_lock );
 	#endif
 }
 
 static inline void ?{}( executor & this, unsigned int nprocessors, unsigned int nworkers, unsigned int nrqueues, bool seperate_clus, size_t buf_size ) with(this) {
 	if ( nrqueues < nworkers ) abort( "nrqueues needs to be >= nworkers\n" );
 	this.nprocessors = nprocessors;
 	this.nworkers = nworkers;
 	this.nrqueues = nrqueues;
 	this.seperate_clus = seperate_clus;
 	this.is_shutdown = false;
 
 	if ( nworkers == nrqueues )
 		no_steal = true;
 
 	#ifdef ACTOR_STATS
 	// stolen_arr = aalloc( nrqueues );
 	// replaced_queue = aalloc( nrqueues );
 	__total_workers = nworkers;
 	#endif
 
 	if ( seperate_clus ) {
 		cluster = alloc();
 		(*cluster){};
 	} else cluster = active_cluster();
 
 	request_queues = aalloc( nrqueues );
 	worker_req_queues = aalloc( nrqueues );
 	for ( i; nrqueues ) {
 		request_queues[i]{ buf_size, i };
 		worker_req_queues[i] = &request_queues[i];
 	}
 
 	processors = aalloc( nprocessors );
 	for ( i; nprocessors )
 		(*(processors[i] = alloc())){ *cluster };
 
 	local_queues = aalloc( nworkers );
 	workers = aalloc( nworkers );
 	w_infos = aalloc( nworkers );
 	unsigned int reqPerWorker = nrqueues / nworkers, extras = nrqueues % nworkers;
 
 	for ( i; nworkers ) {
 		w_infos[i]{};
 		local_queues[i]{ buf_size };
 	}
 
 	for ( unsigned int i = 0, start = 0, range; i < nworkers; i += 1, start += range ) {
 		range = reqPerWorker + ( i < extras ? 1 : 0 );
 		(*(workers[i] = alloc())){ *cluster, worker_req_queues, &local_queues[i], &this, start, range, i };
 	} // for
 }
 static inline void ?{}( executor & this, unsigned int nprocessors, unsigned int nworkers, unsigned int nrqueues, bool seperate_clus ) { this{ nprocessors, nworkers, nrqueues, seperate_clus, __DEFAULT_EXECUTOR_BUFSIZE__ }; }
     
@@ -329,41 +336,47 @@
 
 static inline void ^?{}( executor & this ) with(this) {
 	is_shutdown = true;
 
 	for ( i; nworkers )
 		delete( workers[i] );
 
 	for ( i; nprocessors ) {
 		delete( processors[i] );
 	} // for
 
-	#ifdef ACTOR_STATS
+	#ifdef ACTOR_STATS_QUEUE_MISSED
 	size_t misses = 0;
 	for ( i; nrqueues ) {
 		misses += worker_req_queues[i]->missed;
 	}
 	// adelete( stolen_arr );
 	// adelete( replaced_queue );
 	#endif
 
 	adelete( workers );
 	adelete( w_infos );
 	adelete( local_queues );
 	adelete( request_queues );
 	adelete( worker_req_queues );
 	adelete( processors );
 	if ( seperate_clus ) delete( cluster );
 
 	#ifdef ACTOR_STATS // print formatted stats
 	printf("        Actor System Stats:\n");
 	printf("\tActors Created:\t\t\t\t%lu\n\tMessages Sent:\t\t\t\t%lu\n", __num_actors_stats, __all_processed);
 	size_t avg_gulps = __all_gulps == 0 ? 0 : __all_processed / __all_gulps;
 	printf("\tGulps:\t\t\t\t\t%lu\n\tAverage Gulp Size:\t\t\t%lu\n\tMissed gulps:\t\t\t\t%lu\n", __all_gulps, avg_gulps, misses);
 	printf("\tSteal attempts:\t\t\t\t%lu\n\tSteals:\t\t\t\t\t%lu\n\tSteal failures (no candidates):\t\t%lu\n\tSteal failures (failed swaps):\t\t%lu\t Empty steals:\t\t%lu\n",
 		__total_tries, __total_stolen, __total_tries - __total_stolen - __total_failed_swaps, __total_failed_swaps, __total_empty_stolen);
 	size_t avg_steal = __total_stolen == 0 ? 0 : __all_msgs_stolen / __total_stolen;
 	printf("\tMessages stolen:\t\t\t%lu\n\tAverage steal size:\t\t\t%lu\n", __all_msgs_stolen, avg_steal);
 	#endif
 
+	#ifndef ACTOR_STATS
+	#ifdef ACTOR_STATS_QUEUE_MISSED
+	printf("\t%lu", misses);
+	#endif
+	#endif
 }
 
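
To obtain the formatted report above, uncomment the // #define ACTOR_STATS near the top of actor.hfa
(line 39 in the new revision); with only ACTOR_STATS_QUEUE_MISSED defined, the destructor instead prints
the raw miss count via the bare printf in the #ifndef ACTOR_STATS branch:

    // near the top of actor.hfa (r2a301ff):
    #define ACTOR_STATS				// enables the formatted statistics report at executor teardown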
     
@@ -372,94 +385,105 @@
 
 static inline size_t __get_next_ticket( executor & this ) with(this) {
 	#ifdef __CFA_DEBUG__
 	size_t temp = __atomic_fetch_add( &__next_ticket, 1, __ATOMIC_SEQ_CST) % nrqueues;
 
 	// reserve MAX for dead actors
 	if ( unlikely( temp == MAX ) ) temp = __atomic_fetch_add( &__next_ticket, 1, __ATOMIC_SEQ_CST) % nrqueues;
 	return temp;
 	#else
 	return __atomic_fetch_add( &__next_ticket, 1, __ATOMIC_RELAXED) % nrqueues;
 	#endif
 } // tickets
 
 // TODO: update globals in this file to be static fields once the static fields project is done
 static executor * __actor_executor_ = 0p;
 static bool __actor_executor_passed = false;		// was an executor passed to start_actor_system
 static size_t __num_actors_ = 0;			// number of actor objects in system
 static struct thread$ * __actor_executor_thd = 0p;	// used to wake executor after actors finish
 struct actor {
 	size_t ticket;					// executor-queue handle
-	allocation allocation_;				// allocation action
+	allocation alloc;				// allocation action
 	inline virtual_dtor;
 };
 
 static inline void ?{}( actor & this ) with(this) {
 	// Once an actor is allocated it must be sent a message or the actor system cannot stop. Hence, its receive
 	// member must be called to end it
 	DEBUG_ABORT( __actor_executor_ == 0p, "Creating actor before calling start_actor_system() can cause undefined behaviour.\n" );
-	allocation_ = Nodelete;
+	alloc = Nodelete;
 	ticket = __get_next_ticket( *__actor_executor_ );
 	__atomic_fetch_add( &__num_actors_, 1, __ATOMIC_RELAXED );
 	#ifdef ACTOR_STATS
 	__atomic_fetch_add( &__num_actors_stats, 1, __ATOMIC_SEQ_CST );
 	#endif
 }
 
 static inline void check_actor( actor & this ) {
-	if ( this.allocation_ != Nodelete ) {
-		switch( this.allocation_ ) {
+	if ( this.alloc != Nodelete ) {
+		switch( this.alloc ) {
 			case Delete: delete( &this ); break;
 			case Destroy:
 				CFA_DEBUG( this.ticket = MAX; );	// mark as terminated
 				^?{}(this);
 				break;
 			case Finished:
 				CFA_DEBUG( this.ticket = MAX; );	// mark as terminated
 				break;
 			default: ;				// stop warning
 		}
 
 		if ( unlikely( __atomic_add_fetch( &__num_actors_, -1, __ATOMIC_RELAXED ) == 0 ) ) { // all actors have terminated
 			unpark( __actor_executor_thd );
 		}
 	}
 }
 
 struct message {
-	allocation allocation_;				// allocation action
+	allocation alloc;				// allocation action
 	inline virtual_dtor;
 };
 
 static inline void ?{}( message & this ) {
-	this.allocation_ = Nodelete;
+	this.alloc = Nodelete;
 }
 static inline void ?{}( message & this, allocation alloc ) {
-	memcpy( &this.allocation_, &alloc, sizeof(allocation) );	// optimization to elide ctor
-	DEBUG_ABORT( this.allocation_ == Finished, "The Finished allocation status is not supported for message types.\n" );
+	memcpy( &this.alloc, &alloc, sizeof(allocation) );	// optimization to elide ctor
+	CFA_DEBUG( if ( this.alloc == Finished ) this.alloc = Nodelete; );
 }
 static inline void ^?{}( message & this ) with(this) {
-	CFA_DEBUG( if ( allocation_ == Nodelete ) printf("A message at location %p was allocated but never sent.\n", &this); )
+	CFA_DEBUG(
+		if ( alloc == Nodelete ) {
+			printf( "CFA warning (UNIX pid:%ld) : program terminating with message %p allocated but never sent.\n",
+					(long int)getpid(), &this );
+		}
+	)
 }
 
 static inline void check_message( message & this ) {
-	switch ( this.allocation_ ) {				// analyze message status
-		case Nodelete: CFA_DEBUG( this.allocation_ = Finished ); break;
+	switch ( this.alloc ) {					// analyze message status
+		case Nodelete: CFA_DEBUG( this.alloc = Finished ); break;
 		case Delete: delete( &this ); break;
 		case Destroy: ^?{}( this ); break;
 		case Finished: break;
 	} // switch
 }
-static inline void set_allocation( message & this, allocation state ) {
-	this.allocation_ = state;
+static inline allocation set_allocation( message & this, allocation state ) {
+	CFA_DEBUG( if ( state == Nodelete ) state = Finished; );
+	allocation prev = this.alloc;
+	this.alloc = state;
+	return prev;
+}
+static inline allocation get_allocation( message & this ) {
+	return this.alloc;
 }
 
 static inline void deliver_request( request & this ) {
 	DEBUG_ABORT( this.receiver->ticket == (unsigned long int)MAX, "Attempted to send message to deleted/dead actor\n" );
 	actor * base_actor;
 	message * base_msg;
 	allocation temp = this.fn( *this.receiver, *this.msg, &base_actor, &base_msg );
-	base_actor->allocation_ = temp;
+	memcpy( &base_actor->alloc, &temp, sizeof(allocation) );	// optimization to elide ctor
 	check_message( *base_msg );
 	check_actor( *base_actor );
 }
 
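
set_allocation() now returns the previous allocation action and, in debug builds, coerces Nodelete to
Finished (matching the new message constructor above). A hedged usage sketch; my_actor, my_msg, and this
receive routine are hypothetical:

    struct my_actor { inline actor; };
    struct my_msg { inline message; int i; };

    allocation receive( my_actor & this, my_msg & msg ) {
    	allocation prev = set_allocation( msg, Delete );	// msg is deleted after delivery; prev saved
    	if ( get_allocation( msg ) == Delete ) { /* ... */ }	// query the current action
    	return Nodelete;					// leave the actor alive
    }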
     
@@ -467,196 +491,200 @@
 // returns ptr to newly owned queue if swap succeeds
 static inline work_queue * try_swap_queues( worker & this, unsigned int victim_idx, unsigned int my_idx ) with(this) {
 	work_queue * my_queue = request_queues[my_idx];
 	work_queue * other_queue = request_queues[victim_idx];
 
 	// if either queue is 0p then they are in the process of being stolen
 	if ( other_queue == 0p ) return 0p;
 
 	// try to set our queue ptr to be 0p. If it fails someone moved our queue so return false
 	if ( !__atomic_compare_exchange_n( &request_queues[my_idx], &my_queue, 0p, false, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST ) )
 		return 0p;
 
 	// try to set other queue ptr to be our queue ptr. If it fails someone moved the other queue so fix up then return false
 	if ( !__atomic_compare_exchange_n( &request_queues[victim_idx], &other_queue, my_queue, false, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST ) ) {
 		/* paranoid */ verify( request_queues[my_idx] == 0p );
 		request_queues[my_idx] = my_queue; // reset my queue ptr back to appropriate val
 		return 0p;
 	}
 
 	// we have successfully swapped and since our queue is 0p no one will touch it so write back new queue ptr non atomically
 	request_queues[my_idx] = other_queue; // last write does not need to be atomic
 	return other_queue;
 }
 
 // once a worker to steal from has been chosen, choose queue to steal from
 static inline void choose_queue( worker & this, unsigned int victim_id, unsigned int swap_idx ) with(this) {
 	// have to calculate victim start and range since victim may be deleted before us in shutdown
 	const unsigned int queues_per_worker = executor_->nrqueues / executor_->nworkers;
 	const unsigned int extras = executor_->nrqueues % executor_->nworkers;
 	unsigned int vic_start, vic_range;
 	if ( extras > victim_id  ) {
 		vic_range = queues_per_worker + 1;
 		vic_start = vic_range * victim_id;
 	} else {
 		vic_start = extras + victim_id * queues_per_worker;
 		vic_range = queues_per_worker;
 	}
 	unsigned int start_idx = prng( vic_range );
 
 	unsigned int tries = 0;
 	work_queue * curr_steal_queue;
 
 	for ( unsigned int i = start_idx; tries < vic_range; i = (i + 1) % vic_range ) {
 		tries++;
 		curr_steal_queue = request_queues[ i + vic_start ];
 		// avoid empty queues and queues that are being operated on
 		if ( curr_steal_queue == 0p || curr_steal_queue->being_processed || is_empty( *curr_steal_queue->c_queue ) )
 			continue;
 
 		#ifdef ACTOR_STATS
 		curr_steal_queue = try_swap_queues( this, i + vic_start, swap_idx );
 		if ( curr_steal_queue ) {
 			executor_->w_infos[id].msgs_stolen += curr_steal_queue->c_queue->count;
 			executor_->w_infos[id].stolen++;
 			if ( is_empty( *curr_steal_queue->c_queue ) ) executor_->w_infos[id].empty_stolen++;
 			// __atomic_add_fetch(&executor_->w_infos[victim_id].stolen_from, 1, __ATOMIC_RELAXED);
 			// replaced_queue[swap_idx]++;
 			// __atomic_add_fetch(&stolen_arr[ i + vic_start ], 1, __ATOMIC_RELAXED);
 		} else {
 			executor_->w_infos[id].failed_swaps++;
 		}
 		#else
 		curr_steal_queue = try_swap_queues( this, i + vic_start, swap_idx );
 		#endif // ACTOR_STATS
 
 		return;
 	}
 
 	return;
 }
 
 // choose a worker to steal from
 static inline void steal_work( worker & this, unsigned int swap_idx ) with(this) {
 	#if RAND
 	unsigned int victim = prng( executor_->nworkers );
 	if ( victim == id ) victim = ( victim + 1 ) % executor_->nworkers;
 	choose_queue( this, victim, swap_idx );
 	#elif SEARCH
 	unsigned long long min = MAX; // smaller timestamp means longer since service
 	int min_id = 0; // use ints not uints to avoid integer underflow without hacky math
 	int n_workers = executor_->nworkers;
 	unsigned long long curr_stamp;
 	int scount = 1;
 	for ( int i = (id + 1) % n_workers; scount < n_workers; i = (i + 1) % n_workers, scount++ ) {
 		curr_stamp = executor_->w_infos[i].stamp;
 		if ( curr_stamp < min ) {
 			min = curr_stamp;
 			min_id = i;
 		}
 	}
 	choose_queue( this, min_id, swap_idx );
 	#endif
 }
 
 #define CHECK_TERMINATION if ( unlikely( executor_->is_shutdown ) ) break Exit
 void main( worker & this ) with(this) {
 	// #ifdef ACTOR_STATS
 	// for ( i; executor_->nrqueues ) {
 	//	replaced_queue[i] = 0;
 	//	__atomic_store_n( &stolen_arr[i], 0, __ATOMIC_SEQ_CST );
 	// }
 	// #endif
 
 	// threshold of empty queues we see before we go stealing
 	const unsigned int steal_threshold = 2 * range;
 
 	// Store variable data here instead of worker struct to avoid any potential false sharing
 	unsigned int empty_count = 0;
 	request & req;
 	work_queue * curr_work_queue;
 
 	Exit:
 	for ( unsigned int i = 0;; i = (i + 1) % range ) {	// cycle through set of request buffers
 		curr_work_queue = request_queues[i + start];
 
+	#ifndef __STEAL
+	CHECK_TERMINATION;
+	#endif
+
 		// check if queue is empty before trying to gulp it
 		if ( is_empty( *curr_work_queue->c_queue ) ) {
 			#ifdef __STEAL
 			empty_count++;
 			if ( empty_count < steal_threshold ) continue;
 			#else
 			continue;
 			#endif
 		}
 		transfer( *curr_work_queue, &current_queue );
 		#ifdef ACTOR_STATS
 		executor_->w_infos[id].gulps++;
 		#endif // ACTOR_STATS
 		#ifdef __STEAL
 		if ( is_empty( *current_queue ) ) {
 			if ( unlikely( no_steal ) ) { CHECK_TERMINATION; continue; }
 			empty_count++;
 			if ( empty_count < steal_threshold ) continue;
 			empty_count = 0;
 
 			CHECK_TERMINATION; // check for termination
 
 			__atomic_store_n( &executor_->w_infos[id].stamp, rdtscl(), __ATOMIC_RELAXED );
 
 			#ifdef ACTOR_STATS
 			executor_->w_infos[id].try_steal++;
 			#endif // ACTOR_STATS
 
 			steal_work( this, start + prng( range ) );
 			continue;
 		}
 		#endif // __STEAL
 		while ( ! is_empty( *current_queue ) ) {
 			#ifdef ACTOR_STATS
 			executor_->w_infos[id].processed++;
 			#endif
 			&req = &remove( *current_queue );
 			if ( !&req ) continue;
 			deliver_request( req );
 		}
 		#ifdef __STEAL
 		curr_work_queue->being_processed = false;	// set done processing
 		empty_count = 0; // we found work so reset empty counter
 		#endif
 
 		CHECK_TERMINATION;
 
 		// potentially reclaim some of the current queue's vector space if it is unused
 		reclaim( *current_queue );
 	} // for
 }
 
 static inline void send( executor & this, request & req, unsigned long int ticket ) with(this) {
 	insert( request_queues[ticket], req);
 }
 
 static inline void send( actor & this, request & req ) {
 	DEBUG_ABORT( this.ticket == (unsigned long int)MAX, "Attempted to send message to deleted/dead actor\n" );
 	send( *__actor_executor_, req, this.ticket );
 }
 
 static inline void __reset_stats() {
 	#ifdef ACTOR_STATS
 	__total_tries = 0;
 	__total_stolen = 0;
 	__all_gulps = 0;
 	__total_failed_swaps = 0;
 	__total_empty_stolen = 0;
 	__all_processed = 0;
 	__num_actors_stats = 0;
 	__all_msgs_stolen = 0;
 	#endif
 }
 
 static inline void start_actor_system( size_t num_thds ) {
 	__reset_stats();
 	__actor_executor_thd = active_thread();
 	__actor_executor_ = alloc();
 	(*__actor_executor_){ 0, num_thds, num_thds == 1 ? 1 : num_thds * 16 };
 }
 
     
    664692
    665693static inline void start_actor_system( executor & this ) {
    666     __reset_stats();
    667     __actor_executor_thd = active_thread();
    668     __actor_executor_ = &this;
    669     __actor_executor_passed = true;
     694        __reset_stats();
     695        __actor_executor_thd = active_thread();
     696        __actor_executor_ = &this;
     697        __actor_executor_passed = true;
    670698}
    671699
    672700static inline void stop_actor_system() {
    673     park( ); // will be unparked when actor system is finished
    674 
    675     if ( !__actor_executor_passed ) delete( __actor_executor_ );
    676     __actor_executor_ = 0p;
    677     __actor_executor_thd = 0p;
    678     __next_ticket = 0;
    679     __actor_executor_passed = false;
     701        park();                                                                                         // unparked when actor system is finished
     702
     703        if ( !__actor_executor_passed ) delete( __actor_executor_ );
     704        __actor_executor_ = 0p;
     705        __actor_executor_thd = 0p;
     706        __next_ticket = 0;
     707        __actor_executor_passed = false;
    680708}
    681709
    682710// Default messages to send to any actor to change status
    683711// assigned at creation to __base_msg_finished to avoid unused message warning
    684 message __base_msg_finished @= { .allocation_ : Finished };
    685 struct __delete_msg_t { inline message; } delete_msg = __base_msg_finished;
    686 struct __destroy_msg_t { inline message; } destroy_msg = __base_msg_finished;
    687 struct __finished_msg_t { inline message; } finished_msg = __base_msg_finished;
    688 
    689 allocation receive( actor & this, __delete_msg_t & msg ) { return Delete; }
    690 allocation receive( actor & this, __destroy_msg_t & msg ) { return Destroy; }
    691 allocation receive( actor & this, __finished_msg_t & msg ) { return Finished; }
    692 
     712message __base_msg_finished @= { .alloc : Finished };
     713struct delete_msg_t { inline message; } delete_msg = __base_msg_finished;
     714struct destroy_msg_t { inline message; } destroy_msg = __base_msg_finished;
     715struct finished_msg_t { inline message; } finished_msg = __base_msg_finished;
     716
     717allocation receive( actor & this, delete_msg_t & msg ) { return Delete; }
     718allocation receive( actor & this, destroy_msg_t & msg ) { return Destroy; }
     719allocation receive( actor & this, finished_msg_t & msg ) { return Finished; }
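The renamed default messages (delete_msg, destroy_msg, finished_msg) and the start/stop routines above combine into a short lifecycle. The following is a minimal usage sketch, not part of this changeset: the counter/tick types are hypothetical, and the '|' send operator and the Nodelete allocation status are assumed from the wider actor API rather than shown in this hunk.

    struct counter { inline actor; };                  // hypothetical actor type
    struct tick { inline message; int n; };            // hypothetical message type

    allocation receive( counter & this, tick & msg ) {
        msg.n++;
        return msg.n < 10 ? Nodelete : Finished;       // Nodelete (assumed) keeps actor and message alive
    }

    int main() {
        start_actor_system( 4 );                       // 4 worker threads; 4 * 16 request queues per the ctor above
        counter c;
        tick t;  t.n = 0;
        c | t;                                         // assumed send operator: routes t to c's ticketed queue
        c | finished_msg;                              // default message: retire c once t is processed
        stop_actor_system();                           // parks until the executor drains all queues
    }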
  • libcfa/src/concurrency/alarm.hfa

    r92355883 r2a301ff  
    1010// Created On       : Fri Jun 2 11:31:25 2017
    1111// Last Modified By : Peter A. Buhr
    12 // Last Modified On : Mon Mar 26 16:25:41 2018
    13 // Update Count     : 11
     12// Last Modified On : Wed Aug 30 21:27:40 2023
     13// Update Count     : 12
    1414//
    1515
     
    2323#include "time.hfa"
    2424
    25 #include "containers/list.hfa"
     25#include "collections/list.hfa"
    2626
    2727struct thread$;
  • libcfa/src/concurrency/channel.hfa

    r92355883 r2a301ff  
    6868    #endif
    6969};
     70static inline void ?{}( channel(T) & this, channel(T) this2 ) = void;
     71static inline void ?=?( channel(T) & this, channel(T) this2 ) = void;
    7072
    7173static inline void ?{}( channel(T) &c, size_t _size ) with(c) {
     
    326328    return retval;
    327329}
     330static inline void remove( channel(T) & chan ) { T elem = (T)remove( chan ); }
     331
     332
     333///////////////////////////////////////////////////////////////////////////////////////////
     334// The following is Go-style operator support for channels
     335///////////////////////////////////////////////////////////////////////////////////////////
     336
     337static inline void ?<<?( channel(T) & chan, T elem ) { insert( chan, elem ); }
     338static inline void ?<<?( T & ret, channel(T) & chan ) { ret = remove( chan ); }
    328339
    329340///////////////////////////////////////////////////////////////////////////////////////////
     
    340351    unlock( mutex_lock );
    341352
    342     // only return true when not special OR case, not exceptional calse and status is SAT
    343     return ( node.extra == 0p || !node.park_counter ) ? false : *node.clause_status == __SELECT_SAT;
     353    // only return true when not special OR case and status is SAT
     354    return !node.park_counter ? false : *node.clause_status == __SELECT_SAT;
    344355}
    345356
     
    363374// type used by select statement to capture a chan read as the selected operation
    364375struct chan_read {
    365     T & ret;
    366     channel(T) & chan;
     376    T * ret;
     377    channel(T) * chan;
    367378};
    368 
    369 static inline void ?{}( chan_read(T) & cr, channel(T) & chan, T & ret ) {
    370     &cr.chan = &chan;
    371     &cr.ret = &ret;
    372 }
    373 static inline chan_read(T) ?<<?( T & ret, channel(T) & chan ) { chan_read(T) cr{ chan, ret }; return cr; }
    374 
    375 static inline void __handle_select_closed_read( chan_read(T) & this, select_node & node ) with(this.chan, this) {
    376     __closed_remove( chan, ret );
     379__CFA_SELECT_GET_TYPE( chan_read(T) );
     380
     381static inline void ?{}( chan_read(T) & cr, channel(T) * chan, T * ret ) {
     382    cr.chan = chan;
     383    cr.ret = ret;
     384}
     385static inline chan_read(T) ?<<?( T & ret, channel(T) & chan ) { chan_read(T) cr{ &chan, &ret }; return cr; }
     386
     387static inline void __handle_select_closed_read( chan_read(T) & this, select_node & node ) with(*this.chan, this) {
     388    __closed_remove( *chan, *ret );
    377389    // if we get here then the insert succeeded
    378390    __make_select_node_available( node );
    379391}
    380392
    381 static inline bool register_select( chan_read(T) & this, select_node & node ) with(this.chan, this) {
    382     lock( mutex_lock );
    383     node.extra = &ret; // set .extra so that if it == 0p later in on_selected it is due to channel close
     393static inline bool register_select( chan_read(T) & this, select_node & node ) with(*this.chan, this) {
     394    lock( mutex_lock );
     395    node.extra = ret; // set .extra so that if it == 0p later in on_selected it is due to channel close
    384396
    385397    #ifdef CHAN_STATS
     
    396408
    397409            if ( __handle_pending( prods, node ) ) {
    398                 __prods_handoff( chan, ret );
     410                __prods_handoff( *chan, *ret );
    399411                __make_select_node_sat( node ); // need to to mark SAT now that we know operation is done or else threads could get stuck in __mark_select_node
    400412                unlock( mutex_lock );
     
    422434    ZeroSize: if ( size == 0 && !prods`isEmpty ) {
    423435        if ( !__handle_waituntil_OR( prods ) ) break ZeroSize;
    424         __prods_handoff( chan, ret );
     436        __prods_handoff( *chan, *ret );
    425437        __set_avail_then_unlock( node, mutex_lock );
    426438        return true;
     
    439451
    440452    // Remove from buffer
    441     __do_remove( chan, ret );
     453    __do_remove( *chan, *ret );
    442454    __set_avail_then_unlock( node, mutex_lock );
    443455    return true;
    444456}
    445 static inline bool unregister_select( chan_read(T) & this, select_node & node ) { return unregister_chan( this.chan, node ); }
    446 static inline void on_selected( chan_read(T) & this, select_node & node ) with(this) {
    447     if ( node.extra == 0p ) // check if woken up due to closed channel
    448         __closed_remove( chan, ret );
     457static inline bool unregister_select( chan_read(T) & this, select_node & node ) { return unregister_chan( *this.chan, node ); }
     458static inline bool on_selected( chan_read(T) & this, select_node & node ) with(this) {
     459    if ( unlikely(node.extra == 0p) ) {
     460        if ( !exception_in_flight() ) __closed_remove( *chan, *ret ); // check if woken up due to closed channel
     461        else return false;
     462    }
    449463    // This is only reachable if not closed or closed exception was handled
    450 }
     464    return true;
     465}
     466
      467// type used by select statement to capture a chan read as the selected operation that doesn't have a parameter to read into
     468struct chan_read_no_ret {
     469    T retval;
     470    chan_read( T ) c_read;
     471};
     472__CFA_SELECT_GET_TYPE( chan_read_no_ret(T) );
     473
     474static inline void ?{}( chan_read_no_ret(T) & this, channel(T) & chan ) {
     475    this.c_read{ &chan, &this.retval };
     476}
     477
     478static inline chan_read_no_ret(T) remove( channel(T) & chan ) { chan_read_no_ret(T) c_read{ chan }; return c_read; }
     479static inline bool register_select( chan_read_no_ret(T) & this, select_node & node ) {
     480    this.c_read.ret = &this.retval;
     481    return register_select( this.c_read, node );
     482}
     483static inline bool unregister_select( chan_read_no_ret(T) & this, select_node & node ) { return unregister_select( this.c_read, node ); }
     484static inline bool on_selected( chan_read_no_ret(T) & this, select_node & node ) { return on_selected( this.c_read, node ); }
    451485
    452486// type used by select statement to capture a chan write as the selected operation
    453487struct chan_write {
    454488    T elem;
    455     channel(T) & chan;
     489    channel(T) * chan;
    456490};
    457 
    458 static inline void ?{}( chan_write(T) & cw, channel(T) & chan, T elem ) {
    459     &cw.chan = &chan;
     491__CFA_SELECT_GET_TYPE( chan_write(T) );
     492
     493static inline void ?{}( chan_write(T) & cw, channel(T) * chan, T elem ) {
     494    cw.chan = chan;
    460495    memcpy( (void *)&cw.elem, (void *)&elem, sizeof(T) );
    461496}
    462 static inline chan_write(T) ?>>?( T elem, channel(T) & chan ) { chan_write(T) cw{ chan, elem }; return cw; }
    463 
    464 static inline void __handle_select_closed_write( chan_write(T) & this, select_node & node ) with(this.chan, this) {
    465     __closed_insert( chan, elem );
     497static inline chan_write(T) ?<<?( channel(T) & chan, T elem ) { chan_write(T) cw{ &chan, elem }; return cw; }
     498static inline chan_write(T) insert( T elem, channel(T) & chan) { chan_write(T) cw{ &chan, elem }; return cw; }
     499
     500static inline void __handle_select_closed_write( chan_write(T) & this, select_node & node ) with(*this.chan, this) {
     501    __closed_insert( *chan, elem );
    466502    // if we get here then the insert succeeded
    467503    __make_select_node_available( node );
    468504}
    469505
    470 static inline bool register_select( chan_write(T) & this, select_node & node ) with(this.chan, this) {
     506static inline bool register_select( chan_write(T) & this, select_node & node ) with(*this.chan, this) {
    471507    lock( mutex_lock );
    472508    node.extra = &elem; // set .extra so that if it == 0p later in on_selected it is due to channel close
     
    486522
    487523            if ( __handle_pending( cons, node ) ) {
    488                 __cons_handoff( chan, elem );
     524                __cons_handoff( *chan, elem );
     489525                __make_select_node_sat( node ); // need to mark SAT now that we know operation is done or else threads could get stuck in __mark_select_node
    490526                unlock( mutex_lock );
     
    513549    ConsEmpty: if ( !cons`isEmpty ) {
    514550        if ( !__handle_waituntil_OR( cons ) ) break ConsEmpty;
    515         __cons_handoff( chan, elem );
     551        __cons_handoff( *chan, elem );
    516552        __set_avail_then_unlock( node, mutex_lock );
    517553        return true;
     
    530566
     531567    // otherwise carry out the write via a normal buffer insert
    532     __buf_insert( chan, elem );
     568    __buf_insert( *chan, elem );
    533569    __set_avail_then_unlock( node, mutex_lock );
    534570    return true;
    535571}
    536 static inline bool unregister_select( chan_write(T) & this, select_node & node ) { return unregister_chan( this.chan, node ); }
    537 
    538 static inline void on_selected( chan_write(T) & this, select_node & node ) with(this) {
    539     if ( node.extra == 0p ) // check if woken up due to closed channel
    540         __closed_insert( chan, elem );
    541 
     572static inline bool unregister_select( chan_write(T) & this, select_node & node ) { return unregister_chan( *this.chan, node ); }
     573
     574static inline bool on_selected( chan_write(T) & this, select_node & node ) with(this) {
     575    if ( unlikely(node.extra == 0p) ) {
     576        if ( !exception_in_flight() ) __closed_insert( *chan, elem ); // check if woken up due to closed channel
     577        else return false;
     578    }
    542579    // This is only reachable if not closed or closed exception was handled
     580    return true;
    543581}
    544582
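At the call site the Go-style operators added above read directionally: the channel on the left inserts, the channel on the right removes, and the new void remove( chan ) discards a buffered value. A small sketch, assuming a buffered channel(int); outside a waituntil the void overload of remove is assumed to be selected, while the same '<<' expressions double as waituntil clauses through the chan_read/chan_write nodes.

    int main() {
        channel( int ) ch{ 16 };       // buffered channel, capacity 16
        ch << 42;                      // insert: ?<<?( channel(T) &, T )
        ch << 7;
        int x;
        x << ch;                       // remove: ?<<?( T &, channel(T) & ); x == 42
        remove( ch );                  // discard the remaining 7 without reading it
    }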
  • libcfa/src/concurrency/coroutine.cfa

    r92355883 r2a301ff  
    2828#include "kernel/private.hfa"
    2929#include "exception.hfa"
     30#include "exception.h"
    3031#include "math.hfa"
    3132
     
    7778        free( desc->cancellation );
    7879        desc->cancellation = 0p;
     80}
     81
     82// helper for popping from coroutine's ehm buffer
     83inline nonlocal_exception * pop_ehm_head( coroutine$ * this ) {
     84    lock( this->ehm_state.buffer_lock __cfaabi_dbg_ctx2 );
     85    nonlocal_exception * nl_ex = pop_head( this->ehm_state.ehm_buffer );
     86    unlock( this->ehm_state.buffer_lock );
     87    return nl_ex;
    7988}
    8089
     
    121130        last = 0p;
    122131        cancellation = 0p;
     132    ehm_state.ehm_buffer{};
     133    ehm_state.buffer_lock{};
     134    ehm_state.ehm_enabled = false;
    123135}
    124136
    125137void ^?{}(coroutine$& this) libcfa_public {
     138    // handle any leftover pending non-local exceptions
     139    nonlocal_exception * nl_ex = pop_ehm_head( &this );
     140    unsigned unhandled_ex = 0;
     141   
      142    // free and count any leftover exceptions
     143    while ( nl_ex != 0p ){
     144        unhandled_ex++;
     145        free( nl_ex->the_exception );
     146        free( nl_ex );
     147        nl_ex = pop_ehm_head( &this );
     148    }
     149
     150    #ifdef __CFA_DEBUG__
     151    if ( unhandled_ex > 0 )
     152        printf( "Warning: Coroutine %p exited with %u pending nonlocal exceptions.\n", &this, unhandled_ex );
     153    #endif
     154
    126155        if(this.state != Halted && this.state != Start && this.state != Primed) {
    127156                coroutine$ * src = active_coroutine();
     
    283312}
    284313
     314
     315////////////////////////////////////////////////////////////////////////////////////////////////////
     316// non local ehm routines
     317
     318void defaultResumeAtHandler( exception_t * except ) {
     319    __cfaehm_allocate_exception( except );
     320    free( except );
     321    __cfaehm_begin_unwind( (void(*)(exception_t *))defaultTerminationHandler );
     322}
     323
     324bool poll( coroutine$ * cor ) libcfa_public {
     325    nonlocal_exception * nl_ex = pop_ehm_head( cor );
     326
     327    // if no exceptions return false
     328    if ( nl_ex == 0p ) return false;
     329   
     330    // otherwise loop and throwResume all pending exceptions
     331    while ( nl_ex != 0p ){
     332        exception_t * ex = nl_ex->the_exception;
     333        free( nl_ex );
     334        __cfaehm_throw_resume( ex, defaultResumeAtHandler );
     335       
     336        // only reached if resumption handled. other dealloc handled in defaultResumeAtHandler
     337        free( ex );
     338        nl_ex = pop_ehm_head( cor );
     339    }
     340   
     341    return true;
     342}
     343
     344bool poll() libcfa_public { return poll( active_coroutine() ); }
     345coroutine$ * resumer() libcfa_public { return active_coroutine()->last; }
     346
     347// user facing ehm operations
     348forall(T & | is_coroutine(T)) {
     349    // enable/disable non-local exceptions
     350    void enable_ehm( T & cor ) libcfa_public { get_coroutine( cor )->ehm_state.ehm_enabled = true; }
     351    void disable_ehm( T & cor ) libcfa_public { get_coroutine( cor )->ehm_state.ehm_enabled = false; }
     352
     353    // poll for non-local exceptions
     354    bool poll( T & cor ) libcfa_public { return poll( get_coroutine( cor ) ); }
     355
     356    // poll iff nonlocal ehm is enabled
     357    bool checked_poll( T & cor ) libcfa_public { return get_coroutine( cor )->ehm_state.ehm_enabled ? poll( cor ) : false; }
     358
     359    coroutine$ * resumer( T & cor ) libcfa_public { return get_coroutine( cor )->last; }
     360}
     361
     362// resume non local exception at receiver (i.e. enqueue in ehm buffer)
     363forall(exceptT *, T & | ehm_resume_at( exceptT, T ))
     364void resumeAt( T & receiver, exceptT & ex )  libcfa_public {
     365    coroutine$ * cor = get_coroutine( receiver );
     366    nonlocal_exception * nl_ex = alloc();
     367    exceptT * ex_copy = alloc();
     368    memcpy( ex_copy, &ex, sizeof(exceptT) );
     369    (*nl_ex){ (exception_t *)ex_copy };
     370    lock( cor->ehm_state.buffer_lock __cfaabi_dbg_ctx2 );
     371    append( cor->ehm_state.ehm_buffer, nl_ex );
     372    unlock( cor->ehm_state.buffer_lock );
     373}
     374
     375forall(exceptT * | { void $throwResume(exceptT &); })
     376void resumeAt( coroutine$ * receiver, exceptT & ex ) libcfa_public {
     377    nonlocal_exception * nl_ex = alloc();
     378    exceptT * ex_copy = alloc();
     379    memcpy( ex_copy, &ex, sizeof(exceptT) );
     380    (*nl_ex){ (exception_t *)ex_copy };
     381    lock( receiver->ehm_state.buffer_lock __cfaabi_dbg_ctx2 );
     382    append( receiver->ehm_state.ehm_buffer, nl_ex );
     383    unlock( receiver->ehm_state.buffer_lock );
     384}
     385
    285386// Local Variables: //
    286387// mode: c //
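Putting the new non-local EHM routines together: one side enqueues an exception with resumeAt, and the coroutine raises it at its next poll. A rough sketch under stated assumptions: interrupt_ex is a resumable CFA exception whose declaration and vtable setup are elided, and the worker's main suspends between units of work.

    coroutine worker {};
    void main( worker & w ) {
        for () {
            // ... one unit of work ...
            checked_poll( w );         // throwResumes queued exceptions, but only if ehm is enabled
            suspend;
        }
    }

    int main() {
        worker w;
        enable_ehm( w );               // delivery is opt-in per coroutine (off by default)
        resume( w );                   // run one unit of work
        interrupt_ex ex;               // assumed exception type; vtable setup elided
        resumeAt( w, ex );             // copies ex into w's ehm buffer under its lock
        resume( w );                   // the next checked_poll raises ex inside w
    }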
  • libcfa/src/concurrency/coroutine.hfa

    r92355883 r2a301ff  
    1919#include "invoke.h"
    2020#include "../exception.hfa"
     21
     22//-----------------------------------------------------------------------------
     23// Type used to store and queue nonlocal exceptions on coroutines
     24struct nonlocal_exception {
     25    exception_t * the_exception;
     26    nonlocal_exception * next;
     27};
     28static inline void ?{} ( nonlocal_exception & this, exception_t * ex ) with(this) {
     29    the_exception = ex;
     30    next = 0p;
     31}
     32
     33static inline nonlocal_exception *& get_next( nonlocal_exception & this ) __attribute__((const)) {
     34    return this.next;
     35}
    2136
    2237//-----------------------------------------------------------------------------
     
    203218}
    204219
     220// non local ehm and coroutine utility routines
     221bool poll( coroutine$ * cor );
     222bool poll();
     223coroutine$ * resumer();
     224
     225forall(T & | is_coroutine(T)) {
     226    void enable_ehm( T & cor );
     227    void disable_ehm( T & cor );
     228    bool poll( T & cor );
     229    bool checked_poll( T & cor );
     230    coroutine$ * resumer( T & cor );
     231}
     232
     233// trait for exceptions able to be resumed at another coroutine
     234forall(exceptT *, T & | is_coroutine(T))
     235trait ehm_resume_at { void $throwResume(exceptT &); };
     236
     237// general resumeAt
     238forall(exceptT *, T & | ehm_resume_at( exceptT, T ))
     239void resumeAt( T & receiver, exceptT & ex );
     240
     241// resumeAt for underlying coroutine$ type
     242forall(exceptT * | { void $throwResume(exceptT &); })
     243void resumeAt( coroutine$ * receiver, exceptT & ex );
     244
    205245// Local Variables: //
    206246// mode: c //
  • libcfa/src/concurrency/future.hfa

    r92355883 r2a301ff  
    3939        futex_mutex lock;
    4040        };
     41    __CFA_SELECT_GET_TYPE( future(T) );
    4142
    4243    struct future_node {
     
    180181        }
    181182               
    182         void on_selected( future(T) & this, select_node & node ) {}
     183        bool on_selected( future(T) & this, select_node & node ) { return true; }
    183184        }
    184185}
  • libcfa/src/concurrency/invoke.h

    r92355883 r2a301ff  
    1010// Created On       : Tue Jan 17 12:27:26 2016
    1111// Last Modified By : Peter A. Buhr
    12 // Last Modified On : Tue Mar 14 13:39:31 2023
    13 // Update Count     : 59
     12// Last Modified On : Wed Aug 30 21:27:51 2023
     13// Update Count     : 60
    1414//
    1515
    1616// Do not use #pragma once as this file is included twice in some places. It has its own guard system.
    1717
    18 #include "bits/containers.hfa"
     18#include "bits/collections.hfa"
    1919#include "bits/defs.hfa"
    2020#include "bits/locks.hfa"
     
    2323
    2424#ifdef __cforall
    25 #include "containers/list.hfa"
     25#include "collections/list.hfa"
    2626extern "C" {
    2727#endif
     
    7474        };
    7575
     76    struct nonlocal_ehm {
     77        // list of pending nonlocal exceptions
     78        __queue_t(struct nonlocal_exception) ehm_buffer;
     79
     80        // lock to protect the buffer
     81        struct __spinlock_t buffer_lock;
     82
     83        // enable/disabled flag
     84        bool ehm_enabled;
     85    };
     86
    7687        enum __Coroutine_State { Halted, Start, Primed, Blocked, Ready, Active, Cancelled, Halting };
    7788
     
    98109                struct _Unwind_Exception * cancellation;
    99110
     111        // Non-local exception handling information
     112        struct nonlocal_ehm ehm_state;
    100113        };
    101114        // Wrapper for gdb
     
    242255        #ifdef __cforall
    243256        extern "Cforall" {
     257        static inline bool exception_in_flight() {
     258            return __get_stack( &active_thread()->self_cor )->exception_context.current_exception != 0p;
     259        }
     260
    244261                static inline thread$ * volatile & ?`next ( thread$ * this ) {
    245262                        return this->user_link.next;
  • libcfa/src/concurrency/iofwd.hfa

    r92355883 r2a301ff  
    1010// Created On       : Thu Apr 23 17:31:00 2020
    1111// Last Modified By : Peter A. Buhr
    12 // Last Modified On : Mon Mar 13 23:54:57 2023
    13 // Update Count     : 1
     12// Last Modified On : Fri Jul 21 21:36:01 2023
     13// Update Count     : 3
    1414//
    1515
     
    1818#include <unistd.h>
    1919#include <sys/socket.h>
     20#include <string.h>                                                                             // memset
    2021
    2122extern "C" {
     
    151152#if CFA_HAVE_LINUX_IO_URING_H
    152153        static inline void zero_sqe(struct io_uring_sqe * sqe) {
    153                 sqe->flags = 0;
    154                 sqe->ioprio = 0;
    155                 sqe->fd = 0;
    156                 sqe->off = 0;
    157                 sqe->addr = 0;
    158                 sqe->len = 0;
    159                 sqe->fsync_flags = 0;
    160                 sqe->__pad2[0] = 0;
    161                 sqe->__pad2[1] = 0;
    162                 sqe->__pad2[2] = 0;
    163                 sqe->fd = 0;
    164                 sqe->off = 0;
    165                 sqe->addr = 0;
    166                 sqe->len = 0;
     154                memset( sqe, 0, sizeof( struct io_uring_sqe ) );
    167155        }
    168156#endif
  • libcfa/src/concurrency/kernel.cfa

    r92355883 r2a301ff  
    569569                returnToKernel();
    570570        __enable_interrupts_checked();
    571 
    572571}
    573572
  • libcfa/src/concurrency/kernel.hfa

    r92355883 r2a301ff  
    1010// Created On       : Tue Jan 17 12:27:26 2017
    1111// Last Modified By : Peter A. Buhr
    12 // Last Modified On : Tue Feb  4 12:29:26 2020
    13 // Update Count     : 22
     12// Last Modified On : Wed Aug 30 21:28:46 2023
     13// Update Count     : 23
    1414//
    1515
     
    2020#include "coroutine.hfa"
    2121
    22 #include "containers/list.hfa"
     22#include "collections/list.hfa"
    2323
    2424extern "C" {
  • libcfa/src/concurrency/kernel/startup.cfa

    r92355883 r2a301ff  
    487487        last = 0p;
    488488        cancellation = 0p;
     489    ehm_state.ehm_buffer{};
     490    ehm_state.buffer_lock{};
     491    ehm_state.ehm_enabled = false;
    489492}
    490493
  • libcfa/src/concurrency/locks.cfa

    r92355883 r2a301ff  
    239239}
    240240
    241 void on_selected( blocking_lock & this, select_node & node ) {}
     241bool on_selected( blocking_lock & this, select_node & node ) { return true; }
    242242
    243243//-----------------------------------------------------------------------------
  • libcfa/src/concurrency/locks.hfa

    r92355883 r2a301ff  
    2121
    2222#include "bits/weakso_locks.hfa"
    23 #include "containers/lockfree.hfa"
    24 #include "containers/list.hfa"
     23#include "collections/lockfree.hfa"
     24#include "collections/list.hfa"
    2525
    2626#include "limits.hfa"
     
    112112static inline bool   register_select( single_acquisition_lock & this, select_node & node ) { return register_select( (blocking_lock &)this, node ); }
    113113static inline bool   unregister_select( single_acquisition_lock & this, select_node & node ) { return unregister_select( (blocking_lock &)this, node ); }
    114 static inline void   on_selected( single_acquisition_lock & this, select_node & node ) { on_selected( (blocking_lock &)this, node ); }
     114static inline bool   on_selected( single_acquisition_lock & this, select_node & node ) { return on_selected( (blocking_lock &)this, node ); }
     115__CFA_SELECT_GET_TYPE( single_acquisition_lock );
    115116
    116117//----------
     
    129130static inline bool   register_select( owner_lock & this, select_node & node ) { return register_select( (blocking_lock &)this, node ); }
    130131static inline bool   unregister_select( owner_lock & this, select_node & node ) { return unregister_select( (blocking_lock &)this, node ); }
    131 static inline void   on_selected( owner_lock & this, select_node & node ) { on_selected( (blocking_lock &)this, node ); }
     132static inline bool   on_selected( owner_lock & this, select_node & node ) { return on_selected( (blocking_lock &)this, node ); }
     133__CFA_SELECT_GET_TYPE( owner_lock );
    132134
    133135//-----------------------------------------------------------------------------
     
    138140};
    139141
    140 static inline void ?{}(mcs_node & this) { this.next = 0p; }
     142static inline void ?{}( mcs_node & this ) { this.next = 0p; }
    141143
    142144static inline mcs_node * volatile & ?`next ( mcs_node * node ) {
     
    148150};
    149151
    150 static inline void lock(mcs_lock & l, mcs_node & n) {
     152static inline void lock( mcs_lock & l, mcs_node & n ) {
    151153        if(push(l.queue, &n))
    152154                wait(n.sem);
     
    172174};
    173175
    174 static inline void ?{}(mcs_spin_node & this) { this.next = 0p; this.locked = true; }
     176static inline void ?{}( mcs_spin_node & this ) { this.next = 0p; this.locked = true; }
    175177
    176178struct mcs_spin_lock {
     
    178180};
    179181
    180 static inline void lock(mcs_spin_lock & l, mcs_spin_node & n) {
     182static inline void lock( mcs_spin_lock & l, mcs_spin_node & n ) {
    181183    n.locked = true;
    182184        mcs_spin_node * prev = __atomic_exchange_n(&l.queue.tail, &n, __ATOMIC_SEQ_CST);
     
    271273};
    272274static inline void  ?{}( go_mutex & this ) with(this) { val = 0; }
    273 // static inline void ?{}( go_mutex & this, go_mutex this2 ) = void; // these don't compile correctly at the moment so they should be omitted
    274 // static inline void ?=?( go_mutex & this, go_mutex this2 ) = void;
     275static inline void ?{}( go_mutex & this, go_mutex this2 ) = void;
     276static inline void ?=?( go_mutex & this, go_mutex this2 ) = void;
    275277
    276278static inline bool internal_try_lock(go_mutex & this, int & compare_val, int new_val ) with(this) {
     
    619621}
    620622
    621 static inline void on_selected( simple_owner_lock & this, select_node & node ) {}
    622 
     623static inline bool on_selected( simple_owner_lock & this, select_node & node ) { return true; }
     624__CFA_SELECT_GET_TYPE( simple_owner_lock );
    623625
    624626//-----------------------------------------------------------------------------
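The MCS locks touched above (whitespace-only signature changes aside) keep the lock itself one word by making each contending thread supply its own queue node, so handoff is local to the predecessor/successor pair. A usage sketch, assuming the matching unlock( mcs_lock &, mcs_node & ) declared alongside lock in this file:

    mcs_lock l;

    void critical_section() {
        mcs_node n;                    // per-acquisition node on this thread's stack
        lock( l, n );                  // append n; block on n.sem if a predecessor holds the lock
        // ... critical section ...
        unlock( l, n );                // hand the lock to n.next, if any
    }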
  • libcfa/src/concurrency/once.hfa

    r92355883 r2a301ff  
    1616#pragma once
    1717
    18 #include "containers/lockfree.hfa"
     18#include "collections/lockfree.hfa"
    1919#include "kernel/fwd.hfa"
    2020
  • libcfa/src/concurrency/select.cfa

    r92355883 r2a301ff  
    4949    return false;
    5050}
    51 void on_selected( select_timeout_node & this, select_node & node ) {}
     51bool on_selected( select_timeout_node & this, select_node & node ) { return true; }
    5252
    5353// Gateway routine to wait on duration
  • libcfa/src/concurrency/select.hfa

    r92355883 r2a301ff  
    1717#pragma once
    1818
    19 #include "containers/list.hfa"
     19#include "collections/list.hfa"
    2020#include "alarm.hfa"
    2121#include "kernel.hfa"
     
    9494
    9595    // This routine is run on the selecting thread prior to executing the statement corresponding to the select_node
    96     //    passed as an arg to this routine
    97     // If on_selected returns false, the statement is not run, if it returns true it is run.
    98     void on_selected( T &, select_node & );
      96    //    passed as an arg to this routine. If true is returned, proceed as normal; if false, the statement is skipped
     97    bool on_selected( T &, select_node & );
    9998};
     99// Used inside the compiler to allow for overloading on return type for operations such as '?<<?' for channels
     100// YOU MUST USE THIS MACRO OR INCLUDE AN EQUIVALENT DECL FOR YOUR TYPE TO SUPPORT WAITUNTIL
     101#define __CFA_SELECT_GET_TYPE( typename ) typename __CFA_select_get_type( typename __CFA_t )
     102
    100103
    101104//=============================================================================================
     
    208211bool register_select( select_timeout_node & this, select_node & node );
    209212bool unregister_select( select_timeout_node & this, select_node & node );
    210 void on_selected( select_timeout_node & this, select_node & node );
     213bool on_selected( select_timeout_node & this, select_node & node );
     214select_timeout_node __CFA_select_get_type( select_timeout_node this );
    211215
    212216// Gateway routines to waituntil on duration
    213217select_timeout_node timeout( Duration duration );
    214218select_timeout_node sleep( Duration duration );
     219
  • libcfa/src/concurrency/stats.cfa

    r92355883 r2a301ff  
    1111#if !defined(__CFA_NO_STATISTICS__)
    1212        void __init_stats( struct __stats_t * stats ) {
    13                 stats->ready.push.local.attempt = 0;
    14                 stats->ready.push.local.success = 0;
    15                 stats->ready.push.share.attempt = 0;
    16                 stats->ready.push.share.success = 0;
    17                 stats->ready.push.extrn.attempt = 0;
    18                 stats->ready.push.extrn.success = 0;
    19                 stats->ready.pop.local .attempt = 0;
    20                 stats->ready.pop.local .success = 0;
    21                 stats->ready.pop.help  .attempt = 0;
    22                 stats->ready.pop.help  .success = 0;
    23                 stats->ready.pop.steal .attempt = 0;
    24                 stats->ready.pop.steal .success = 0;
    25                 stats->ready.pop.search.attempt = 0;
    26                 stats->ready.pop.search.success = 0;
    27                 stats->ready.threads.migration = 0;
    28                 stats->ready.threads.extunpark = 0;
    29                 stats->ready.threads.threads   = 0;
    30                 stats->ready.threads.cthreads  = 0;
    31                 stats->ready.threads.preempt.yield  = 0;
    32                 stats->ready.threads.preempt.rllfwd = 0;
    33                 stats->ready.sleep.halts   = 0;
    34                 stats->ready.sleep.cancels = 0;
    35                 stats->ready.sleep.early   = 0;
    36                 stats->ready.sleep.wakes   = 0;
    37                 stats->ready.sleep.seen    = 0;
    38                 stats->ready.sleep.exits   = 0;
     13                memset( &stats->ready, 0, sizeof( stats->ready ) );
    3914
    4015                #if defined(CFA_HAVE_LINUX_IO_URING_H)
    41                         stats->io.alloc.fast        = 0;
    42                         stats->io.alloc.slow        = 0;
    43                         stats->io.alloc.fail        = 0;
    44                         stats->io.alloc.revoke      = 0;
    45                         stats->io.alloc.block       = 0;
    46                         stats->io.submit.fast       = 0;
    47                         stats->io.submit.slow       = 0;
    48                         stats->io.submit.eagr       = 0;
    49                         stats->io.submit.nblk       = 0;
    50                         stats->io.submit.extr       = 0;
    51                         stats->io.flush.external    = 0;
    52                         stats->io.flush.signal      = 0;
    53                         stats->io.flush.dirty       = 0;
    54                         stats->io.flush.full        = 0;
    55                         stats->io.flush.idle        = 0;
    56                         stats->io.flush.eager       = 0;
    57                         stats->io.calls.flush       = 0;
    58                         stats->io.calls.submitted   = 0;
    59                         stats->io.calls.drain       = 0;
    60                         stats->io.calls.completed   = 0;
    61                         stats->io.calls.locked      = 0;
    62                         stats->io.calls.helped      = 0;
    63                         stats->io.calls.errors.busy = 0;
    64                         stats->io.ops.sockread      = 0;
    65                         stats->io.ops.epllread      = 0;
    66                         stats->io.ops.sockwrite     = 0;
    67                         stats->io.ops.epllwrite     = 0;
     16                        memset( &stats->io, 0, sizeof( stats->io ) );
    6817                #endif
    6918
Note: See TracChangeset for help on using the changeset viewer.