Timestamp:
May 15, 2018, 4:17:15 PM (7 years ago)
Author:
Rob Schluntz <rschlunt@…>
Branches:
ADT, aaron-thesis, arm-eh, ast-experimental, cleanup-dtors, deferred_resn, demangler, enum, forall-pointer-decay, jacob/cs343-translation, jenkins-sandbox, master, new-ast, new-ast-unique-expr, new-env, no_list, persistent-indexer, pthread-emulation, qualifiedEnum, with_gc
Children:
2e5fa345
Parents:
7d0a3ba (diff), a61fa0bb (diff)
Note: this is a merge changeset, the changes displayed below correspond to the merge itself.
Use the (diff) links above to see all the changes relative to each parent.
Message:

Merge branch 'master' of plg.uwaterloo.ca:/u/cforall/software/cfa/cfa-cc

Location:
src/libcfa/concurrency
Files:
10 edited

  • src/libcfa/concurrency/coroutine

    r7d0a3ba r358cba0  
    7272// Suspend implementation inlined for performance
    7373static inline void suspend() {
    74         coroutine_desc * src = TL_GET( this_coroutine );                        // optimization
     74        // optimization : read TLS once and reuse it
     75        // Safety note: this is preemption safe since if
     76        // preemption occurs after this line, the pointer
     77        // will also migrate which means this value will
      78        // stay in sync with the TLS
     79        coroutine_desc * src = TL_GET( this_coroutine );
    7580
    7681        assertf( src->last != 0,
     
    8994forall(dtype T | is_coroutine(T))
    9095static inline void resume(T & cor) {
    91         coroutine_desc * src = TL_GET( this_coroutine );                        // optimization
     96        // optimization : read TLS once and reuse it
     97        // Safety note: this is preemption safe since if
     98        // preemption occurs after this line, the pointer
     99        // will also migrate which means this value will
      100        // stay in sync with the TLS
     101        coroutine_desc * src = TL_GET( this_coroutine );
    92102        coroutine_desc * dst = get_coroutine(cor);
    93103
     
    107117                dst->last = src;
    108118                dst->starter = dst->starter ? dst->starter : src;
    109         } // if
     119        }
    110120
    111121        // always done for performance testing
     
    114124
    115125static inline void resume(coroutine_desc * dst) {
    116         coroutine_desc * src = TL_GET( this_coroutine );                        // optimization
     126        // optimization : read TLS once and reuse it
     127        // Safety note: this is preemption safe since if
     128        // preemption occurs after this line, the pointer
     129        // will also migrate which means this value will
      130        // stay in sync with the TLS
     131        coroutine_desc * src = TL_GET( this_coroutine );
    117132
    118133        // not resuming self ?
     
    125140                // set last resumer
    126141                dst->last = src;
    127         } // if
     142        }
    128143
    129144        // always done for performance testing
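
The comments added to suspend() and resume() above all describe the same optimization: read the this_coroutine thread-local slot once and reuse the cached pointer for the rest of the call. A minimal C sketch of that pattern, assuming a hypothetical __thread variable named tls_this_coroutine (not the CFA runtime's actual declaration):

    struct coroutine_sketch { struct coroutine_sketch * last; };
    static __thread struct coroutine_sketch * tls_this_coroutine;

    static inline void suspend_sketch( void ) {
        // Single TLS read; if preemption migrates the task afterwards, the
        // TLS slot migrates with it, so the cached value stays in sync.
        struct coroutine_sketch * src = tls_this_coroutine;
        (void)src;   // the rest of the real suspend() uses src from here on
    }
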
  • src/libcfa/concurrency/coroutine.c

    r7d0a3ba r358cba0  
    8484// Wrapper for co
    8585void CoroutineCtxSwitch(coroutine_desc* src, coroutine_desc* dst) {
    86       verify( TL_GET( preemption_state ).enabled || TL_GET( this_processor )->do_terminate );
     86      // Safety note : This could cause some false positives due to preemption
     87      verify( TL_GET( preemption_state.enabled ) || TL_GET( this_processor )->do_terminate );
    8788      disable_interrupts();
    8889
     
    9192
    9293      // set new coroutine that task is executing
    93       TL_SET( this_coroutine, dst );
     94      kernelTLS.this_coroutine = dst;
    9495
    9596      // context switch to specified coroutine
     
    102103
    103104      enable_interrupts( __cfaabi_dbg_ctx );
    104       verify( TL_GET( preemption_state ).enabled || TL_GET( this_processor )->do_terminate );
     105      // Safety note : This could cause some false positives due to preemption
     106      verify( TL_GET( preemption_state.enabled ) || TL_GET( this_processor )->do_terminate );
    105107} //ctxSwitchDirect
    106108
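
CoroutineCtxSwitch now stores the destination coroutine directly into the kernelTLS block instead of going through TL_SET, which is safe because interrupts stay disabled across the whole switch. A rough C sketch of that ordering, using illustrative names (tls_sketch, ctx_switch_sketch) rather than the real runtime symbols:

    #include <stdbool.h>

    struct coro_sketch { void * stack_context; };
    static __thread struct {
        struct coro_sketch * this_coroutine;
        bool preemption_enabled;
    } tls_sketch;

    void ctx_switch_sketch( struct coro_sketch * src, struct coro_sketch * dst ) {
        tls_sketch.preemption_enabled = false;   // disable_interrupts(): no preemption from here
        tls_sketch.this_coroutine = dst;         // direct TLS store cannot be observed half-done
        (void)src;                               // the real code calls CtxSwitch( src, dst ) here
        tls_sketch.preemption_enabled = true;    // enable_interrupts() after control returns
    }
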
  • src/libcfa/concurrency/invoke.c

    r7d0a3ba r358cba0  
    6969        // Fetch the thread handle from the user defined thread structure
    7070        struct thread_desc* thrd = get_thread( this );
     71        thrd->self_cor.last = NULL;
    7172
    7273        // Officially start the thread by enabling preemption
  • src/libcfa/concurrency/invoke.h

    r7d0a3ba r358cba0  
    1818#include "bits/locks.h"
    1919
    20 #define TL_GET( member ) kernelThreadData.member
    21 #define TL_SET( member, value ) kernelThreadData.member = value;
     20#define TL_GET( member ) kernelTLS.member
     21#define TL_SET( member, value ) kernelTLS.member = value;
    2222
    2323#ifdef __cforall
     
    4444                                volatile bool in_progress;
    4545                        } preemption_state;
    46                 } kernelThreadData;
     46                } kernelTLS;
    4747        }
    4848
    4949        static inline struct coroutine_desc * volatile active_coroutine() { return TL_GET( this_coroutine ); }
    50         static inline struct thread_desc * volatile active_thread() { return TL_GET( this_thread ); }
    51         static inline struct processor * volatile active_processor() { return TL_GET( this_processor ); }
     50        static inline struct thread_desc    * volatile active_thread   () { return TL_GET( this_thread    ); }
     51        static inline struct processor      * volatile active_processor() { return TL_GET( this_processor ); } // UNSAFE
    5252        #endif
    5353
     
    136136                struct thread_desc * next;
    137137
    138                 __cfaabi_dbg_debug_do(
    139                         // instrusive link field for debugging
    140                         struct thread_desc * dbg_next;
    141                         struct thread_desc * dbg_prev;
    142                 )
     138                struct {
     139                        struct thread_desc * next;
     140                        struct thread_desc * prev;
     141                } node;
    143142     };
    144143
     
    147146                static inline thread_desc * & get_next( thread_desc & this ) {
    148147                        return this.next;
     148                }
     149
     150                static inline [thread_desc *&, thread_desc *& ] __get( thread_desc & this ) {
     151                        return this.node.[next, prev];
    149152                }
    150153
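
invoke.h renames the thread-local block from kernelThreadData to kernelTLS and replaces the debug-only dbg_next/dbg_prev fields with an unconditional intrusive node pair; the new __get routine hands the list code both links as a CFA tuple of references. A plain C approximation of the same layout (the _sketch names are illustrative):

    struct thread_sketch {
        struct thread_sketch * next;          // ready-queue link (singly linked)
        struct {                              // intrusive links for the global thread list
            struct thread_sketch * next;
            struct thread_sketch * prev;
        } node;
    };

    // CFA's __get returns [next, prev] by reference; a C list implementation
    // would instead take the addresses of both link fields.
    static inline void get_links_sketch( struct thread_sketch * t,
                                         struct thread_sketch *** next,
                                         struct thread_sketch *** prev ) {
        *next = &t->node.next;
        *prev = &t->node.prev;
    }
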
  • src/libcfa/concurrency/kernel

    r7d0a3ba r358cba0  
    4040
    4141//-----------------------------------------------------------------------------
    42 // Cluster
    43 struct cluster {
    44         // Ready queue locks
    45         __spinlock_t ready_queue_lock;
     42// Processor
     43extern struct cluster * mainCluster;
    4644
    47         // Ready queue for threads
    48         __queue_t(thread_desc) ready_queue;
    49 
    50         // Name of the cluster
    51         const char * name;
    52 
    53         // Preemption rate on this cluster
    54         Duration preemption_rate;
    55 };
    56 
    57 extern struct cluster * mainCluster;
    58 extern Duration default_preemption();
    59 
    60 void ?{} (cluster & this, const char * name, Duration preemption_rate);
    61 void ^?{}(cluster & this);
    62 
    63 static inline void ?{} (cluster & this)                           { this{"Anonymous Cluster", default_preemption()}; }
    64 static inline void ?{} (cluster & this, Duration preemption_rate) { this{"Anonymous Cluster", preemption_rate}; }
    65 static inline void ?{} (cluster & this, const char * name)        { this{name, default_preemption()}; }
    66 
    67 //-----------------------------------------------------------------------------
    68 // Processor
    6945enum FinishOpCode { No_Action, Release, Schedule, Release_Schedule, Release_Multi, Release_Multi_Schedule };
    7046
     
    9874
    9975        // Cluster from which to get threads
    100         cluster * cltr;
     76        struct cluster * cltr;
    10177
    10278        // Name of the processor
     
    124100        bool pending_preemption;
    125101
     102        // Idle lock
     103
     104        // Link lists fields
     105        struct {
     106                struct processor * next;
     107                struct processor * prev;
     108        } node;
     109
    126110#ifdef __CFA_DEBUG__
    127111        // Last function to enable preemption on this processor
     
    130114};
    131115
    132 void  ?{}(processor & this, const char * name, cluster & cltr);
     116void  ?{}(processor & this, const char * name, struct cluster & cltr);
    133117void ^?{}(processor & this);
    134118
    135119static inline void  ?{}(processor & this)                    { this{ "Anonymous Processor", *mainCluster}; }
    136 static inline void  ?{}(processor & this, cluster & cltr)    { this{ "Anonymous Processor", cltr}; }
     120static inline void  ?{}(processor & this, struct cluster & cltr)    { this{ "Anonymous Processor", cltr}; }
    137121static inline void  ?{}(processor & this, const char * name) { this{name, *mainCluster }; }
     122
     123static inline [processor *&, processor *& ] __get( processor & this ) {
     124        return this.node.[next, prev];
     125}
     126
     127//-----------------------------------------------------------------------------
     128// Cluster
     129struct cluster {
     130        // Ready queue locks
     131        __spinlock_t ready_queue_lock;
     132
     133        // Ready queue for threads
     134        __queue_t(thread_desc) ready_queue;
     135
     136        // Name of the cluster
     137        const char * name;
     138
     139        // Preemption rate on this cluster
     140        Duration preemption_rate;
     141
     142        // List of processors
     143        __spinlock_t proc_list_lock;
     144        __dllist_t(struct processor) procs;
     145        __dllist_t(struct processor) idles;
     146
     147        // Link lists fields
     148        struct {
     149                cluster * next;
     150                cluster * prev;
     151        } node;
     152};
     153extern Duration default_preemption();
     154
     155void ?{} (cluster & this, const char * name, Duration preemption_rate);
     156void ^?{}(cluster & this);
     157
     158static inline void ?{} (cluster & this)                           { this{"Anonymous Cluster", default_preemption()}; }
     159static inline void ?{} (cluster & this, Duration preemption_rate) { this{"Anonymous Cluster", preemption_rate}; }
     160static inline void ?{} (cluster & this, const char * name)        { this{name, default_preemption()}; }
     161
     162static inline [cluster *&, cluster *& ] __get( cluster & this ) {
     163        return this.node.[next, prev];
     164}
    138165
    139166// Local Variables: //
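
The kernel header moves struct cluster after struct processor because a cluster now embeds __dllist_t lists of its processors (procs and idles), while a processor only needs a pointer back to its cluster, for which a forward declaration suffices. A hedged C sketch of that ordering constraint (names are illustrative):

    struct cluster_sketch;                        // forward declaration is enough for a pointer

    struct processor_sketch {
        struct cluster_sketch * cltr;             // incomplete type is fine behind a pointer
        struct { struct processor_sketch * next, * prev; } node;
    };

    struct cluster_sketch {                       // must follow processor: it embeds the list heads
        struct processor_sketch * procs;          // stand-in for __dllist_t(struct processor)
        struct processor_sketch * idles;
        struct { struct cluster_sketch * next, * prev; } node;
    };
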
  • src/libcfa/concurrency/kernel.c

    r7d0a3ba r358cba0  
    4949thread_desc * mainThread;
    5050
     51struct { __dllist_t(thread_desc) list; __spinlock_t lock; } global_threads ;
     52struct { __dllist_t(cluster    ) list; __spinlock_t lock; } global_clusters;
     53
    5154//-----------------------------------------------------------------------------
    5255// Global state
     
    5659// volatile thread_local unsigned short disable_preempt_count = 1;
    5760
    58 thread_local struct KernelThreadData kernelThreadData = {
     61thread_local struct KernelThreadData kernelTLS = {
    5962        NULL,
    6063        NULL,
     
    117120        self_mon_p = &self_mon;
    118121        next = NULL;
    119         __cfaabi_dbg_debug_do(
    120                 dbg_next = NULL;
    121                 dbg_prev = NULL;
    122                 __cfaabi_dbg_thread_register(&this);
    123         )
     122
     123        node.next = NULL;
     124        node.prev = NULL;
     125        doregister(this);
    124126
    125127        monitors{ &self_mon_p, 1, (fptr_t)0 };
     
    155157                terminate(&this);
    156158                verify(this.do_terminate);
    157                 verify(TL_GET( this_processor ) != &this);
     159                verify( kernelTLS.this_processor != &this);
    158160                P( terminated );
    159                 verify(TL_GET( this_processor ) != &this);
     161                verify( kernelTLS.this_processor != &this);
    160162                pthread_join( kernel_thread, NULL );
    161163        }
     
    167169        ready_queue{};
    168170        ready_queue_lock{};
     171
     172        procs{ __get };
     173        idles{ __get };
     174
     175        doregister(this);
    169176}
    170177
    171178void ^?{}(cluster & this) {
    172 
     179        unregister(this);
    173180}
    174181
     
    183190        __cfaabi_dbg_print_safe("Kernel : core %p starting\n", this);
    184191
     192        doregister(this->cltr, this);
     193
    185194        {
    186195                // Setup preemption data
     
    196205                        if(readyThread)
    197206                        {
    198                                 verify( ! TL_GET( preemption_state ).enabled );
     207                                verify( ! kernelTLS.preemption_state.enabled );
    199208
    200209                                runThread(this, readyThread);
    201210
    202                                 verify( ! TL_GET( preemption_state ).enabled );
     211                                verify( ! kernelTLS.preemption_state.enabled );
    203212
    204213                                //Some actions need to be taken from the kernel
     
    216225        }
    217226
     227        unregister(this->cltr, this);
     228
    218229        V( this->terminated );
    219230
     
    221232}
    222233
     234// KERNEL ONLY
    223235// runThread runs a thread by context switching
    224236// from the processor coroutine to the target thread
     
    228240        coroutine_desc * thrd_cor = dst->curr_cor;
    229241
    230         //Reset the terminating actions here
     242        // Reset the terminating actions here
    231243        this->finish.action_code = No_Action;
    232244
    233         //Update global state
    234         TL_SET( this_thread, dst );
     245        // Update global state
     246        kernelTLS.this_thread = dst;
    235247
    236248        // Context Switch to the thread
     
    239251}
    240252
     253// KERNEL_ONLY
    241254void returnToKernel() {
    242         coroutine_desc * proc_cor = get_coroutine(TL_GET( this_processor )->runner);
    243         coroutine_desc * thrd_cor = TL_GET( this_thread )->curr_cor = TL_GET( this_coroutine );
     255        coroutine_desc * proc_cor = get_coroutine(kernelTLS.this_processor->runner);
     256        coroutine_desc * thrd_cor = kernelTLS.this_thread->curr_cor = kernelTLS.this_coroutine;
    244257        ThreadCtxSwitch(thrd_cor, proc_cor);
    245258}
    246259
     260// KERNEL_ONLY
    247261// Once a thread has finished running, some of
    248262// its final actions must be executed from the kernel
    249263void finishRunning(processor * this) with( this->finish ) {
    250264        if( action_code == Release ) {
    251                 verify( ! TL_GET( preemption_state ).enabled );
     265                verify( ! kernelTLS.preemption_state.enabled );
    252266                unlock( *lock );
    253267        }
     
    256270        }
    257271        else if( action_code == Release_Schedule ) {
    258                 verify( ! TL_GET( preemption_state ).enabled );
     272                verify( ! kernelTLS.preemption_state.enabled );
    259273                unlock( *lock );
    260274                ScheduleThread( thrd );
    261275        }
    262276        else if( action_code == Release_Multi ) {
    263                 verify( ! TL_GET( preemption_state ).enabled );
     277                verify( ! kernelTLS.preemption_state.enabled );
    264278                for(int i = 0; i < lock_count; i++) {
    265279                        unlock( *locks[i] );
     
    285299}
    286300
     301// KERNEL_ONLY
    287302// Context invoker for processors
    288303// This is the entry point for processors (kernel threads)
     
    290305void * CtxInvokeProcessor(void * arg) {
    291306        processor * proc = (processor *) arg;
    292         TL_SET( this_processor, proc );
    293         TL_SET( this_coroutine, NULL );
    294         TL_SET( this_thread, NULL );
    295         TL_GET( preemption_state ).[enabled, disable_count] = [false, 1];
     307        kernelTLS.this_processor = proc;
     308        kernelTLS.this_coroutine = NULL;
     309        kernelTLS.this_thread    = NULL;
     310        kernelTLS.preemption_state.[enabled, disable_count] = [false, 1];
    296311        // SKULLDUGGERY: We want to create a context for the processor coroutine
    297312        // which is needed for the 2-step context switch. However, there is no reason
     
    305320
    306321        //Set global state
    307         TL_SET( this_coroutine, get_coroutine(proc->runner) );
    308         TL_SET( this_thread, NULL );
     322        kernelTLS.this_coroutine = get_coroutine(proc->runner);
     323        kernelTLS.this_thread    = NULL;
    309324
    310325        //We now have a proper context from which to schedule threads
     
    333348}
    334349
     350// KERNEL_ONLY
    335351void kernel_first_resume(processor * this) {
    336         coroutine_desc * src = TL_GET( this_coroutine );
     352        coroutine_desc * src = kernelTLS.this_coroutine;
    337353        coroutine_desc * dst = get_coroutine(this->runner);
    338354
    339         verify( ! TL_GET( preemption_state ).enabled );
     355        verify( ! kernelTLS.preemption_state.enabled );
    340356
    341357        create_stack(&dst->stack, dst->stack.size);
    342358        CtxStart(&this->runner, CtxInvokeCoroutine);
    343359
    344         verify( ! TL_GET( preemption_state ).enabled );
     360        verify( ! kernelTLS.preemption_state.enabled );
    345361
    346362        dst->last = src;
     
    351367
    352368        // set new coroutine that task is executing
    353         TL_SET( this_coroutine, dst );
     369        kernelTLS.this_coroutine = dst;
    354370
    355371        // SKULLDUGGERY normally interrupts are enabled before leaving a coroutine ctxswitch.
     
    368384        src->state = Active;
    369385
    370         verify( ! TL_GET( preemption_state ).enabled );
     386        verify( ! kernelTLS.preemption_state.enabled );
    371387}
    372388
    373389//-----------------------------------------------------------------------------
    374390// Scheduler routines
     391
     392// KERNEL ONLY
    375393void ScheduleThread( thread_desc * thrd ) {
    376         // if( ! thrd ) return;
    377394        verify( thrd );
    378395        verify( thrd->self_cor.state != Halted );
    379396
    380         verify( ! TL_GET( preemption_state ).enabled );
     397        verify( ! kernelTLS.preemption_state.enabled );
    381398
    382399        verifyf( thrd->next == NULL, "Expected null got %p", thrd->next );
     
    388405        }
    389406
    390         verify( ! TL_GET( preemption_state ).enabled );
    391 }
    392 
     407        verify( ! kernelTLS.preemption_state.enabled );
     408}
     409
     410// KERNEL ONLY
    393411thread_desc * nextThread(cluster * this) with( *this ) {
    394         verify( ! TL_GET( preemption_state ).enabled );
     412        verify( ! kernelTLS.preemption_state.enabled );
    395413        lock( ready_queue_lock __cfaabi_dbg_ctx2 );
    396414        thread_desc * head = pop_head( ready_queue );
    397415        unlock( ready_queue_lock );
    398         verify( ! TL_GET( preemption_state ).enabled );
     416        verify( ! kernelTLS.preemption_state.enabled );
    399417        return head;
    400418}
     
    402420void BlockInternal() {
    403421        disable_interrupts();
    404         verify( ! TL_GET( preemption_state ).enabled );
     422        verify( ! kernelTLS.preemption_state.enabled );
    405423        returnToKernel();
    406         verify( ! TL_GET( preemption_state ).enabled );
     424        verify( ! kernelTLS.preemption_state.enabled );
    407425        enable_interrupts( __cfaabi_dbg_ctx );
    408426}
     
    410428void BlockInternal( __spinlock_t * lock ) {
    411429        disable_interrupts();
    412         with( *TL_GET( this_processor ) ) {
     430        with( *kernelTLS.this_processor ) {
    413431                finish.action_code = Release;
    414432                finish.lock        = lock;
    415433        }
    416434
    417         verify( ! TL_GET( preemption_state ).enabled );
     435        verify( ! kernelTLS.preemption_state.enabled );
    418436        returnToKernel();
    419         verify( ! TL_GET( preemption_state ).enabled );
     437        verify( ! kernelTLS.preemption_state.enabled );
    420438
    421439        enable_interrupts( __cfaabi_dbg_ctx );
     
    424442void BlockInternal( thread_desc * thrd ) {
    425443        disable_interrupts();
    426         with( *TL_GET( this_processor ) ) {
     444        with( * kernelTLS.this_processor ) {
    427445                finish.action_code = Schedule;
    428446                finish.thrd        = thrd;
    429447        }
    430448
    431         verify( ! TL_GET( preemption_state ).enabled );
     449        verify( ! kernelTLS.preemption_state.enabled );
    432450        returnToKernel();
    433         verify( ! TL_GET( preemption_state ).enabled );
     451        verify( ! kernelTLS.preemption_state.enabled );
    434452
    435453        enable_interrupts( __cfaabi_dbg_ctx );
     
    439457        assert(thrd);
    440458        disable_interrupts();
    441         with( *TL_GET( this_processor ) ) {
     459        with( * kernelTLS.this_processor ) {
    442460                finish.action_code = Release_Schedule;
    443461                finish.lock        = lock;
     
    445463        }
    446464
    447         verify( ! TL_GET( preemption_state ).enabled );
     465        verify( ! kernelTLS.preemption_state.enabled );
    448466        returnToKernel();
    449         verify( ! TL_GET( preemption_state ).enabled );
     467        verify( ! kernelTLS.preemption_state.enabled );
    450468
    451469        enable_interrupts( __cfaabi_dbg_ctx );
     
    454472void BlockInternal(__spinlock_t * locks [], unsigned short count) {
    455473        disable_interrupts();
    456         with( *TL_GET( this_processor ) ) {
     474        with( * kernelTLS.this_processor ) {
    457475                finish.action_code = Release_Multi;
    458476                finish.locks       = locks;
     
    460478        }
    461479
    462         verify( ! TL_GET( preemption_state ).enabled );
     480        verify( ! kernelTLS.preemption_state.enabled );
    463481        returnToKernel();
    464         verify( ! TL_GET( preemption_state ).enabled );
     482        verify( ! kernelTLS.preemption_state.enabled );
    465483
    466484        enable_interrupts( __cfaabi_dbg_ctx );
     
    469487void BlockInternal(__spinlock_t * locks [], unsigned short lock_count, thread_desc * thrds [], unsigned short thrd_count) {
    470488        disable_interrupts();
    471         with( *TL_GET( this_processor ) ) {
     489        with( *kernelTLS.this_processor ) {
    472490                finish.action_code = Release_Multi_Schedule;
    473491                finish.locks       = locks;
     
    477495        }
    478496
    479         verify( ! TL_GET( preemption_state ).enabled );
     497        verify( ! kernelTLS.preemption_state.enabled );
    480498        returnToKernel();
    481         verify( ! TL_GET( preemption_state ).enabled );
     499        verify( ! kernelTLS.preemption_state.enabled );
    482500
    483501        enable_interrupts( __cfaabi_dbg_ctx );
    484502}
    485503
     504// KERNEL ONLY
    486505void LeaveThread(__spinlock_t * lock, thread_desc * thrd) {
    487         verify( ! TL_GET( preemption_state ).enabled );
    488         with( *TL_GET( this_processor ) ) {
     506        verify( ! kernelTLS.preemption_state.enabled );
     507        with( * kernelTLS.this_processor ) {
    489508                finish.action_code = thrd ? Release_Schedule : Release;
    490509                finish.lock        = lock;
     
    501520// Kernel boot procedures
    502521void kernel_startup(void) {
    503         verify( ! TL_GET( preemption_state ).enabled );
     522        verify( ! kernelTLS.preemption_state.enabled );
    504523        __cfaabi_dbg_print_safe("Kernel : Starting\n");
     524
     525        global_threads. list{ __get };
     526        global_threads. lock{};
     527        global_clusters.list{ __get };
     528        global_clusters.lock{};
    505529
    506530        // Initialize the main cluster
     
    547571
    548572        //initialize the global state variables
    549         TL_SET( this_processor, mainProcessor );
    550         TL_SET( this_thread, mainThread );
    551         TL_SET( this_coroutine, &mainThread->self_cor );
     573        kernelTLS.this_processor = mainProcessor;
     574        kernelTLS.this_thread    = mainThread;
     575        kernelTLS.this_coroutine = &mainThread->self_cor;
    552576
    553577        // Enable preemption
     
    561585        // context. Hence, the main thread does not begin through CtxInvokeThread, like all other threads. The trick here is that
    562586        // mainThread is on the ready queue when this call is made.
    563         kernel_first_resume( TL_GET( this_processor ) );
     587        kernel_first_resume( kernelTLS.this_processor );
    564588
    565589
     
    568592        __cfaabi_dbg_print_safe("Kernel : Started\n--------------------------------------------------\n\n");
    569593
    570         verify( ! TL_GET( preemption_state ).enabled );
     594        verify( ! kernelTLS.preemption_state.enabled );
    571595        enable_interrupts( __cfaabi_dbg_ctx );
    572         verify( TL_GET( preemption_state ).enabled );
     596        verify( TL_GET( preemption_state.enabled ) );
    573597}
    574598
     
    576600        __cfaabi_dbg_print_safe("\n--------------------------------------------------\nKernel : Shutting down\n");
    577601
    578         verify( TL_GET( preemption_state ).enabled );
     602        verify( TL_GET( preemption_state.enabled ) );
    579603        disable_interrupts();
    580         verify( ! TL_GET( preemption_state ).enabled );
     604        verify( ! kernelTLS.preemption_state.enabled );
    581605
    582606        // SKULLDUGGERY: Notify the mainProcessor it needs to terminate.
     
    604628
    605629//=============================================================================================
     630// Kernel Quiescing
     631//=============================================================================================
     632
     633// void halt(processor * this) with( this ) {
     634//      pthread_mutex_lock( &idle.lock );
     635
     636
     637
     638//      // SKULLDUGGERY: Even if spurious wake-up is a thing
     639//      // spuriously waking up a kernel thread is not a big deal
     640//      // if it is very rare.
     641//      pthread_cond_wait( &idle.cond, &idle.lock);
     642//      pthread_mutex_unlock( &idle.lock );
     643// }
     644
     645// void wake(processor * this) with( this ) {
     646//      pthread_mutex_lock  (&idle.lock);
     647//      pthread_cond_signal (&idle.cond);
     648//      pthread_mutex_unlock(&idle.lock);
     649// }
     650
     651//=============================================================================================
    606652// Unexpected Terminating logic
    607653//=============================================================================================
     
    609655
    610656static __spinlock_t kernel_abort_lock;
    611 static __spinlock_t kernel_debug_lock;
    612657static bool kernel_abort_called = false;
    613658
    614 void * kernel_abort    (void) __attribute__ ((__nothrow__)) {
     659void * kernel_abort(void) __attribute__ ((__nothrow__)) {
    615660        // abort cannot be recursively entered by the same or different processors because all signal handlers return when
    616661        // the globalAbort flag is true.
     
    618663
    619664        // first task to abort ?
    620         if ( ! kernel_abort_called ) {                  // not first task to abort ?
     665        if ( kernel_abort_called ) {                    // not first task to abort ?
     666                unlock( kernel_abort_lock );
     667
     668                sigset_t mask;
     669                sigemptyset( &mask );
     670                sigaddset( &mask, SIGALRM );            // block SIGALRM signals
     671                sigsuspend( &mask );                    // block the processor to prevent further damage during abort
     672                _exit( EXIT_FAILURE );                  // if processor unblocks before it is killed, terminate it
     673        }
     674        else {
    621675                kernel_abort_called = true;
    622676                unlock( kernel_abort_lock );
    623677        }
    624         else {
    625                 unlock( kernel_abort_lock );
    626 
    627                 sigset_t mask;
    628                 sigemptyset( &mask );
    629                 sigaddset( &mask, SIGALRM );                    // block SIGALRM signals
    630                 sigaddset( &mask, SIGUSR1 );                    // block SIGUSR1 signals
    631                 sigsuspend( &mask );                            // block the processor to prevent further damage during abort
    632                 _exit( EXIT_FAILURE );                          // if processor unblocks before it is killed, terminate it
    633         }
    634 
    635         return TL_GET( this_thread );
     678
     679        return kernelTLS.this_thread;
    636680}
    637681
     
    639683        thread_desc * thrd = kernel_data;
    640684
    641         int len = snprintf( abort_text, abort_text_size, "Error occurred while executing task %.256s (%p)", thrd->self_cor.name, thrd );
    642         __cfaabi_dbg_bits_write( abort_text, len );
    643 
    644         if ( get_coroutine(thrd) != TL_GET( this_coroutine ) ) {
    645                 len = snprintf( abort_text, abort_text_size, " in coroutine %.256s (%p).\n", TL_GET( this_coroutine )->name, TL_GET( this_coroutine ) );
     685        if(thrd) {
     686                int len = snprintf( abort_text, abort_text_size, "Error occurred while executing thread %.256s (%p)", thrd->self_cor.name, thrd );
    646687                __cfaabi_dbg_bits_write( abort_text, len );
     688
     689                if ( get_coroutine(thrd) != kernelTLS.this_coroutine ) {
     690                        len = snprintf( abort_text, abort_text_size, " in coroutine %.256s (%p).\n", kernelTLS.this_coroutine->name, kernelTLS.this_coroutine );
     691                        __cfaabi_dbg_bits_write( abort_text, len );
     692                }
     693                else {
     694                        __cfaabi_dbg_bits_write( ".\n", 2 );
     695                }
    647696        }
    648697        else {
    649                 __cfaabi_dbg_bits_write( ".\n", 2 );
     698                int len = snprintf( abort_text, abort_text_size, "Error occurred outside of any thread.\n" );
    650699        }
    651700}
    652701
    653702int kernel_abort_lastframe( void ) __attribute__ ((__nothrow__)) {
    654         return get_coroutine(TL_GET( this_thread )) == get_coroutine(mainThread) ? 4 : 2;
    655 }
     703        return get_coroutine(kernelTLS.this_thread) == get_coroutine(mainThread) ? 4 : 2;
     704}
     705
     706static __spinlock_t kernel_debug_lock;
    656707
    657708extern "C" {
     
    682733        if ( count < 0 ) {
    683734                // queue current task
    684                 append( waiting, (thread_desc *)TL_GET( this_thread ) );
     735                append( waiting, kernelTLS.this_thread );
    685736
    686737                // atomically release spin lock and block
     
    708759
    709760//-----------------------------------------------------------------------------
     761// Global Queues
     762void doregister( thread_desc & thrd ) {
     763        // lock      ( global_thread.lock );
     764        // push_front( global_thread.list, thrd );
     765        // unlock    ( global_thread.lock );
     766}
     767
     768void unregister( thread_desc & thrd ) {
     769        // lock  ( global_thread.lock );
     770        // remove( global_thread.list, thrd );
     771        // unlock( global_thread.lock );
     772}
     773
     774void doregister( cluster     & cltr ) {
     775        // lock      ( global_cluster.lock );
     776        // push_front( global_cluster.list, cltr );
     777        // unlock    ( global_cluster.lock );
     778}
     779
     780void unregister( cluster     & cltr ) {
     781        // lock  ( global_cluster.lock );
     782        // remove( global_cluster.list, cltr );
     783        // unlock( global_cluster.lock );
     784}
     785
     786
     787void doregister( cluster * cltr, processor * proc ) {
     788        // lock      (cltr->proc_list_lock __cfaabi_dbg_ctx2);
     789        // push_front(cltr->procs, *proc);
     790        // unlock    (cltr->proc_list_lock);
     791}
     792
     793void unregister( cluster * cltr, processor * proc ) {
     794        // lock  (cltr->proc_list_lock __cfaabi_dbg_ctx2);
     795        // remove(cltr->procs, *proc );
     796        // unlock(cltr->proc_list_lock);
     797}
     798
     799//-----------------------------------------------------------------------------
    710800// Debug
    711801__cfaabi_dbg_debug_do(
    712         struct {
    713                 thread_desc * tail;
    714         } __cfaabi_dbg_thread_list = { NULL };
    715 
    716         void __cfaabi_dbg_thread_register( thread_desc * thrd ) {
    717                 if( !__cfaabi_dbg_thread_list.tail ) {
    718                         __cfaabi_dbg_thread_list.tail = thrd;
    719                         return;
    720                 }
    721                 __cfaabi_dbg_thread_list.tail->dbg_next = thrd;
    722                 thrd->dbg_prev = __cfaabi_dbg_thread_list.tail;
    723                 __cfaabi_dbg_thread_list.tail = thrd;
    724         }
    725 
    726         void __cfaabi_dbg_thread_unregister( thread_desc * thrd ) {
    727                 thread_desc * prev = thrd->dbg_prev;
    728                 thread_desc * next = thrd->dbg_next;
    729 
    730                 if( next ) { next->dbg_prev = prev; }
    731                 else       {
    732                         assert( __cfaabi_dbg_thread_list.tail == thrd );
    733                         __cfaabi_dbg_thread_list.tail = prev;
    734                 }
    735 
    736                 if( prev ) { prev->dbg_next = next; }
    737 
    738                 thrd->dbg_prev = NULL;
    739                 thrd->dbg_next = NULL;
    740         }
    741 
    742802        void __cfaabi_dbg_record(__spinlock_t & this, const char * prev_name) {
    743803                this.prev_name = prev_name;
    744                 this.prev_thrd = TL_GET( this_thread );
     804                this.prev_thrd = kernelTLS.this_thread;
    745805        }
    746806)
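
kernel.c adds global_threads and global_clusters registries together with doregister/unregister hooks called from constructors and destructors; in this changeset the hook bodies are still commented out. A hedged C sketch of what the registration pattern would look like once enabled (the list and lock names are assumptions, not the real symbols):

    struct thr_sketch { struct { struct thr_sketch * next, * prev; } node; };
    static struct { struct thr_sketch * head; /* plus a __spinlock_t in the real code */ } threads_sketch;

    static void doregister_sketch( struct thr_sketch * t ) {
        /* lock( threads_sketch.lock ); */
        t->node.prev = 0;
        t->node.next = threads_sketch.head;
        if ( threads_sketch.head ) threads_sketch.head->node.prev = t;
        threads_sketch.head = t;
        /* unlock( threads_sketch.lock ); */
    }

    static void unregister_sketch( struct thr_sketch * t ) {
        /* lock( threads_sketch.lock ); */
        if ( t->node.prev ) t->node.prev->node.next = t->node.next;
        else                threads_sketch.head     = t->node.next;
        if ( t->node.next ) t->node.next->node.prev = t->node.prev;
        /* unlock( threads_sketch.lock ); */
    }
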
  • src/libcfa/concurrency/kernel_private.h

    r7d0a3ba r358cba0  
    100100#define KERNEL_STORAGE(T,X) static char storage_##X[sizeof(T)]
    101101
     102
     103void doregister( struct thread_desc & thrd );
     104void unregister( struct thread_desc & thrd );
     105
     106void doregister( struct cluster     & cltr );
     107void unregister( struct cluster     & cltr );
     108
     109void doregister( struct cluster * cltr, struct processor * proc );
     110void unregister( struct cluster * cltr, struct processor * proc );
     111
    102112// Local Variables: //
    103113// mode: c //
  • src/libcfa/concurrency/monitor.c

    r7d0a3ba r358cba0  
    8585                // Lock the monitor spinlock
    8686                lock( this->lock __cfaabi_dbg_ctx2 );
    87                 thread_desc * thrd = TL_GET( this_thread );
      87                // Interrupts disabled inside critical section
     88                thread_desc * thrd = kernelTLS.this_thread;
    8889
    8990                __cfaabi_dbg_print_safe( "Kernel : %10p Entering mon %p (%p)\n", thrd, this, this->owner);
     
    134135                // Lock the monitor spinlock
    135136                lock( this->lock __cfaabi_dbg_ctx2 );
    136                 thread_desc * thrd = TL_GET( this_thread );
      137                // Interrupts disabled inside critical section
     138                thread_desc * thrd = kernelTLS.this_thread;
    137139
    138140                __cfaabi_dbg_print_safe( "Kernel : %10p Entering dtor for mon %p (%p)\n", thrd, this, this->owner);
     
    168170
    169171                        // Create the node specific to this wait operation
    170                         wait_ctx_primed( TL_GET( this_thread ), 0 )
     172                        wait_ctx_primed( thrd, 0 )
    171173
    172174                        // Some one else has the monitor, wait for him to finish and then run
     
    179181                        __cfaabi_dbg_print_safe( "Kernel :  blocking \n" );
    180182
    181                         wait_ctx( TL_GET( this_thread ), 0 )
     183                        wait_ctx( thrd, 0 )
    182184                        this->dtor_node = &waiter;
    183185
     
    199201                lock( this->lock __cfaabi_dbg_ctx2 );
    200202
    201                 __cfaabi_dbg_print_safe( "Kernel : %10p Leaving mon %p (%p)\n", TL_GET( this_thread ), this, this->owner);
    202 
    203                 verifyf( TL_GET( this_thread ) == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", TL_GET( this_thread ), this->owner, this->recursion, this );
     203                __cfaabi_dbg_print_safe( "Kernel : %10p Leaving mon %p (%p)\n", kernelTLS.this_thread, this, this->owner);
     204
     205                verifyf( kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
    204206
    205207                // Leaving a recursion level, decrement the counter
     
    289291// Sorts monitors before entering
    290292void ?{}( monitor_guard_t & this, monitor_desc * m [], __lock_size_t count, fptr_t func ) {
     293        thread_desc * thrd = TL_GET( this_thread );
     294
    291295        // Store current array
    292296        this.m = m;
     
    297301
    298302        // Save previous thread context
    299         this.prev = TL_GET( this_thread )->monitors;
     303        this.prev = thrd->monitors;
    300304
    301305        // Update thread context (needed for conditions)
    302         (TL_GET( this_thread )->monitors){m, count, func};
     306        (thrd->monitors){m, count, func};
    303307
    304308        // __cfaabi_dbg_print_safe( "MGUARD : enter %d\n", count);
     
    328332// Sorts monitors before entering
    329333void ?{}( monitor_dtor_guard_t & this, monitor_desc * m [], fptr_t func ) {
     334        // optimization
     335        thread_desc * thrd = TL_GET( this_thread );
     336
    330337        // Store current array
    331338        this.m = *m;
    332339
    333340        // Save previous thread context
    334         this.prev = TL_GET( this_thread )->monitors;
     341        this.prev = thrd->monitors;
    335342
    336343        // Update thread context (needed for conditions)
    337         (TL_GET( this_thread )->monitors){m, 1, func};
     344        (thrd->monitors){m, 1, func};
    338345
    339346        __enter_monitor_dtor( this.m, func );
     
    473480
    474481        // Create the node specific to this wait operation
    475         wait_ctx_primed( TL_GET( this_thread ), 0 )
     482        wait_ctx_primed( kernelTLS.this_thread, 0 )
    476483
    477484        //save contexts
     
    566573
    567574                                // Create the node specific to this wait operation
    568                                 wait_ctx_primed( TL_GET( this_thread ), 0 );
     575                                wait_ctx_primed( kernelTLS.this_thread, 0 );
    569576
    570577                                // Save monitor states
     
    612619
    613620        // Create the node specific to this wait operation
    614         wait_ctx_primed( TL_GET( this_thread ), 0 );
     621        wait_ctx_primed( kernelTLS.this_thread, 0 );
    615622
    616623        monitor_save;
     
    618625
    619626        for( __lock_size_t i = 0; i < count; i++) {
    620                 verify( monitors[i]->owner == TL_GET( this_thread ) );
     627                verify( monitors[i]->owner == kernelTLS.this_thread );
    621628        }
    622629
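
The monitor changes follow two rules visible above: inside a critical section (spinlock held, interrupts disabled) the code reads kernelTLS.this_thread directly, while the public guard constructors keep using TL_GET but cache the result in a local before touching it several times. A tiny C sketch of the caching half (all _sketch names are hypothetical):

    struct monitor_ctx_sketch { void * list; int count; };
    struct thread_mon_sketch  { struct monitor_ctx_sketch monitors; };
    static __thread struct thread_mon_sketch * tls_this_thread_sketch;

    struct guard_sketch { struct monitor_ctx_sketch prev; };

    static void guard_ctor_sketch( struct guard_sketch * this, void * m, int count ) {
        struct thread_mon_sketch * thrd = tls_this_thread_sketch;  // one TLS read, reused below
        this->prev = thrd->monitors;                                // save previous thread context
        thrd->monitors.list  = m;                                   // install the new context
        thrd->monitors.count = count;
    }
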
  • src/libcfa/concurrency/preemption.c

    r7d0a3ba r358cba0  
    149149        // Disable interrupts by incrementing the counter
    150150        void disable_interrupts() {
    151                 with( TL_GET( preemption_state ) ) {
     151                with( kernelTLS.preemption_state ) {
    152152                        enabled = false;
    153153                        __attribute__((unused)) unsigned short new_val = disable_count + 1;
     
    160160        // If counter reaches 0, execute any pending CtxSwitch
    161161        void enable_interrupts( __cfaabi_dbg_ctx_param ) {
    162                 processor   * proc = TL_GET( this_processor ); // Cache the processor now since interrupts can start happening after the atomic add
    163                 thread_desc * thrd = TL_GET( this_thread );       // Cache the thread now since interrupts can start happening after the atomic add
    164 
    165                 with( TL_GET( preemption_state ) ){
     162                processor   * proc = kernelTLS.this_processor; // Cache the processor now since interrupts can start happening after the atomic add
     163                thread_desc * thrd = kernelTLS.this_thread;       // Cache the thread now since interrupts can start happening after the atomic add
     164
     165                with( kernelTLS.preemption_state ){
    166166                        unsigned short prev = disable_count;
    167167                        disable_count -= 1;
     
    185185        // Don't execute any pending CtxSwitch even if counter reaches 0
    186186        void enable_interrupts_noPoll() {
    187                 unsigned short prev = TL_GET( preemption_state ).disable_count;
    188                 TL_GET( preemption_state ).disable_count -= 1;
     187                unsigned short prev = kernelTLS.preemption_state.disable_count;
     188                kernelTLS.preemption_state.disable_count -= 1;
    189189        verifyf( prev != 0u, "Incremented from %u\n", prev );                     // If this triggers, someone enabled already-enabled interrupts
    190190                if( prev == 1 ) {
    191                         TL_GET( preemption_state ).enabled = true;
     191                        kernelTLS.preemption_state.enabled = true;
    192192                }
    193193        }
     
    234234}
    235235
    236 
     236// KERNEL ONLY
    237237// Check if a CtxSwitch signal handler should defer
    238238// If true  : preemption is safe
    239239// If false : preemption is unsafe and marked as pending
    240240static inline bool preemption_ready() {
    241         bool ready = TL_GET( preemption_state ).enabled && !TL_GET( preemption_state ).in_progress; // Check if preemption is safe
    242         TL_GET( this_processor )->pending_preemption = !ready;                  // Adjust the pending flag accordingly
     241        // Check if preemption is safe
     242        bool ready = kernelTLS.preemption_state.enabled && ! kernelTLS.preemption_state.in_progress;
     243
     244        // Adjust the pending flag accordingly
     245        kernelTLS.this_processor->pending_preemption = !ready;
    243246        return ready;
    244247}
     
    254257
    255258        // Start with preemption disabled until ready
    256         TL_GET( preemption_state ).enabled = false;
    257         TL_GET( preemption_state ).disable_count = 1;
     259        kernelTLS.preemption_state.enabled = false;
     260        kernelTLS.preemption_state.disable_count = 1;
    258261
    259262        // Initialize the event kernel
     
    320323        // before the kernel thread has even started running. When that happens, an interrupt
    321324        // with a null 'this_processor' will be caught; just ignore it.
    322         if(!TL_GET( this_processor )) return;
     325        if(! kernelTLS.this_processor ) return;
    323326
    324327        choose(sfp->si_value.sival_int) {
    325328                case PREEMPT_NORMAL   : ;// Normal case, nothing to do here
    326                 case PREEMPT_TERMINATE: verify(TL_GET( this_processor )->do_terminate);
     329                case PREEMPT_TERMINATE: verify( kernelTLS.this_processor->do_terminate);
    327330                default:
    328331                        abort( "internal error, signal value is %d", sfp->si_value.sival_int );
     
    332335        if( !preemption_ready() ) { return; }
    333336
    334         __cfaabi_dbg_print_buffer_decl( " KERNEL: preempting core %p (%p).\n", TL_GET( this_processor ), TL_GET( this_thread ) );
    335 
    336         TL_GET( preemption_state ).in_progress = true;  // Sync flag : prevent recursive calls to the signal handler
    337         signal_unblock( SIGUSR1 );                          // We are about to CtxSwitch out of the signal handler, let other handlers in
    338         TL_GET( preemption_state ).in_progress = false; // Clear the in progress flag
     337        __cfaabi_dbg_print_buffer_decl( " KERNEL: preempting core %p (%p).\n", kernelTLS.this_processor, kernelTLS.this_thread );
     338
     339        // Sync flag : prevent recursive calls to the signal handler
     340        kernelTLS.preemption_state.in_progress = true;
     341
     342        // We are about to CtxSwitch out of the signal handler, let other handlers in
     343        signal_unblock( SIGUSR1 );
     344
     345        // TODO: this should go in finish action
     346        // Clear the in progress flag
     347        kernelTLS.preemption_state.in_progress = false;
    339348
    340349        // Preemption can occur here
    341350
    342         BlockInternal( (thread_desc*)TL_GET( this_thread ) ); // Do the actual CtxSwitch
     351        BlockInternal( kernelTLS.this_thread ); // Do the actual CtxSwitch
    343352}
    344353
     
    348357        // Block sigalrms to control when they arrive
    349358        sigset_t mask;
     359        sigfillset(&mask);
     360        if ( pthread_sigmask( SIG_BLOCK, &mask, NULL ) == -1 ) {
     361            abort( "internal error, pthread_sigmask" );
     362        }
     363
    350364        sigemptyset( &mask );
    351365        sigaddset( &mask, SIGALRM );
    352 
    353         if ( pthread_sigmask( SIG_BLOCK, &mask, NULL ) == -1 ) {
    354             abort( "internal error, pthread_sigmask" );
    355         }
    356366
    357367        // Main loop
     
    409419
    410420void __cfaabi_check_preemption() {
    411         bool ready = TL_GET( preemption_state ).enabled;
     421        bool ready = kernelTLS.preemption_state.enabled;
    412422        if(!ready) { abort("Preemption should be ready"); }
    413423
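
preemption.c now manipulates kernelTLS.preemption_state directly. The state is a nesting counter plus an enabled flag: every disable bumps the counter, and only the outermost enable re-arms preemption (and, in the real enable_interrupts(), runs any pending context switch). A self-contained C sketch of that counter discipline (the _sketch names are assumptions):

    #include <stdbool.h>

    static __thread struct {
        volatile bool  enabled;
        unsigned short disable_count;
    } preempt_sketch = { true, 0 };

    static void disable_interrupts_sketch( void ) {
        preempt_sketch.enabled = false;
        preempt_sketch.disable_count += 1;     // nested disables just increment the counter
    }

    static void enable_interrupts_sketch( void ) {
        unsigned short prev = preempt_sketch.disable_count;
        preempt_sketch.disable_count -= 1;
        if ( prev == 1 ) {                     // outermost enable
            preempt_sketch.enabled = true;
            /* the real code also checks for a pending CtxSwitch here */
        }
    }
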
  • src/libcfa/concurrency/thread.c

    r7d0a3ba r358cba0  
    3939        curr_cluster = &cl;
    4040        next = NULL;
    41         __cfaabi_dbg_debug_do(
    42                 dbg_next = NULL;
    43                 dbg_prev = NULL;
    44                 __cfaabi_dbg_thread_register(&this);
    45         )
     41
     42        node.next = NULL;
     43        node.prev = NULL;
     44        doregister(this);
    4645
    4746        monitors{ &self_mon_p, 1, (fptr_t)0 };
     
    4948
    5049void ^?{}(thread_desc& this) with( this ) {
     50        unregister(this);
    5151        ^self_cor{};
    5252}
     
    8181        disable_interrupts();
    8282        create_stack(&thrd_c->stack, thrd_c->stack.size);
    83         TL_SET( this_coroutine, thrd_c );
     83        kernelTLS.this_coroutine = thrd_c;
    8484        CtxStart(&this, CtxInvokeThread);
    8585        assert( thrd_c->last->stack.context );
     
    9191
    9292extern "C" {
     93        // KERNEL ONLY
    9394        void __finish_creation(void) {
    94                 coroutine_desc* thrd_c = TL_GET( this_coroutine );
     95                coroutine_desc* thrd_c = kernelTLS.this_coroutine;
    9596                ThreadCtxSwitch( thrd_c, thrd_c->last );
    9697        }
     
    9899
    99100void yield( void ) {
    100         verify( TL_GET( preemption_state ).enabled );
     101        // Safety note : This could cause some false positives due to preemption
     102      verify( TL_GET( preemption_state.enabled ) );
    101103        BlockInternal( TL_GET( this_thread ) );
    102         verify( TL_GET( preemption_state ).enabled );
     104        // Safety note : This could cause some false positives due to preemption
     105      verify( TL_GET( preemption_state.enabled ) );
    103106}
    104107
     
    109112}
    110113
     114// KERNEL ONLY
    111115void ThreadCtxSwitch(coroutine_desc* src, coroutine_desc* dst) {
    112116        // set state of current coroutine to inactive
     
    116120        // set new coroutine that the processor is executing
    117121        // and context switch to it
    118         TL_SET( this_coroutine, dst );
     122        kernelTLS.this_coroutine = dst;
    119123        assert( src->stack.context );
    120124        CtxSwitch( src->stack.context, dst->stack.context );
    121         TL_SET( this_coroutine, src );
     125        kernelTLS.this_coroutine = src;
    122126
    123127        // set state of new coroutine to active
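
thread.c mirrors the kernel.c changes: the thread constructor initialises the node links and calls doregister, the destructor calls unregister before the coroutine is destroyed, and ThreadCtxSwitch updates kernelTLS.this_coroutine on both sides of the raw CtxSwitch. A short sketch of the constructor/destructor pairing (hypothetical names; the registry stubs stand in for the real hooks):

    struct thr2_sketch { struct { struct thr2_sketch * next, * prev; } node; };

    static void doregister_sk( struct thr2_sketch * t ) { (void)t; /* push onto the global list */ }
    static void unregister_sk( struct thr2_sketch * t ) { (void)t; /* remove from the global list */ }

    static void thread_ctor_sketch( struct thr2_sketch * this ) {
        this->node.next = 0;        // links start detached
        this->node.prev = 0;
        doregister_sk( this );      // visible on the global thread list from construction
    }

    static void thread_dtor_sketch( struct thr2_sketch * this ) {
        unregister_sk( this );      // removed before the rest of the teardown
    }
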