Context Navigation

Reverse Diff

kernel.cfa [c9c1c1cb:ae7adbc4]

File:

: 1 edited

libcfa/src/concurrency/kernel.cfa (modified) (18 diffs)

Legend:

: Unmodified
: Added
: Removed

libcfa/src/concurrency/kernel.cfa

-              rc9c1c1cb
+              rae7adbc4
 #if !defined(__CFA_NO_STATISTICS__)
         #define __STATS_DEF( ...) __VA_ARGS__
+        #define __STATS( ...) __VA_ARGS__
 #else
         #define __STATS_DEF( ...)
+        #define __STATS( ...)
 #endif
 …
 static thread$ * __next_thread(cluster * this);
 static thread$ * __next_thread_slow(cluster * this);
-static thread$ * __next_thread_search(cluster * this);
 static inline bool __must_unpark( thread$ * thrd ) __attribute((nonnull(1)));
 static void __run_thread(processor * this, thread$ * dst);
 …
                 MAIN_LOOP:
                 for() {
+                        #define OLD_MAIN 1
+                        #if OLD_MAIN
                         // Check if there is pending io
                         __maybe_io_drain( this );
 …
                         if( !readyThread ) {
-                                __IO_STATS__(true, io.flush.idle++; )
                                 __cfa_io_flush( this, 0 );
-                                readyThread = __next_thread( this->cltr );
+                        }
-                        if( !readyThread ) for(5) {
-                                __IO_STATS__(true, io.flush.idle++; )
                                 readyThread = __next_thread_slow( this->cltr );
-                                if( readyThread ) break;
-                                __cfa_io_flush( this, 0 );
+                        }
 …
                                 if( __atomic_load_n(&this->do_terminate, __ATOMIC_SEQ_CST) ) break MAIN_LOOP;
+                                #if !defined(__CFA_NO_STATISTICS__)
+                                        __tls_stats()->ready.sleep.halts++;
+                                #endif
                                 // Push self to idle stack
                                 if(!mark_idle(this->cltr->procs, * this)) continue MAIN_LOOP;
                                 // Confirm the ready-queue is empty
                                 readyThread = __next_thread_search( this->cltr );
+                                readyThread = __next_thread_slow( this->cltr );
                                 if( readyThread ) {
                                         // A thread was found, cancel the halt
                                         mark_awake(this->cltr->procs, * this);
+                                        __STATS__(true, ready.sleep.cancels++; )
+                                        #if !defined(__CFA_NO_STATISTICS__)
+                                                __tls_stats()->ready.sleep.cancels++;
+                                        #endif
                                         // continue the main loop
 …
                         if(this->io.pending && !this->io.dirty) {
-                                __IO_STATS__(true, io.flush.dirty++; )
                                 __cfa_io_flush( this, 0 );
+                        }
+                        #else
+                                #warning new kernel loop
+                        SEARCH: {
+                                /* paranoid */ verify( ! __preemption_enabled() );
+                                // First, lock the scheduler since we are searching for a thread
+                                ready_schedule_lock();
+                                // Try to get the next thread
+                                readyThread = pop_fast( this->cltr );
+                                if(readyThread) { ready_schedule_unlock(); break SEARCH; }
+                                // If we can't find a thread, might as well flush any outstanding I/O
+                                if(this->io.pending) { __cfa_io_flush( this, 0 ); }
+                                // Spin a little on I/O, just in case
+                                for(5) {
+                                        __maybe_io_drain( this );
+                                        readyThread = pop_fast( this->cltr );
+                                        if(readyThread) { ready_schedule_unlock(); break SEARCH; }
+                                }
+                                // no luck, try stealing a few times
+                                for(5) {
+                                        if( __maybe_io_drain( this ) ) {
+                                                readyThread = pop_fast( this->cltr );
+                                        } else {
+                                                readyThread = pop_slow( this->cltr );
+                                        }
+                                        if(readyThread) { ready_schedule_unlock(); break SEARCH; }
+                                }
+                                // still no luck, search for a thread
+                                readyThread = pop_search( this->cltr );
+                                if(readyThread) { ready_schedule_unlock(); break SEARCH; }
+                                // Don't block if we are done
+                                if( __atomic_load_n(&this->do_terminate, __ATOMIC_SEQ_CST) ) {
+                                        ready_schedule_unlock();
+                                        break MAIN_LOOP;
+                                }
+                                __STATS( __tls_stats()->ready.sleep.halts++; )
+                                // Push self to idle stack
+                                ready_schedule_unlock();
+                                if(!mark_idle(this->cltr->procs, * this)) goto SEARCH;
+                                ready_schedule_lock();
+                                // Confirm the ready-queue is empty
+                                __maybe_io_drain( this );
+                                readyThread = pop_search( this->cltr );
+                                ready_schedule_unlock();
+                                if( readyThread ) {
+                                        // A thread was found, cancel the halt
+                                        mark_awake(this->cltr->procs, * this);
+                                        __STATS( __tls_stats()->ready.sleep.cancels++; )
+                                        // continue the main loop
+                                        break SEARCH;
+                                }
+                                __STATS( if(this->print_halts) __cfaabi_bits_print_safe( STDOUT_FILENO, "PH:%d - %lld 0\n", this->unique_id, rdtscl()); )
+                                __cfadbg_print_safe(runtime_core, "Kernel : core %p waiting on eventfd %d\n", this, this->idle_fd);
+                                {
+                                        eventfd_t val;
+                                        ssize_t ret = read( this->idle_fd, &val, sizeof(val) );
+                                        if(ret < 0) {
+                                                switch((int)errno) {
+                                                case EAGAIN:
+                                                #if EAGAIN != EWOULDBLOCK
+                                                        case EWOULDBLOCK:
+                                                #endif
+                                                case EINTR:
+                                                        // No need to do anything special here, just assume it's a legitimate wake-up
+                                                        break;
+                                                default:
+                                                        abort( "KERNEL : internal error, read failure on idle eventfd, error(%d) %s.", (int)errno, strerror( (int)errno ) );
+                                                }
+                                        }
+                                }
+                                        __STATS( if(this->print_halts) __cfaabi_bits_print_safe( STDOUT_FILENO, "PH:%d - %lld 1\n", this->unique_id, rdtscl()); )
+                                // We were woken up, remove self from idle
+                                mark_awake(this->cltr->procs, * this);
+                                // DON'T just proceed, start looking again
+                                continue MAIN_LOOP;
+                        }
+                RUN_THREAD:
+                        /* paranoid */ verify( ! __preemption_enabled() );
+                        /* paranoid */ verify( readyThread );
+                        // Reset io dirty bit
+                        this->io.dirty = false;
+                        // We found a thread run it
+                        __run_thread(this, readyThread);
+                        // Are we done?
+                        if( __atomic_load_n(&this->do_terminate, __ATOMIC_SEQ_CST) ) break MAIN_LOOP;
+                        if(this->io.pending && !this->io.dirty) {
+                                __cfa_io_flush( this, 0 );
+                        }
+                        ready_schedule_lock();
+                        __maybe_io_drain( this );
+                        ready_schedule_unlock();
+                        #endif
+                }
 …
                                 break RUNNING;
                         case TICKET_UNBLOCK:
+                                __STATS__(true, ready.threads.threads++; )
+                                #if !defined(__CFA_NO_STATISTICS__)
+                                        __tls_stats()->ready.threads.threads++;
+                                #endif
                                 // This is case 2, the racy case, someone tried to run this thread before it finished blocking
                                 // In this case, just run it again.
 …
         __cfadbg_print_safe(runtime_core, "Kernel : core %p finished running thread %p\n", this, thrd_dst);
+        __STATS__(true, ready.threads.threads--; )
+        #if !defined(__CFA_NO_STATISTICS__)
+                __tls_stats()->ready.threads.threads--;
+        #endif
         /* paranoid */ verify( ! __preemption_enabled() );
 …
         thread$ * thrd_src = kernelTLS().this_thread;
         __STATS_DEF( thrd_src->last_proc = kernelTLS().this_processor; )
+        __STATS( thrd_src->last_proc = kernelTLS().this_processor; )
         // Run the thread on this processor
 …
         /* paranoid */ verify( 0x0D15EA5E0D15EA5Ep == thrd->canary );
+        const bool local = thrd->state != Start;
         if (thrd->preempted == __NO_PREEMPTION) thrd->state = Ready;
         // Dereference the thread now because once we push it, there is no guarantee it's still valid.
         struct cluster * cl = thrd->curr_cluster;
         __STATS_DEF(bool outside = hint == UNPARK_LOCAL && thrd->last_proc && thrd->last_proc != kernelTLS().this_processor; )
+        __STATS(bool outside = hint == UNPARK_LOCAL && thrd->last_proc && thrd->last_proc != kernelTLS().this_processor; )
         // push the thread to the cluster ready-queue
 …
         ready_schedule_lock();
+                thread$ * thrd = pop_slow( this );
+        ready_schedule_unlock();
+        /* paranoid */ verify( ! __preemption_enabled() );
+        return thrd;
+}
+// KERNEL ONLY
+static inline thread$ * __next_thread_search(cluster * this) with( *this ) {
+        /* paranoid */ verify( ! __preemption_enabled() );
+        ready_schedule_lock();
+                thread$ * thrd = pop_search( this );
+                thread$ * thrd;
+                for(25) {
+                        thrd = pop_slow( this );
+                        if(thrd) goto RET;
+                }
+                thrd = pop_search( this );
+                RET:
         ready_schedule_unlock();
 …
 // Wake a thread from the front if there are any
 static void __wake_one(cluster * this) {
+        /* paranoid */ verify( ! __preemption_enabled() );
+        /* paranoid */ verify( ready_schedule_islocked() );
+        // Check if there is a sleeping processor
+        // int fd = __atomic_load_n(&this->procs.fd, __ATOMIC_SEQ_CST);
+        int fd = 0;
+        if( __atomic_load_n(&this->procs.fd, __ATOMIC_SEQ_CST) != 0 ) {
+                fd = __atomic_exchange_n(&this->procs.fd, 0, __ATOMIC_RELAXED);
+        }
+        // If no one is sleeping, we are done
+        if( fd == 0 ) return;
+        // We found a processor, wake it up
         eventfd_t val;
+        /* paranoid */ verify( ! __preemption_enabled() );
+        /* paranoid */ verify( ready_schedule_islocked() );
+        // Check if there is a sleeping processor
+        struct __fd_waitctx * fdp = __atomic_load_n(&this->procs.fdw, __ATOMIC_SEQ_CST);
+        // If no one is sleeping: we are done
+        if( fdp == 0p ) return;
+        int fd = 1;
+        if( __atomic_load_n(&fdp->fd, __ATOMIC_SEQ_CST) != 1 ) {
+                fd = __atomic_exchange_n(&fdp->fd, 1, __ATOMIC_RELAXED);
+        }
+        switch(fd) {
+        case 0:
+                // If the processor isn't ready to sleep then the exchange will already wake it up
+                #if !defined(__CFA_NO_STATISTICS__)
+                        if( kernelTLS().this_stats ) { __tls_stats()->ready.sleep.early++;
+                        } else { __atomic_fetch_add(&this->stats->ready.sleep.early, 1, __ATOMIC_RELAXED); }
+                #endif
+                break;
+        case 1:
+                // If someone else already said they will wake them: we are done
+                #if !defined(__CFA_NO_STATISTICS__)
+                        if( kernelTLS().this_stats ) { __tls_stats()->ready.sleep.seen++;
+                        } else { __atomic_fetch_add(&this->stats->ready.sleep.seen, 1, __ATOMIC_RELAXED); }
+                #endif
+                break;
+        default:
+                // If the processor was ready to sleep, we need to wake it up with an actual write
+                val = 1;
+                eventfd_write( fd, val );
+                #if !defined(__CFA_NO_STATISTICS__)
+                        if( kernelTLS().this_stats ) { __tls_stats()->ready.sleep.wakes++;
+                        } else { __atomic_fetch_add(&this->stats->ready.sleep.wakes, 1, __ATOMIC_RELAXED); }
+                #endif
+                break;
+        }
+        val = 1;
+        eventfd_write( fd, val );
+        #if !defined(__CFA_NO_STATISTICS__)
+                if( kernelTLS().this_stats ) {
+                        __tls_stats()->ready.sleep.wakes++;
+                }
+                else {
+                        __atomic_fetch_add(&this->stats->ready.sleep.wakes, 1, __ATOMIC_RELAXED);
+                }
+        #endif
         /* paranoid */ verify( ready_schedule_islocked() );
 …
         __cfadbg_print_safe(runtime_core, "Kernel : waking Processor %p\n", this);
-        this->idle_wctx.fd = 1;
         eventfd_t val;
 …
 static void idle_sleep(processor * this, io_future_t & future, iovec & iov) {
-        // Tell everyone we are ready to go do sleep
-        for() {
-                int expected = this->idle_wctx.fd;
-                // Someone already told us to wake-up! No time for a nap.
-                if(expected == 1) { return; }
-                // Try to mark that we are going to sleep
-                if(__atomic_compare_exchange_n(&this->idle_wctx.fd, &expected, this->idle_fd, false,  __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST) ) {
-                        // Every one agreed, taking a nap
-                        break;
+                }
+        }
         #if !defined(CFA_WITH_IO_URING_IDLE)
                 #if !defined(__CFA_NO_STATISTICS__)
 …
 static bool mark_idle(__cluster_proc_list & this, processor & proc) {
-        __STATS__(true, ready.sleep.halts++; )
-        proc.idle_wctx.fd = 0;
         /* paranoid */ verify( ! __preemption_enabled() );
         if(!try_lock( this )) return false;
 …
                 insert_first(this.idles, proc);
                 __atomic_store_n(&this.fdw, &proc.idle_wctx, __ATOMIC_SEQ_CST);
+                __atomic_store_n(&this.fd, proc.idle_fd, __ATOMIC_SEQ_CST);
         unlock( this );
         /* paranoid */ verify( ! __preemption_enabled() );
 …
+                {
                         struct __fd_waitctx * wctx = 0;
                         if(!this.idles`isEmpty) wctx = &this.idles`first.idle_wctx;
                         __atomic_store_n(&this.fdw, wctx, __ATOMIC_SEQ_CST);
+                        int fd = 0;
+                        if(!this.idles`isEmpty) fd = this.idles`first.idle_fd;
+                        __atomic_store_n(&this.fd, fd, __ATOMIC_SEQ_CST);
+                }
 …
                 unsigned tail = *ctx->cq.tail;
                 if(head == tail) return false;
+                ready_schedule_lock();
+                ret = __cfa_io_drain( proc );
+                ready_schedule_unlock();
+                #if OLD_MAIN
+                        ready_schedule_lock();
+                        ret = __cfa_io_drain( proc );
+                        ready_schedule_unlock();
+                #else
+                        ret = __cfa_io_drain( proc );
+                #endif
         #endif
         return ret;

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changes in libcfa/src/concurrency/kernel.cfa [c9c1c1cb:ae7adbc4]

Legend:

libcfa/src/concurrency/kernel.cfa

Download in other formats: