source: libcfa/src/concurrency/preemption.cfa @ 250583e

ADTast-experimentalenumforall-pointer-decaypthread-emulationqualifiedEnum
Last change on this file since 250583e was 250583e, checked in by Thierry Delisle <tdelisle@…>, 2 years ago

Some clean-up after preemption fix

  • Property mode set to 100644
File size: 26.4 KB
RevLine 
[c81ebf9]1//
2// Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo
3//
4// The contents of this file are covered under the licence agreement in the
5// file "LICENCE" distributed with Cforall.
6//
7// signal.c --
8//
9// Author           : Thierry Delisle
10// Created On       : Mon Jun 5 14:20:42 2017
[6b0b624]11// Last Modified By : Peter A. Buhr
[231b18f]12// Last Modified On : Fri Nov  6 07:42:13 2020
13// Update Count     : 54
[c81ebf9]14//
15
[2026bb6]16#define __cforall_thread__
[43784ac]17#define _GNU_SOURCE
18
[1c6e1ec]19// #define __CFA_DEBUG_PRINT_PREEMPTION__
[2026bb6]20
[73abe95]21#include "preemption.hfa"
[c457dc41]22
[a83ffa4]23#include <assert.h>
[c81ebf9]24
[82ff5845]25#include <errno.h>
26#include <stdio.h>
27#include <string.h>
28#include <unistd.h>
[27f5f71]29#include <limits.h>                                                                             // PTHREAD_STACK_MIN
[c81ebf9]30
[c457dc41]31#include "bits/debug.hfa"
[73abe95]32#include "bits/signal.hfa"
[e660761]33#include "kernel_private.hfa"
[82ff5845]34
[1c6e1ec]35
[d8548e2]36#if !defined(__CFA_DEFAULT_PREEMPTION__)
[2a84d06d]37#define __CFA_DEFAULT_PREEMPTION__ 10`ms
[d8548e2]38#endif
[c81ebf9]39
// Default preemption rate, overridable by the application (weak symbol).
// Reads the environment variable CFA_DEFAULT_PREEMPTION as a decimal number of milliseconds in [0, 65535].
// Falls back to __CFA_DEFAULT_PREEMPTION__ when the variable is missing, out of range, empty, or not a
// clean decimal number.
__attribute__((weak)) Duration default_preemption() {
	const char * preempt_rate_s = getenv("CFA_DEFAULT_PREEMPTION");
	if(!preempt_rate_s) {
		__cfadbg_print_safe(preemption, "No CFA_DEFAULT_PREEMPTION in ENV\n");
		return __CFA_DEFAULT_PREEMPTION__;
	}

	char * endptr = 0p;
	long int preempt_rate_l = strtol(preempt_rate_s, &endptr, 10);
	// Overflow/underflow in strtol saturates to LONG_MAX/LONG_MIN, which this range check also rejects
	if(preempt_rate_l < 0 || preempt_rate_l > 65535) {
		__cfadbg_print_safe(preemption, "CFA_DEFAULT_PREEMPTION out of range : %ld\n", preempt_rate_l);
		return __CFA_DEFAULT_PREEMPTION__;
	}
	// endptr == start means strtol consumed no digits at all (empty or whitespace-only value);
	// without this test such a value would be accepted as 0 and silently turn preemption off.
	if(endptr == preempt_rate_s || '\0' != *endptr) {
		__cfadbg_print_safe(preemption, "CFA_DEFAULT_PREEMPTION not a decimal number : %s\n", preempt_rate_s);
		return __CFA_DEFAULT_PREEMPTION__;
	}

	return preempt_rate_l`ms;
}
60
[969b3fe]61// FwdDeclarations : timeout handlers
[c81ebf9]62static void preempt( processor   * this );
[e84ab3d]63static void timeout( thread$ * this );
[c81ebf9]64
[969b3fe]65// FwdDeclarations : Signal handlers
[c29c342]66static void sigHandler_ctxSwitch( __CFA_SIGPARMS__ );
[c59a346]67static void sigHandler_alarm    ( __CFA_SIGPARMS__ );
[c29c342]68static void sigHandler_segv     ( __CFA_SIGPARMS__ );
69static void sigHandler_ill      ( __CFA_SIGPARMS__ );
70static void sigHandler_fpe      ( __CFA_SIGPARMS__ );
71static void sigHandler_abort    ( __CFA_SIGPARMS__ );
[82ff5845]72
[969b3fe]73// FwdDeclarations : alarm thread main
[c29c342]74static void * alarm_loop( __attribute__((unused)) void * args );
[969b3fe]75
76// Machine specific register name
// CFA_REG_IP is the member of uc_mcontext that holds the interrupted instruction pointer;
// the SIGUSR1 handler reads cxt->uc_mcontext.CFA_REG_IP to learn where the signal landed.
[381fdee]77#if   defined( __i386 )
[b2b44d8]78#define CFA_REG_IP gregs[REG_EIP]
[381fdee]79#elif defined( __x86_64 )
80#define CFA_REG_IP gregs[REG_RIP]
[e9b49379]81#elif defined( __arm__ )
82#define CFA_REG_IP arm_pc
83#elif defined( __aarch64__ )
[482fa08]84#define CFA_REG_IP pc
[381fdee]85#else
[e9b49379]86#error unsupported hardware architecture
[cd17862]87#endif
88
[969b3fe]89KERNEL_STORAGE(event_kernel_t, event_kernel);         // private storage for event kernel
90event_kernel_t * event_kernel;                        // kernel public handle to event kernel, assigned in __kernel_alarm_startup
91static pthread_t alarm_thread;                        // pthread handle to alarm thread
[09d4b22]92static void * alarm_stack;                                                        // pthread stack for alarm thread, as returned by __create_pthread
[969b3fe]93
// Constructor for the event kernel: default-construct the alarm list, then the lock.
static void ?{}(event_kernel_t & this) {
	(this.alarms){};
	(this.lock){};
}
[82ff5845]98
// Integer payload attached to the SIGUSR1 preemption signal (read back from si_value.sival_int by the handler).
[4dad189]99enum {
100        PREEMPT_NORMAL    = 0,  // regular preemption request, sent by preempt()
101        PREEMPT_TERMINATE = 1,  // the handler expects the processor's do_terminate flag to be set
102};
103
[c81ebf9]104//=============================================================================================
105// Kernel Preemption logic
106//=============================================================================================
107
// Pop and return the head of the alarm list if its deadline is strictly before currtime.
// Returns null when the list is empty or when the head has not expired yet.
static inline alarm_node_t * get_expired( alarm_list_t * alarms, Time currtime ) {
	// Short-circuit: the head's deadline is only inspected once the list is known to be non-empty
	if( ( ! & (*alarms)`first ) || ( (*alarms)`first.timeval >= currtime ) ) {
		return 0p;
	}

	return pop(alarms);
}
114
115// Tick one frame of the Discrete Event Simulation for alarms:
// fire every alarm whose deadline is before the current time, re-queue the periodic ones,
// then re-arm the kernel timer for the earliest alarm that is still pending (if any).
[e873838]116static void tick_preemption(void) {
[27f5f71]117        alarm_node_t * node = 0p;                                                       // Used in the while loop but cannot be declared in the while condition
118        alarm_list_t * alarms = &event_kernel->alarms;          // Local copy for ease of reading
119        Time currtime = __kernel_get_time();                            // Check current time once so everything "happens at once"
[8cb529e]120
[969b3fe]121        // Loop through everything that has expired (the assignment in the condition is intentional)
122        while( node = get_expired( alarms, currtime ) ) {
[c9ec301]123                __cfadbg_print_buffer_decl( preemption, " KERNEL: preemption tick %lu\n", currtime.tn);
                // Read the period before dispatching: it drives both the one-shot handling here and the re-insert below
[185efe6]124                Duration period = node->period;
125                if( period == 0) {
126                        node->set = false;                  // Node is one-shot, just mark it as not pending
127                }
[1c273d0]128
[c9ec301]129                __cfadbg_print_buffer_local( preemption, " KERNEL: alarm ticking node %p.\n", node );
130
131
[969b3fe]132                // Dispatch on the alarm type: Kernel alarms signal a processor,
                // User alarms unpark a thread, any other type runs the node's callback
[4b30e8cc]133                if( node->type == Kernel ) {
[c81ebf9]134                        preempt( node->proc );
135                }
[4b30e8cc]136                else if( node->type == User ) {
[c9ec301]137                        __cfadbg_print_buffer_local( preemption, " KERNEL: alarm unparking %p.\n", node->thrd );
[e873838]138                        timeout( node->thrd );
[c81ebf9]139                }
[4b30e8cc]140                else {
[eeb5023]141                        node->callback(*node);
[4b30e8cc]142                }
[c81ebf9]143
[969b3fe]144                // Check if this is a periodic alarm
[8cb529e]145                if( period > 0 ) {
[c9ec301]146                        __cfadbg_print_buffer_local( preemption, " KERNEL: alarm period is %lu.\n", period`ns );
[c457dc41]147                        node->timeval = currtime + period;  // Alarm is periodic, add currtime to it (used cached current time)
[969b3fe]148                        insert( alarms, node );             // Reinsert the node for the next time it triggers
[c81ebf9]149                }
150        }
151
[969b3fe]152        // If there are still alarms pending, reset the timer to fire when the earliest one is due
[d3ab183]153        if( & (*alarms)`first ) {
[c457dc41]154                Duration delta = (*alarms)`first.timeval - currtime;
155                __kernel_set_timer( delta );
[b1a4300]156        }
[c81ebf9]157}
158
// Change the preemption period of a processor.
//  - duration > 0  : (re)register the processor's preemption alarm with that period, unless it is
//                    already registered with exactly that period
//  - duration == 0 : unregister the alarm if it is currently set
//  - otherwise     : nothing happens
void update_preemption( processor * this, Duration duration ) {
	alarm_node_t * node = this->preemption_alarm;

	if ( duration > 0 ) {
		bool rearm = false;
		if ( ! node->set ) {
			// Alarm is not registered yet, it simply needs to be enabled
			rearm = true;
		}
		else if ( node->period != duration ) {
			// Alarm is registered with a different period, take it out before changing it
			unregister_self( node );
			rearm = true;
		}

		if ( rearm ) {
			node->initial = duration;
			node->period  = duration;
			register_self( node );
		}
	}
	else if ( duration == 0 && node->set ) {
		// Zero duration but alarm is set
		unregister_self( node );
		node->initial = 0;
		node->period  = 0;
	}
}
183
184//=============================================================================================
[cd17862]185// Kernel Signal Tools
[c81ebf9]186//=============================================================================================
[231b18f]187// In a user-level threading system, there are a handful of thread-local variables where this problem occurs on the ARM.
[54dcab1]188//
[231b18f]189// For each kernel thread running user-level threads, there is a flag variable to indicate if interrupts are
190// enabled/disabled for that kernel thread. Therefore, this variable is made thread local.
[54dcab1]191//
[231b18f]192// For example, this code fragment sets the state of the "interrupt" variable in thread-local memory.
[54dcab1]193//
[231b18f]194// _Thread_local volatile int interrupts;
195// int main() {
196//     interrupts = 0; // disable interrupts }
[54dcab1]197//
[231b18f]198// which generates the following code on the ARM
[54dcab1]199//
[231b18f]200// (gdb) disassemble main
201// Dump of assembler code for function main:
202//    0x0000000000000610 <+0>:  mrs     x1, tpidr_el0
203//    0x0000000000000614 <+4>:  mov     w0, #0x0                        // #0
204//    0x0000000000000618 <+8>:  add     x1, x1, #0x0, lsl #12
205//    0x000000000000061c <+12>: add     x1, x1, #0x10
206//    0x0000000000000620 <+16>: str     wzr, [x1]
207//    0x0000000000000624 <+20>: ret
[54dcab1]208//
[231b18f]209// The mrs moves a pointer from coprocessor register tpidr_el0 into register x1.  Register w0 is set to 0. The two adds
210// increase the TLS pointer with the displacement (offset) 0x10, which is the location in the TLS of variable
211// "interrupts".  Finally, 0 is stored into "interrupts" through the pointer in register x1 that points into the
212// TLS. Now once x1 has the pointer to the location of the TLS for kernel thread N, it can be preempted at a
213// user-level and the user thread is put on the user-level ready-queue. When the preempted thread gets to the front of
214// the user-level ready-queue it is run on kernel thread M. It now stores 0 into "interrupts" back on kernel thread N,
215// turning off interrupts on the wrong kernel thread.
[54dcab1]216//
[231b18f]217// On the x86, the following code is generated for the same code fragment.
[54dcab1]218//
[231b18f]219// (gdb) disassemble main
220// Dump of assembler code for function main:
221//    0x0000000000400420 <+0>:  movl   $0x0,%fs:0xfffffffffffffffc
222//    0x000000000040042c <+12>: xor    %eax,%eax
[54dcab1]223//    0x000000000040042e <+14>: retq
224//
[231b18f]225// and there is base-displacement addressing used to atomically reset variable "interrupts" off of the TLS pointer in
226// register "fs".
[54dcab1]227//
[231b18f]228// Hence, the ARM has base-displacement addressing for the general purpose registers, BUT not for the coprocessor
229// registers. As a result, generating the address for the write into variable "interrupts" is no longer atomic.
[54dcab1]230//
[231b18f]231// Note this problem does NOT occur when just using multiple kernel threads because the preemption ALWAYS restarts the
232// thread on the same kernel thread.
[54dcab1]233//
[231b18f]234// The obvious question is why does ARM use a coprocessor register to store the TLS pointer given that coprocessor
235// registers are second-class registers with respect to the instruction set. One possible answer is that they did not
236// want to dedicate one of the general registers to hold the TLS pointer and there was a free coprocessor register
237// available.
[c81ebf9]238
[ead174a]239//-----------------------------------------------------------------------------
240// Some assembly required
// __cfaasm_label(label, when) places a C label named `when` at the point of use and emits, at the same
// spot, a global assembler symbol named __cfaasm_<label>_<when>.  The asm statement is volatile and
// carries a "memory" clobber.  The signal-handling code further down looks these symbols up by name to
// find the address range between a `before` and an `after` marker.
241#define __cfaasm_label(label, when) when: asm volatile goto(".global __cfaasm_" #label "_" #when "\n" "__cfaasm_" #label "_" #when ":":::"memory":when)
242
[8fc652e0]243//----------
244// special case for preemption since used often
// Returns the preemption-enabled flag of the current TLS block.
// Side effect: when preemption is enabled and the current processor has a pending preemption, the
// pending flag is cleared and the caller yields (force_yield) before this function returns.
// The TLS accesses sit between the __cfaasm_check_before / __cfaasm_check_after symbols.
245bool __preemption_enabled() {
246        // create an assembler label before the TLS accesses
247        // marked as clobber all to avoid movement
[ead174a]248        __cfaasm_label(check, before);
[8fc652e0]249
250        // access tls as normal
251        bool enabled = __cfaabi_tls.preemption_state.enabled;
252
[becb85b9]253        // Check if there is a pending preemption (this_processor may be null, in which case nothing is pending)
254        processor   * proc = __cfaabi_tls.this_processor;
255        bool pending = proc ? proc->pending_preemption : false;
256        if( enabled && pending ) proc->pending_preemption = false;
257
[8fc652e0]258        // create an assembler label after the TLS accesses
259        // marked as clobber all to avoid movement
[ead174a]260        __cfaasm_label(check, after);
[becb85b9]261
262        // If we can preempt and there is a pending one
263        // this is a good time to yield
264        if( enabled && pending ) {
265                force_yield( __POLL_PREEMPTION );
266        }
[8fc652e0]267        return enabled;
268}
269
// Address range of a code region delimited by a pair of assembler symbols.
// __cfaasm_in treats both bounds as inclusive.
[82a2fed]270struct asm_region {
271        void * before;  // lowest address of the region
272        void * after;   // highest address of the region
273};
274
// True when ip lies inside region, both bounds included.
static inline bool __cfaasm_in( void * ip, struct asm_region & region ) {
	if( ip < region.before ) return false;
	return ip <= region.after;
}
278
279
[8fc652e0]280//----------
281// Get data from the TLS block
// Reads one uintptr_t located `offset` bytes past the start of __cfaabi_tls and returns it.
// The read sits between the __cfaasm_get_before / __cfaasm_get_after symbols.
[82a2fed]282// struct asm_region __cfaasm_get;
[8fc652e0]283uintptr_t __cfatls_get( unsigned long int offset ) __attribute__((__noinline__)); //no inline to avoid problems
284uintptr_t __cfatls_get( unsigned long int offset ) {
285        // create an assembler label before the TLS access
286        // marked as clobber all to avoid movement
[ead174a]287        __cfaasm_label(get, before);
[8fc652e0]288
289        // access tls as normal (except for pointer arithmetic)
290        uintptr_t val = *(uintptr_t*)((uintptr_t)&__cfaabi_tls + offset);
291
292        // create an assembler label after the TLS access
293        // marked as clobber all to avoid movement
[ead174a]294        __cfaasm_label(get, after);
[becb85b9]295
296        // This is used everywhere, to avoid cost, we DO NOT poll pending preemption
[8fc652e0]297        return val;
298}
299
// C-linkage entry points that turn preemption off and on for the current TLS block.
// preemption_state.disable_count tracks the nesting depth; preemption_state.enabled is only set back
// to true when the outermost enable_interrupts() is reached.
[82ff5845]300extern "C" {
[969b3fe]301        // Disable interrupts by incrementing the counter
[82ff5845]302        void disable_interrupts() {
[8fc652e0]303                // create an assembler label before the TLS accesses
304                // marked as clobber all to avoid movement
[ead174a]305                __cfaasm_label(dsable, before);
[8fc652e0]306
307                with( __cfaabi_tls.preemption_state ) {
[1f81d61]308                        #if GCC_VERSION > 50000
[13073be]309                        static_assert(__atomic_always_lock_free(sizeof(enabled), &enabled), "Must be lock-free");
[1f81d61]310                        #endif
[13073be]311
312                        // Set enabled flag to false
313                        // should be atomic to avoid preemption in the middle of the operation.
314                        // use memory order RELAXED since there is no inter-thread on this variable requirements
315                        __atomic_store_n(&enabled, false, __ATOMIC_RELAXED);
316
317                        // Signal the compiler that a fence is needed but only for signal handlers
318                        __atomic_signal_fence(__ATOMIC_ACQUIRE);
319
                        // Bump the nesting depth (done after the flag is cleared)
[de6319f]320                        __attribute__((unused)) unsigned short new_val = disable_count + 1;
321                        disable_count = new_val;
322                        verify( new_val < 65_000u );              // If this triggers someone is disabling interrupts without enabling them
323                }
[8fc652e0]324
325                // create an assembler label after the TLS accesses
326                // marked as clobber all to avoid movement
[ead174a]327                __cfaasm_label(dsable, after);
328
[82ff5845]329        }
330
[969b3fe]331        // Enable interrupts by decrementing the counter
[c7a900a]332        // If counter reaches 0, execute any pending __cfactx_switch
        // poll : when true, a preemption that was deferred while interrupts were disabled is taken now
        //        (requires this_processor to be non-null)
[a3821fa]333        void enable_interrupts( bool poll ) {
[ead174a]334                // Cache the processor now since interrupts can start happening after the atomic store
335                processor   * proc = __cfaabi_tls.this_processor;
[a3821fa]336                /* paranoid */ verify( !poll || proc );
[969b3fe]337
[8fc652e0]338                with( __cfaabi_tls.preemption_state ){
[de6319f]339                        unsigned short prev = disable_count;
340                        disable_count -= 1;
[ead174a]341
342                        // If this triggers, someone enabled interrupts that were already enabled
343                        /* paranoid */ verify( prev != 0u );
[de6319f]344
345                        // Check if we need to preempt the thread because an interrupt was missed
                        // prev == 1 means this call undoes the outermost disable_interrupts()
346                        if( prev == 1 ) {
[1f81d61]347                                #if GCC_VERSION > 50000
[ead174a]348                                        static_assert(__atomic_always_lock_free(sizeof(enabled), &enabled), "Must be lock-free");
[1f81d61]349                                #endif
[13073be]350
351                                // Set enabled flag to true
352                                // should be atomic to avoid preemption in the middle of the operation.
353                                // use memory order RELAXED since there is no inter-thread on this variable requirements
354                                __atomic_store_n(&enabled, true, __ATOMIC_RELAXED);
355
356                                // Signal the compiler that a fence is needed but only for signal handlers
357                                __atomic_signal_fence(__ATOMIC_RELEASE);
                                // Take the preemption that was marked pending while interrupts were off
[a3821fa]358                                if( poll && proc->pending_preemption ) {
[de6319f]359                                        proc->pending_preemption = false;
[3381ed7]360                                        force_yield( __POLL_PREEMPTION );
[de6319f]361                                }
[d0a045c7]362                        }
[82ff5845]363                }
[969b3fe]364        }
[82ff5845]365}
366
//-----------------------------------------------------------------------------
// Kernel Signal Debug
// Sanity check of the preemption set-up for the calling kernel thread.  Aborts unless:
//  - preemption is currently enabled,
//  - SIGUSR1 and SIGTERM are not blocked,
//  - SIGALRM is blocked.
void __cfaabi_check_preemption() {
	if( !__preemption_enabled() ) { abort("Preemption should be ready"); }

	// No new set is supplied, so this call only retrieves the current signal mask
	sigset_t blocked;
	int rc = pthread_sigmask(0, ( const sigset_t * ) 0p, &blocked);  // workaround trac#208: cast should be unnecessary
	if(rc != 0) { abort("ERROR sigprocmask returned %d", rc); }

	// SIGUSR1 must be deliverable
	rc = sigismember(&blocked, SIGUSR1);
	if(rc <  0) { abort("ERROR sigismember returned %d", rc); }
	else if(rc == 1) { abort("ERROR SIGUSR1 is disabled"); }

	// SIGALRM must be blocked
	rc = sigismember(&blocked, SIGALRM);
	if(rc <  0) { abort("ERROR sigismember returned %d", rc); }
	else if(rc == 0) { abort("ERROR SIGALRM is enabled"); }

	// SIGTERM must be deliverable
	rc = sigismember(&blocked, SIGTERM);
	if(rc <  0) { abort("ERROR sigismember returned %d", rc); }
	else if(rc == 1) { abort("ERROR SIGTERM is disabled"); }
}
390
#ifdef __CFA_WITH_VERIFY__
// Verification helper: reports "in kernel" exactly when preemption is currently disabled.
// Goes through __preemption_enabled(), so a pending preemption may be taken as a side effect.
bool __cfaabi_dbg_in_kernel() {
	const bool preemptible = __preemption_enabled();
	return !preemptible;
}
#endif
396
[ead174a]397#undef __cfaasm_label
398
[adf34b3]399//-----------------------------------------------------------------------------
400// Signal handling
401
// pthread_sigmask wrapper : unblock a single signal for the calling thread
// Aborts if the signal mask cannot be changed.
static inline void signal_unblock( int sig ) {
	sigset_t mask;
	sigemptyset( &mask );
	sigaddset( &mask, sig );

	// pthread_sigmask returns 0 on success and an error number on failure; it never returns -1,
	// so the result has to be compared against 0 for a failure to be noticed.
	int ret = pthread_sigmask( SIG_UNBLOCK, &mask, 0p );
	if ( ret != 0 ) {
		abort( "internal error, pthread_sigmask returned %d", ret );
	}
}
412
// pthread_sigmask wrapper : block a single signal for the calling thread
// Aborts if the signal mask cannot be changed.
static inline void signal_block( int sig ) {
	sigset_t mask;
	sigemptyset( &mask );
	sigaddset( &mask, sig );

	// pthread_sigmask returns 0 on success and an error number on failure; it never returns -1,
	// so the result has to be compared against 0 for a failure to be noticed.
	int ret = pthread_sigmask( SIG_BLOCK, &mask, 0p );
	if ( ret != 0 ) {
		abort( "internal error, pthread_sigmask returned %d", ret );
	}
}
[47ecf2b]423
// pthread_sigqueue wrapper : ask a processor to preempt
// Queues SIGUSR1 on the processor's kernel thread with PREEMPT_NORMAL as the signal value.
static void preempt( processor * this ) {
	sigval_t payload = { PREEMPT_NORMAL };
	pthread_sigqueue( this->kernel_thread, SIGUSR1, payload );
}
429
[969b3fe]430// Timeout handler for User alarms (called from tick_preemption): unparks the thread attached to the alarm
[e84ab3d]431static void timeout( thread$ * this ) {
[e873838]432        unpark( this );
[cd17862]433}
434
// Block SIGUSR1 at the signal-mask level for the calling thread.
// Before doing so, checks that the mask is in the expected state (SIGUSR1 unblocked, SIGALRM blocked)
// and aborts otherwise.
void __disable_interrupts_hard() {
	// No new set is supplied, so this call only retrieves the current signal mask
	sigset_t blocked;
	int rc = pthread_sigmask(0, ( const sigset_t * ) 0p, &blocked);  // workaround trac#208: cast should be unnecessary
	if(rc != 0) { abort("ERROR sigprocmask returned %d", rc); }

	rc = sigismember(&blocked, SIGUSR1);
	if(rc <  0) { abort("ERROR sigismember returned %d", rc); }
	else if(rc == 1) { abort("ERROR SIGUSR1 is disabled"); }

	rc = sigismember(&blocked, SIGALRM);
	if(rc <  0) { abort("ERROR sigismember returned %d", rc); }
	else if(rc == 0) { abort("ERROR SIGALRM is enabled"); }

	signal_block( SIGUSR1 );
}
451
// Unblock SIGUSR1 at the signal-mask level for the calling thread.
// Afterwards, checks that the mask is in the expected state (SIGUSR1 unblocked, SIGALRM blocked)
// and aborts otherwise.
void __enable_interrupts_hard() {
	signal_unblock( SIGUSR1 );

	// No new set is supplied, so this call only retrieves the current signal mask
	sigset_t blocked;
	int rc = pthread_sigmask(0, ( const sigset_t * ) 0p, &blocked);  // workaround trac#208: cast should be unnecessary
	if(rc != 0) { abort("ERROR sigprocmask returned %d", rc); }

	rc = sigismember(&blocked, SIGUSR1);
	if(rc <  0) { abort("ERROR sigismember returned %d", rc); }
	else if(rc == 1) { abort("ERROR SIGUSR1 is disabled"); }

	rc = sigismember(&blocked, SIGALRM);
	if(rc <  0) { abort("ERROR sigismember returned %d", rc); }
	else if(rc == 0) { abort("ERROR SIGALRM is enabled"); }
}
468
//-----------------------------------------------------------------------------
// Some assembly required
//
// One-argument form of __cfaasm_label: `__cfaasm_label( X )` declares a local `struct asm_region X`
// whose before/after fields are loaded with the addresses of the global assembler symbols
// __cfaasm_X_before and __cfaasm_X_after.  How a symbol address is materialised depends on the
// architecture and on whether the code is position independent:
//   RELOC_PRELUDE  : instructions needed before the loads (i386 PIC only: puts the GOT address in %eax)
//   RELOC_PREFIX   : text placed in front of the symbol name
//   RELOC_SUFFIX   : text placed after the symbol name
//   RELOC_CLOBBERS : clobber section of the asm statement (i386 only)
#if defined( __i386 )
	#ifdef __PIC__
		#define RELOC_PRELUDE( label ) \
			"calll   .Lcfaasm_prelude_" #label "$pb\n\t" \
			".Lcfaasm_prelude_" #label "$pb:\n\t" \
			"popl    %%eax\n\t" \
			".Lcfaasm_prelude_" #label "_end:\n\t" \
			"addl    $_GLOBAL_OFFSET_TABLE_+(.Lcfaasm_prelude_" #label "_end-.Lcfaasm_prelude_" #label "$pb), %%eax\n\t"
		#define RELOC_PREFIX ""
		#define RELOC_SUFFIX "@GOT(%%eax)"
		// The prelude overwrites %eax and both loads use it as base register: declare it clobbered so the
		// compiler neither keeps a live value in it nor assigns it to one of the output operands.
		#define RELOC_CLOBBERS : : "eax"
	#else
		// Absolute addressing needs no set-up code; the macro must still exist because the asm template
		// below always expands it.
		#define RELOC_PRELUDE( label )
		#define RELOC_PREFIX "$"
		#define RELOC_SUFFIX ""
		#define RELOC_CLOBBERS
	#endif
	#define __cfaasm_label( label ) struct asm_region label = \
		({ \
			struct asm_region region; \
			asm( \
				RELOC_PRELUDE( label ) \
				"movl " RELOC_PREFIX "__cfaasm_" #label "_before" RELOC_SUFFIX ", %[vb]\n\t" \
				"movl " RELOC_PREFIX "__cfaasm_" #label "_after"  RELOC_SUFFIX ", %[va]\n\t" \
				 : [vb]"=r"(region.before), [va]"=r"(region.after) \
				 RELOC_CLOBBERS \
			); \
			region; \
		});
#elif defined( __x86_64 )
	#ifdef __PIC__
		#define RELOC_PREFIX ""
		#define RELOC_SUFFIX "@GOTPCREL(%%rip)"
	#else
		#define RELOC_PREFIX "$"
		#define RELOC_SUFFIX ""
	#endif
	#define __cfaasm_label( label ) struct asm_region label = \
		({ \
			struct asm_region region; \
			asm( \
				"movq " RELOC_PREFIX "__cfaasm_" #label "_before" RELOC_SUFFIX ", %[vb]\n\t" \
				"movq " RELOC_PREFIX "__cfaasm_" #label "_after"  RELOC_SUFFIX ", %[va]\n\t" \
				 : [vb]"=r"(region.before), [va]"=r"(region.after) \
			); \
			region; \
		});
#elif defined( __aarch64__ )
	#ifdef __PIC__
		// Note that this works only for gcc
		#define __cfaasm_label( label ) struct asm_region label = \
		({ \
			struct asm_region region; \
			asm( \
				"adrp %[vb], _GLOBAL_OFFSET_TABLE_"                              "\n\t" \
				"ldr  %[vb], [%[vb], #:gotpage_lo15:__cfaasm_" #label "_before]" "\n\t" \
				"adrp %[va], _GLOBAL_OFFSET_TABLE_"                              "\n\t" \
				"ldr  %[va], [%[va], #:gotpage_lo15:__cfaasm_" #label "_after]"  "\n\t" \
				 : [vb]"=r"(region.before), [va]"=r"(region.after) \
			); \
			region; \
		});
	#else
		#error this is not the right thing to do
		/*
		#define __cfaasm_label( label ) struct asm_region label = \
		({ \
			struct asm_region region; \
			asm( \
				"adrp %[vb], __cfaasm_" #label "_before"              "\n\t" \
				"add  %[vb], %[vb], :lo12:__cfaasm_" #label "_before" "\n\t" \
				"adrp %[va], :got:__cfaasm_" #label "_after"          "\n\t" \
				"add  %[va], %[va], :lo12:__cfaasm_" #label "_after"  "\n\t" \
				 : [vb]"=r"(region.before), [va]"=r"(region.after) \
			); \
			region; \
		});
		*/
	#endif
#else
	#error unknown hardware architecture
#endif
549
// KERNEL ONLY
// Decide whether a __cfactx_switch signal handler may preempt right now or has to defer.
// ip is the instruction pointer at which the signal interrupted execution.
// If true  : preemption is safe
// If false : preemption is unsafe and marked as pending
static inline bool preemption_ready( void * ip ) {
	// Address ranges of the code sections that must not be interrupted
	__cfaasm_label( get    );
	__cfaasm_label( check  );
	__cfaasm_label( dsable );
	// __cfaasm_label( debug  );

	// Preemption has to be deferred when the interrupted instruction lies in one of the protected
	// sections, when preemption is disabled, or when a preemption is already in progress.
	// The conditions are evaluated left to right and stop at the first one that holds.
	const bool unsafe =
		   __cfaasm_in( ip, get    )
		|| __cfaasm_in( ip, check  )
		|| __cfaasm_in( ip, dsable )
		// || __cfaasm_in( ip, debug  )
		|| !__cfaabi_tls.preemption_state.enabled
		|| __cfaabi_tls.preemption_state.in_progress;

	// Adjust the pending flag accordingly
	__cfaabi_tls.this_processor->pending_preemption = unsafe;
	return !unsafe;
}
575
[cd17862]576//=============================================================================================
577// Kernel Signal Startup/Shutdown logic
578//=============================================================================================
579
[969b3fe]580// Startup routine to activate preemption
581// Called from kernel_startup
// Leaves preemption disabled for the caller (disable_count == 1), installs the SIGUSR1 and SIGALRM
// handlers, blocks SIGALRM in the calling thread and starts the alarm thread.
[e660761]582void __kernel_alarm_startup() {
[169d944]583        __cfaabi_dbg_print_safe( "Kernel : Starting preemption\n" );
[969b3fe]584
585        // Start with preemption disabled until ready
[8fc652e0]586        __cfaabi_tls.preemption_state.enabled = false;
587        __cfaabi_tls.preemption_state.disable_count = 1;
[969b3fe]588
589        // Initialize the event kernel: point the public handle at the static storage, then construct in place
590        event_kernel = (event_kernel_t *)&storage_event_kernel;
[9236060]591        (*event_kernel){};
[969b3fe]592
593        // Setup proper signal handlers
[6047b00]594        __cfaabi_sigaction( SIGUSR1, sigHandler_ctxSwitch, SA_SIGINFO ); // __cfactx_switch handler
595        __cfaabi_sigaction( SIGALRM, sigHandler_alarm    , SA_SIGINFO ); // debug handler
[cd17862]596
        // Block SIGALRM in this thread before the alarm thread is created
597        signal_block( SIGALRM );
598
        // Start the alarm thread running alarm_loop; keep the returned stack so shutdown can hand it to __destroy_pthread
[8c50aed]599        alarm_stack = __create_pthread( &alarm_thread, alarm_loop, 0p );
[cd17862]600}
601
// Shutdown routine to deactivate preemption
// Called from kernel_shutdown
// Blocks every signal in the calling thread, notifies the alarm thread through SIGALRM and then
// destroys the alarm thread together with its stack.
void __kernel_alarm_shutdown() {
	__cfaabi_dbg_print_safe( "Kernel : Preemption stopping\n" );

	// Block all signals since we are already shutting down.
	// The alarm thread still exists at this point, so the process is multi-threaded: use pthread_sigmask,
	// the behaviour of sigprocmask is unspecified in a multi-threaded process.
	sigset_t mask;
	sigfillset( &mask );
	pthread_sigmask( SIG_BLOCK, &mask, 0p );

	// Notify the alarm thread of the shutdown
	sigval val;
	val.sival_int = 0;
	pthread_sigqueue( alarm_thread, SIGALRM, val );

	// Wait for the preemption thread to finish
	// NOTE(review): presumably __destroy_pthread joins the thread before releasing its stack - confirm

	__destroy_pthread( alarm_thread, alarm_stack, 0p );

	// Preemption is now fully stopped

	__cfaabi_dbg_print_safe( "Kernel : Preemption stopped\n" );
}
625
[92bfda0]626// Prevent preemption since we are about to start terminating things
// Done by blocking SIGUSR1 (the preemption signal) in the calling thread; nothing here unblocks it again.
627void __kernel_abort_lock(void) {
628        signal_block( SIGUSR1 );
629}
630
// Raii ctor/dtor for the preemption_scope
// Used by thread to control when they want to receive preemption signals
// The constructor builds the scope's alarm for proc, attaches it to the processor and starts
// preemption at the rate configured on the processor's cluster.
void ?{}( preemption_scope & this, processor * proc ) {
	(this.alarm){ proc, 0`s, 0`s };
	this.proc = proc;

	// Make the processor point at the alarm owned by this scope
	proc->preemption_alarm = &this.alarm;

	update_preemption( proc, proc->cltr->preemption_rate );
}
640
// Destructor of the preemption_scope: stop preemption for the processor of this scope.
[242a902]641void ^?{}( preemption_scope & this ) {
        // Interrupts are disabled here and not re-enabled by this destructor
[cd17862]642        disable_interrupts();
643
        // A zero duration unregisters the processor's preemption alarm if it is set
[2a84d06d]644        update_preemption( this.proc, 0`s );
[cd17862]645}
646
647//=============================================================================================
648// Kernel Signal Handlers
649//=============================================================================================
// Debug builds only: instruction pointer seen by the most recent context-switch signal
__cfaabi_dbg_debug_do( static thread_local void * last_interrupt = 0; )

// Context switch signal handler
// Receives SIGUSR1 signal and causes the current thread to yield
//
// Steps, in order:
//   1. ignore the signal if this kernel thread has no processor yet
//   2. validate the value carried by the signal
//   3. give up (and count a roll-forward) if the interrupted location is not safe to preempt
//   4. restore the interrupted context's signal mask, then force a yield
static void sigHandler_ctxSwitch( __CFA_SIGPARMS__ ) {
	// Instruction pointer of the interrupted code, taken from the signal context
	void * ip = (void *)(cxt->uc_mcontext.CFA_REG_IP);
	__cfaabi_dbg_debug_do( last_interrupt = ip; )

	// SKULLDUGGERY: if a thread creates a processor and the immediately deletes it,
	// the interrupt that is supposed to force the kernel thread to preempt might arrive
	// before the kernel thread has even started running. When that happens, an interrupt
	// with a null 'this_processor' will be caught, just ignore it.
	if(! __cfaabi_tls.this_processor ) return;

	// 'choose' does not fall through: each case ends at the next label
	choose(sfp->si_value.sival_int) {
		case PREEMPT_NORMAL   : ;// Normal case, nothing to do here
		case PREEMPT_TERMINATE: verify( __atomic_load_n( &__cfaabi_tls.this_processor->do_terminate, __ATOMIC_SEQ_CST ) );
		default:
			abort( "internal error, signal value is %d", sfp->si_value.sival_int );
	}

	// Check if it is safe to preempt here
	if( !preemption_ready( ip ) ) {
		#if !defined(__CFA_NO_STATISTICS__)
			__cfaabi_tls.this_stats->ready.threads.preempt.rllfwd++;
		#endif
		return;
	}

	__cfaabi_dbg_print_buffer_decl( " KERNEL: preempting core %p (%p @ %p).\n", __cfaabi_tls.this_processor, __cfaabi_tls.this_thread, (void *)(cxt->uc_mcontext.CFA_REG_IP) );

	// Sync flag : prevent recursive calls to the signal handler
	__cfaabi_tls.preemption_state.in_progress = true;

	// Clear sighandler mask before context switching.
	#if GCC_VERSION > 50000
	static_assert( sizeof( sigset_t ) == sizeof( cxt->uc_sigmask ), "Expected cxt->uc_sigmask to be of sigset_t" );
	#endif
	// pthread_sigmask reports failure by returning a non-zero error number;
	// it never returns -1 and does not set errno, so compare against 0.
	int mask_err = pthread_sigmask( SIG_SETMASK, (sigset_t *)&(cxt->uc_sigmask), 0p );
	if ( mask_err != 0 ) {
		abort( "internal error, pthread_sigmask returned %d", mask_err );
	}

	// Clear the in progress flag
	__cfaabi_tls.preemption_state.in_progress = false;

	// Preemption can occur here

	#if !defined(__CFA_NO_STATISTICS__)
		__cfaabi_tls.this_stats->ready.threads.preempt.yield++;
	#endif

	force_yield( __ALARM_PREEMPTION ); // Do the actual __cfactx_switch
}
703
// Handler for SIGALRM.
// The alarm thread consumes SIGALRM synchronously through sigwaitinfo, so this handler
// running at all is treated as a fatal error.
static void sigHandler_alarm( __CFA_SIGPARMS__ ) {
	abort("SIGALRM should never reach the signal handler");
}
707
// Main of the alarm thread
// Waits on SIGALRM and send SIGUSR1 to whom ever needs it
//
//   args    : unused
//   returns : always the null pointer, once a shutdown request has been received
//
// The loop only ends when another thread queues a SIGALRM carrying the value 0.
static void * alarm_loop( __attribute__((unused)) void * args ) {
	unsigned id = register_proc_id();

	// Block every signal on this thread so SIGALRM is only ever consumed by sigwaitinfo below
	sigset_t mask;
	sigfillset(&mask);
	// pthread_sigmask reports failure by returning a non-zero error number;
	// it never returns -1 and does not set errno, so compare against 0.
	int mask_err = pthread_sigmask( SIG_BLOCK, &mask, 0p );
	if ( mask_err != 0 ) {
		abort( "internal error, pthread_sigmask returned %d", mask_err );
	}

	// From here on 'mask' is the set waited on: SIGALRM only
	sigemptyset( &mask );
	sigaddset( &mask, SIGALRM );

	// Main loop
	while( true ) {
		// Wait for a sigalrm
		siginfo_t info;
		int sig = sigwaitinfo( &mask, &info );

		__cfadbg_print_buffer_decl ( preemption, " KERNEL: sigwaitinfo returned %d, c: %d, v: %d\n", sig, info.si_code, info.si_value.sival_int );
		__cfadbg_print_buffer_local( preemption, " KERNEL: SI_QUEUE %d, SI_TIMER %d, SI_KERNEL %d\n", SI_QUEUE, SI_TIMER, SI_KERNEL );

		if( sig < 0 ) {
			//Error!
			int err = errno;
			switch( err ) {
				case EAGAIN :
				case EINTR :
					{__cfadbg_print_buffer_local( preemption, " KERNEL: Spurious wakeup %d.\n", err );}
					continue;
				case EINVAL :
					abort( "Timeout was invalid." );
				default:
					abort( "Unhandled error %d", err);
			}
		}

		// If another signal arrived something went wrong
		assertf(sig == SIGALRM, "Kernel Internal Error, sigwait: Unexpected signal %d (%d : %d)\n", sig, info.si_code, info.si_value.sival_int);

		// Switch on the code (a.k.a. the sender) to decide how to react
		switch( info.si_code )
		{
		// Signal was not sent by the kernel but by an other thread
		case SI_QUEUE:
			// other threads may signal the alarm thread to shut it down
			// or to manually cause the preemption tick
			// use info.si_value and handle the case here
			switch( info.si_value.sival_int ) {
			case 0:
				// Shutdown request
				goto EXIT;
			default:
				abort( "SI_QUEUE with val %d", info.si_value.sival_int);
			}
			// fallthrough
			// (both branches of the inner switch leave this point -- goto or abort -- so
			// the fallthrough only matters if a non-exiting value is added later)
		// Timers can apparently be marked as sent for the kernel
		// In either case, tick preemption
		case SI_TIMER:
		case SI_KERNEL:
			// __cfaabi_dbg_print_safe( "Kernel : Preemption thread tick\n" );
			lock( event_kernel->lock __cfaabi_dbg_ctx2 );
			tick_preemption();
			unlock( event_kernel->lock );
			break;
		}
	}

EXIT:
	__cfaabi_dbg_print_safe( "Kernel : Preemption thread stopping\n" );
	unregister_proc_id(id);

	return 0p;
}
783
[6b0b624]784// Local Variables: //
785// mode: c //
786// tab-width: 4 //
787// End: //
Note: See TracBrowser for help on using the repository browser.