Changes in / [54dcab1:231b18f]
Files: 15 edited
Legend: unmodified lines appear as diff context; added lines are prefixed with "+", removed lines with "-".
benchmark/readyQ/cycle.cfa
--- r54dcab1
+++ r231b18f
@@ -84,5 +84,5 @@
 	}
 
-	printf("Duration (ms) : %'ld\n", (end - start)`dms);
+	printf("Duration (ms) : %'ld\n", (end - start)`ms);
 	printf("Number of processors : %'d\n", nprocs);
 	printf("Number of threads : %'d\n", tthreads);
@@ -90,10 +90,10 @@
 	printf("Total Operations(ops): %'15llu\n", global_counter);
 	printf("Total blocks : %'15llu\n", global_blocks);
-	printf("Ops per second : %'18.2lf\n", ((double)global_counter) / (end - start)`ds);
-	printf("ns per ops : %'18.2lf\n", (end - start)`dns / global_counter);
+	printf("Ops per second : %'18.2lf\n", ((double)global_counter) / (end - start)`s);
+	printf("ns per ops : %'18.2lf\n", ((double)(end - start)`ns) / global_counter);
 	printf("Ops per threads : %'15llu\n", global_counter / tthreads);
 	printf("Ops per procs : %'15llu\n", global_counter / nprocs);
-	printf("Ops/sec/procs : %'18.2lf\n", (((double)global_counter) / nprocs) / (end - start)`ds);
-	printf("ns per ops/procs : %'18.2lf\n", (end - start)`dns / (global_counter / nprocs));
+	printf("Ops/sec/procs : %'18.2lf\n", (((double)global_counter) / nprocs) / (end - start)`s);
+	printf("ns per ops/procs : %'18.2lf\n", ((double)(end - start)`ns) / (global_counter / nprocs));
 	fflush(stdout);
 }
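Beyond swapping the CFA duration-literal suffixes (`dms/`dns versus `ms/`ns), the hunk above adds (double) casts before dividing. A minimal sketch of why that matters, in plain C rather than CFA, with hypothetical values: integer division truncates the quotient, so a fast per-operation cost can silently round down.

    #include <stdint.h>
    #include <stdio.h>

    // Sketch only: shows the truncation the benchmark's (double) cast avoids.
    int main(void) {
        uint64_t elapsed_ns = 1750000000;   // hypothetical 1.75 s run
        uint64_t ops        = 1000000000;   // hypothetical one billion operations

        // Integer division: 1.75 truncates to 1, under-reporting by 43%.
        printf("ns per op (integer): %llu\n",
               (unsigned long long)(elapsed_ns / ops));

        // Floating-point division, as in the updated printf arguments.
        printf("ns per op (double) : %.2f\n", (double)elapsed_ns / ops);
        return 0;
    }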
benchmark/readyQ/cycle.go
--- r54dcab1
+++ r231b18f
@@ -72,5 +72,5 @@
 	p.Printf("Cycle size (# thrds) : %d\n", ring_size);
 	p.Printf("Total Operations(ops): %15d\n", global_counter)
-	p.Printf("Ops per second : %18.2f\n", float64(global_counter) / delta.Seconds())
+	p.Printf("Yields per second : %18.2f\n", float64(global_counter) / delta.Seconds())
 	p.Printf("ns per ops : %18.2f\n", float64(delta.Nanoseconds()) / float64(global_counter))
 	p.Printf("Ops per threads : %15d\n", global_counter / uint64(tthreads))
benchmark/readyQ/rq_bench.hfa
--- r54dcab1
+++ r231b18f
@@ -88,5 +88,5 @@
 }
 
-struct __attribute__((aligned(128))) bench_sem {
+struct bench_sem {
 	struct $thread * volatile ptr;
 };
benchmark/readyQ/rq_bench.hpp
--- r54dcab1
+++ r231b18f
@@ -75,5 +75,5 @@
 }
 
-class __attribute__((aligned(128))) bench_sem {
+class bench_sem {
 	Fibre * volatile ptr = nullptr;
 public:
libcfa/src/concurrency/io.cfa
--- r54dcab1
+++ r231b18f
@@ -76,5 +76,5 @@
 
 static inline bool next( __leaderlock_t & this ) {
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	struct $thread * nextt;
 	for() {
@@ -168,5 +168,5 @@
 	// This is NOT thread-safe
 	static [int, bool] __drain_io( & struct __io_data ring ) {
-		/* paranoid */ verify( ! __preemption_enabled() );
+		/* paranoid */ verify( !kernelTLS.preemption_state.enabled );
 
 		unsigned to_submit = 0;
@@ -404,5 +404,5 @@
 			return;
 		}
-		/* paranoid */ verify( ! __preemption_enabled() );
+		/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 		__STATS__( true,
 			io.submit_q.leader += 1;
@@ -442,5 +442,5 @@
 
 	#if defined(LEADER_LOCK)
-		/* paranoid */ verify( ! __preemption_enabled() );
+		/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 		next(ring.submit_q.submit_lock);
 	#else
libcfa/src/concurrency/io/setup.cfa
--- r54dcab1
+++ r231b18f
@@ -149,5 +149,5 @@
 	id.full_proc = false;
 	id.id = doregister(&id);
-	__cfaabi_tls.this_proc_id = &id;
+	kernelTLS.this_proc_id = &id;
 	__cfaabi_dbg_print_safe( "Kernel : IO poller thread starting\n" );
 
@@ -179,5 +179,5 @@
 	__cfadbg_print_safe(io_core, "Kernel I/O : Unparking io poller %p\n", io_ctx);
 	#if !defined( __CFA_NO_STATISTICS__ )
-		__cfaabi_tls.this_stats = io_ctx->self.curr_cluster->stats;
+		kernelTLS.this_stats = io_ctx->self.curr_cluster->stats;
 	#endif
 	post( io_ctx->sem );
libcfa/src/concurrency/kernel.cfa
--- r54dcab1
+++ r231b18f
@@ -122,6 +122,6 @@
 	// Because of a bug, we couldn't initialized the seed on construction
 	// Do it here
-	__cfaabi_tls.rand_seed ^= rdtscl();
-	__cfaabi_tls.ready_rng.fwd_seed = 25214903917_l64u * (rdtscl() ^ (uintptr_t)&runner);
+	kernelTLS.rand_seed ^= rdtscl();
+	kernelTLS.ready_rng.fwd_seed = 25214903917_l64u * (rdtscl() ^ (uintptr_t)&runner);
 	__tls_rand_advance_bck();
 
@@ -217,5 +217,5 @@
 		// and it make sense for it to be set in all other cases except here
 		// fake it
-		__cfaabi_tls.this_thread = mainThread;
+		kernelTLS.this_thread = mainThread;
 	}
 
@@ -230,5 +230,5 @@
 // from the processor coroutine to the target thread
 static void __run_thread(processor * this, $thread * thrd_dst) {
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	/* paranoid */ verifyf( thrd_dst->state == Ready || thrd_dst->preempted != __NO_PREEMPTION, "state : %d, preempted %d\n", thrd_dst->state, thrd_dst->preempted);
 	/* paranoid */ verifyf( thrd_dst->link.next == 0p, "Expected null got %p", thrd_dst->link.next );
@@ -247,8 +247,8 @@
 
 	// Update global state
-	kernelTLS().this_thread = thrd_dst;
-
-	/* paranoid */ verify( ! __preemption_enabled() );
-	/* paranoid */ verify( kernelTLS().this_thread == thrd_dst );
+	kernelTLS.this_thread = thrd_dst;
+
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
+	/* paranoid */ verify( kernelTLS.this_thread == thrd_dst );
 	/* paranoid */ verify( thrd_dst->context.SP );
 	/* paranoid */ verify( thrd_dst->state != Halted );
@@ -267,9 +267,9 @@
 	/* paranoid */ verifyf( ((uintptr_t)thrd_dst->context.SP) < ((uintptr_t)__get_stack(thrd_dst->curr_cor)->base ), "ERROR : Destination $thread %p has been corrupted.\n StackPointer too small.\n", thrd_dst );
 	/* paranoid */ verify( thrd_dst->context.SP );
-	/* paranoid */ verify( kernelTLS().this_thread == thrd_dst );
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( kernelTLS.this_thread == thrd_dst );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 
 	// Reset global state
-	kernelTLS().this_thread = 0p;
+	kernelTLS.this_thread = 0p;
 
 	// We just finished running a thread, there are a few things that could have happened.
@@ -315,15 +315,15 @@
 	proc_cor->state = Active;
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 }
 
 // KERNEL_ONLY
 void returnToKernel() {
-	/* paranoid */ verify( ! __preemption_enabled() );
-	$coroutine * proc_cor = get_coroutine(kernelTLS().this_processor->runner);
-	$thread * thrd_src = kernelTLS().this_thread;
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
+	$coroutine * proc_cor = get_coroutine(kernelTLS.this_processor->runner);
+	$thread * thrd_src = kernelTLS.this_thread;
 
 	#if !defined(__CFA_NO_STATISTICS__)
-		struct processor * last_proc = kernelTLS().this_processor;
+		struct processor * last_proc = kernelTLS.this_processor;
 	#endif
 
@@ -345,10 +345,10 @@
 
 	#if !defined(__CFA_NO_STATISTICS__)
-		if(last_proc != kernelTLS().this_processor) {
+		if(last_proc != kernelTLS.this_processor) {
 			__tls_stats()->ready.threads.migration++;
 		}
 	#endif
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	/* paranoid */ verifyf( ((uintptr_t)thrd_src->context.SP) < ((uintptr_t)__get_stack(thrd_src->curr_cor)->base ), "ERROR : Returning $thread %p has been corrupted.\n StackPointer too small.\n", thrd_src );
 	/* paranoid */ verifyf( ((uintptr_t)thrd_src->context.SP) > ((uintptr_t)__get_stack(thrd_src->curr_cor)->limit), "ERROR : Returning $thread %p has been corrupted.\n StackPointer too large.\n", thrd_src );
@@ -359,8 +359,8 @@
 // KERNEL ONLY
 void __schedule_thread( $thread * thrd ) {
-	/* paranoid */ verify( ! __preemption_enabled() );
 	/* paranoid */ verify( thrd );
 	/* paranoid */ verify( thrd->state != Halted );
-	/* paranoid */ verify( kernelTLS().this_proc_id );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
+	/* paranoid */ verify( kernelTLS.this_proc_id );
 	/* paranoid */ #if defined( __CFA_WITH_VERIFY__ )
 	/* paranoid */ if( thrd->state == Blocked || thrd->state == Start ) assertf( thrd->preempted == __NO_PREEMPTION,
@@ -380,11 +380,11 @@
 	ready_schedule_unlock();
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 }
 
 // KERNEL ONLY
 static inline $thread * __next_thread(cluster * this) with( *this ) {
-	/* paranoid */ verify( ! __preemption_enabled() );
-	/* paranoid */ verify( kernelTLS().this_proc_id );
+	/* paranoid */ verify( kernelTLS.this_proc_id );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 
 	ready_schedule_lock();
@@ -392,6 +392,6 @@
 	ready_schedule_unlock();
 
-	/* paranoid */ verify( kernelTLS().this_proc_id );
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
+	/* paranoid */ verify( kernelTLS.this_proc_id );
 	return thrd;
 }
@@ -399,6 +399,6 @@
 // KERNEL ONLY
 static inline $thread * __next_thread_slow(cluster * this) with( *this ) {
-	/* paranoid */ verify( ! __preemption_enabled() );
-	/* paranoid */ verify( kernelTLS().this_proc_id );
+	/* paranoid */ verify( kernelTLS.this_proc_id );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 
 	ready_schedule_lock();
@@ -406,6 +406,6 @@
 	ready_schedule_unlock();
 
-	/* paranoid */ verify( kernelTLS().this_proc_id );
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
+	/* paranoid */ verify( kernelTLS.this_proc_id );
 	return thrd;
 }
@@ -414,4 +414,9 @@
 	if( !thrd ) return;
 
+	/* paranoid */ verify( kernelTLS.this_proc_id );
+	bool full = kernelTLS.this_proc_id->full_proc;
+	if(full) disable_interrupts();
+
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	int old_ticket = __atomic_fetch_add(&thrd->ticket, 1, __ATOMIC_SEQ_CST);
 	switch(old_ticket) {
@@ -423,20 +428,6 @@
 			/* paranoid */ verify( thrd->state == Blocked );
 
-			{
-				/* paranoid */ verify( publicTLS_get(this_proc_id) );
-				bool full = publicTLS_get(this_proc_id)->full_proc;
-				if(full) disable_interrupts();
-
-				/* paranoid */ verify( ! __preemption_enabled() );
-
-				// Wake lost the race,
-				__schedule_thread( thrd );
-
-				/* paranoid */ verify( ! __preemption_enabled() );
-
-				if(full) enable_interrupts( __cfaabi_dbg_ctx );
-				/* paranoid */ verify( publicTLS_get(this_proc_id) );
-			}
-
+			// Wake lost the race,
+			__schedule_thread( thrd );
 			break;
 		default:
@@ -444,3 +435,7 @@
 			abort("Thread %p (%s) has mismatch park/unpark\n", thrd, thrd->self_cor.name);
 	}
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
+
+	if(full) enable_interrupts( __cfaabi_dbg_ctx );
+	/* paranoid */ verify( kernelTLS.this_proc_id );
 }
@@ -447,14 +442,14 @@
 
 void park( void ) {
-	/* paranoid */ verify( __preemption_enabled() );
+	/* paranoid */ verify( kernelTLS.preemption_state.enabled );
 	disable_interrupts();
-	/* paranoid */ verify( ! __preemption_enabled() );
-	/* paranoid */ verify( kernelTLS().this_thread->preempted == __NO_PREEMPTION );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
+	/* paranoid */ verify( kernelTLS.this_thread->preempted == __NO_PREEMPTION );
 
 	returnToKernel();
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	enable_interrupts( __cfaabi_dbg_ctx );
-	/* paranoid */ verify( __preemption_enabled() );
+	/* paranoid */ verify( kernelTLS.preemption_state.enabled );
 
 }
@@ -465,4 +460,4 @@
 // Should never return
 void __cfactx_thrd_leave() {
-	$thread * thrd = active_thread();
+	$thread * thrd = TL_GET( this_thread );
 	$monitor * this = &thrd->self_mon;
@@ -478,5 +473,5 @@
 
 	// Leave the thread
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	returnToKernel();
 	abort();
@@ -488,8 +483,8 @@
 // KERNEL ONLY
 bool force_yield( __Preemption_Reason reason ) {
-	/* paranoid */ verify( __preemption_enabled() );
+	/* paranoid */ verify( kernelTLS.preemption_state.enabled );
 	disable_interrupts();
-	/* paranoid */ verify( ! __preemption_enabled() );
-
-	$thread * thrd = kernelTLS().this_thread;
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
+
+	$thread * thrd = kernelTLS.this_thread;
 	/* paranoid */ verify(thrd->state == Active);
@@ -506,7 +501,7 @@
 	}
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	enable_interrupts_noPoll();
-	/* paranoid */ verify( __preemption_enabled() );
+	/* paranoid */ verify( kernelTLS.preemption_state.enabled );
 
 	return preempted;
@@ -518,4 +513,4 @@
 // Wake a thread from the front if there are any
 static void __wake_one(cluster * this) {
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	/* paranoid */ verify( ready_schedule_islocked() );
@@ -538,5 +533,5 @@
 
 	/* paranoid */ verify( ready_schedule_islocked() );
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 
 	return;
@@ -548,5 +543,5 @@
 
 	disable_interrupts();
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	post( this->idle );
 	enable_interrupts( __cfaabi_dbg_ctx );
@@ -554,5 +549,5 @@
 
 static void push  (__cluster_idles & this, processor & proc) {
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	lock( this );
 	this.idle++;
@@ -561,9 +556,9 @@
 	insert_first(this.list, proc);
 	unlock( this );
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 }
 
 static void remove(__cluster_idles & this, processor & proc) {
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	lock( this );
 	this.idle--;
@@ -572,4 +567,4 @@
 	remove(proc);
 	unlock( this );
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 }
@@ -616,3 +611,3 @@
 	}
 
-	return __cfaabi_tls.this_thread;
+	return kernelTLS.this_thread;
@@ -641,4 +636,4 @@
 
 int kernel_abort_lastframe( void ) __attribute__ ((__nothrow__)) {
-	return get_coroutine(kernelTLS().this_thread) == get_coroutine(mainThread) ? 4 : 2;
+	return get_coroutine(kernelTLS.this_thread) == get_coroutine(mainThread) ? 4 : 2;
 }
@@ -673,5 +668,5 @@
 	if ( count < 0 ) {
 		// queue current task
-		append( waiting, active_thread() );
+		append( waiting, kernelTLS.this_thread );
 
 		// atomically release spin lock and block
@@ -723,5 +718,5 @@
 	void __cfaabi_dbg_record_lock(__spinlock_t & this, const char prev_name[]) {
 		this.prev_name = prev_name;
-		this.prev_thrd = kernelTLS().this_thread;
+		this.prev_thrd = kernelTLS.this_thread;
 	}
 }
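The unpark() hunks above revolve around a ticket handshake: both park() and unpark() atomically increment the thread's ticket, and whichever side arrives second takes responsibility for (re)scheduling. A minimal C11 sketch of that race, with hypothetical names and the per-cycle ticket reset elided:

    #include <stdatomic.h>
    #include <stdbool.h>

    struct thread_desc {
        atomic_int ticket;              // 0 at the start of each park/unpark cycle
    };

    // Called by the thread about to block.
    // Returns true if it must actually sleep (unpark has not happened yet).
    bool park_must_sleep(struct thread_desc *t) {
        return atomic_fetch_add(&t->ticket, 1) == 0;
    }

    // Called by the waker.
    // Returns true if "wake lost the race" (the thread already parked),
    // in which case the waker must hand it to the scheduler, as
    // __schedule_thread( thrd ) does in the CFA code above.
    bool unpark_must_schedule(struct thread_desc *t) {
        return atomic_fetch_add(&t->ticket, 1) == 1;
    }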
libcfa/src/concurrency/kernel.hfa
--- r54dcab1
+++ r231b18f
@@ -275,10 +275,8 @@
 static inline [cluster *&, cluster *& ] __get( cluster & this ) __attribute__((const)) { return this.node.[next, prev]; }
 
-static inline struct processor * active_processor() { return publicTLS_get( this_processor ); } // UNSAFE
-static inline struct cluster   * active_cluster  () { return publicTLS_get( this_processor )->cltr; }
+static inline struct processor * active_processor() { return TL_GET( this_processor ); } // UNSAFE
+static inline struct cluster   * active_cluster  () { return TL_GET( this_processor )->cltr; }
 
 #if !defined(__CFA_NO_STATISTICS__)
-	void print_stats_now( cluster & this, int flags );
-
 	static inline void print_stats_at_exit( cluster & this, int flags ) {
 		this.print_stats |= flags;
libcfa/src/concurrency/kernel/fwd.hfa
--- r54dcab1
+++ r231b18f
@@ -55,24 +55,13 @@
 			uint64_t bck_seed;
 		} ready_rng;
-	} __cfaabi_tls __attribute__ ((tls_model ( "initial-exec" )));
+	} kernelTLS __attribute__ ((tls_model ( "initial-exec" )));
 
-	extern bool __preemption_enabled();
 
-	static inline KernelThreadData & kernelTLS( void ) {
-		/* paranoid */ verify( ! __preemption_enabled() );
-		return __cfaabi_tls;
-	}
-
-	extern uintptr_t __cfatls_get( unsigned long int member );
-	// #define publicTLS_get( member ) ((typeof(__cfaabi_tls.member))__cfatls_get( __builtin_offsetof(KernelThreadData, member) ))
-	#define publicTLS_get( member ) (__cfaabi_tls.member)
-	// extern forall(otype T) T __cfatls_get( T * member, T value );
-	// #define publicTLS_set( member, value ) __cfatls_set( (typeof(member)*)__builtin_offsetof(KernelThreadData, member), value );
 
 	static inline uint64_t __tls_rand() {
 		#if defined(__SIZEOF_INT128__)
-			return __lehmer64( kernelTLS().rand_seed );
+			return __lehmer64( kernelTLS.rand_seed );
 		#else
-			return __xorshift64( kernelTLS().rand_seed );
+			return __xorshift64( kernelTLS.rand_seed );
 		#endif
 	}
@@ -86,11 +75,11 @@
 	static inline unsigned __tls_rand_fwd() {
 
-		kernelTLS().ready_rng.fwd_seed = (A * kernelTLS().ready_rng.fwd_seed + C) & (M - 1);
-		return kernelTLS().ready_rng.fwd_seed >> D;
+		kernelTLS.ready_rng.fwd_seed = (A * kernelTLS.ready_rng.fwd_seed + C) & (M - 1);
+		return kernelTLS.ready_rng.fwd_seed >> D;
 	}
 
 	static inline unsigned __tls_rand_bck() {
-		unsigned int r = kernelTLS().ready_rng.bck_seed >> D;
-		kernelTLS().ready_rng.bck_seed = AI * (kernelTLS().ready_rng.bck_seed - C) & (M - 1);
+		unsigned int r = kernelTLS.ready_rng.bck_seed >> D;
+		kernelTLS.ready_rng.bck_seed = AI * (kernelTLS.ready_rng.bck_seed - C) & (M - 1);
 		return r;
 	}
@@ -103,9 +92,25 @@
 
 	static inline void __tls_rand_advance_bck(void) {
-		kernelTLS().ready_rng.bck_seed = kernelTLS().ready_rng.fwd_seed;
+		kernelTLS.ready_rng.bck_seed = kernelTLS.ready_rng.fwd_seed;
 	}
 }
 
+#if 0 // def __ARM_ARCH
+	// function prototypes are only really used by these macros on ARM
+	void disable_global_interrupts();
+	void enable_global_interrupts();
 
+	#define TL_GET( member ) ( { __typeof__( kernelTLS.member ) target; \
+		disable_global_interrupts(); \
+		target = kernelTLS.member; \
+		enable_global_interrupts(); \
+		target; } )
+	#define TL_SET( member, value ) disable_global_interrupts(); \
+		kernelTLS.member = value; \
+		enable_global_interrupts();
+#else
+	#define TL_GET( member ) kernelTLS.member
+	#define TL_SET( member, value ) kernelTLS.member = value;
+#endif
 
 extern void disable_interrupts();
@@ -116,9 +121,5 @@
 extern void park( void );
 extern void unpark( struct $thread * this );
-static inline struct $thread * active_thread () {
-	struct $thread * t = publicTLS_get( this_thread );
-	/* paranoid */ verify( t );
-	return t;
-}
+static inline struct $thread * active_thread () { return TL_GET( this_thread ); }
 
 extern bool force_yield( enum __Preemption_Reason );
@@ -139,7 +140,7 @@
 #if !defined(__CFA_NO_STATISTICS__)
 	static inline struct __stats_t * __tls_stats() {
-		/* paranoid */ verify( ! __preemption_enabled() );
-		/* paranoid */ verify( kernelTLS().this_stats );
-		return kernelTLS().this_stats;
+		/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
+		/* paranoid */ verify( kernelTLS.this_stats );
+		return kernelTLS.this_stats;
 	}
 
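The removed publicTLS_get/__cfatls_get pair on the left side of this diff packs all kernel state into one thread_local struct and reads members through a non-inlined accessor taking a byte offset, so the TLS address computation cannot be split by the optimizer and interleaved with a preemption point. A minimal C sketch of that pattern, with hypothetical names:

    #include <stdint.h>
    #include <stddef.h>

    struct kernel_tls {
        void     *this_thread;
        void     *this_processor;
        uint64_t  rand_seed;
    };

    static _Thread_local struct kernel_tls tls_block;

    // Out-of-line on purpose: the base+offset load happens as one
    // self-contained unit inside this function.
    __attribute__((noinline))
    uintptr_t tls_get(unsigned long offset) {
        return *(uintptr_t *)((uintptr_t)&tls_block + offset);
    }

    // Typed convenience wrapper, analogous to the commented-out
    // publicTLS_get definition in the removed lines.
    #define PUBLIC_TLS_GET(member) \
        ((__typeof__(tls_block.member))tls_get(offsetof(struct kernel_tls, member)))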
libcfa/src/concurrency/kernel/startup.cfa
--- r54dcab1
+++ r231b18f
@@ -118,5 +118,5 @@
 //-----------------------------------------------------------------------------
 // Global state
-thread_local struct KernelThreadData __cfaabi_tls __attribute__ ((tls_model ( "initial-exec" ))) @= {
+thread_local struct KernelThreadData kernelTLS __attribute__ ((tls_model ( "initial-exec" ))) @= {
 	NULL, // cannot use 0p
 	NULL,
@@ -156,5 +156,5 @@
 // Kernel boot procedures
 static void __kernel_startup(void) {
-	/* paranoid */ verify( ! __preemption_enabled() );
+	verify( ! kernelTLS.preemption_state.enabled );
 	__cfadbg_print_safe(runtime_core, "Kernel : Starting\n");
 
@@ -212,11 +212,11 @@
 
 	//initialize the global state variables
-	__cfaabi_tls.this_processor = mainProcessor;
-	__cfaabi_tls.this_proc_id = (__processor_id_t*)mainProcessor;
-	__cfaabi_tls.this_thread = mainThread;
+	kernelTLS.this_processor = mainProcessor;
+	kernelTLS.this_proc_id = (__processor_id_t*)mainProcessor;
+	kernelTLS.this_thread = mainThread;
 
 	#if !defined( __CFA_NO_STATISTICS__ )
-		__cfaabi_tls.this_stats = (__stats_t *)& storage_mainProcStats;
-		__init_stats( __cfaabi_tls.this_stats );
+		kernelTLS.this_stats = (__stats_t *)& storage_mainProcStats;
+		__init_stats( kernelTLS.this_stats );
 	#endif
 
@@ -234,5 +234,5 @@
 	// context. Hence, the main thread does not begin through __cfactx_invoke_thread, like all other threads. The trick here is that
 	// mainThread is on the ready queue when this call is made.
-	__kernel_first_resume( __cfaabi_tls.this_processor );
+	__kernel_first_resume( kernelTLS.this_processor );
 
 
@@ -251,8 +251,7 @@
 	__cfadbg_print_safe(runtime_core, "Kernel : Started\n--------------------------------------------------\n\n");
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	verify( ! kernelTLS.preemption_state.enabled );
 	enable_interrupts( __cfaabi_dbg_ctx );
-	/* paranoid */ verify( __preemption_enabled() );
-
+	verify( TL_GET( preemption_state.enabled ) );
 }
 
@@ -263,7 +262,7 @@
 	mainCluster->io.ctxs = 0p;
 
-	/* paranoid */ verify( __preemption_enabled() );
+	/* paranoid */ verify( TL_GET( preemption_state.enabled ) );
 	disable_interrupts();
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 
 	__cfadbg_print_safe(runtime_core, "\n--------------------------------------------------\nKernel : Shutting down\n");
@@ -273,5 +272,5 @@
 	// which is currently here
 	__atomic_store_n(&mainProcessor->do_terminate, true, __ATOMIC_RELEASE);
-	__kernel_last_resume( __cfaabi_tls.this_processor );
+	__kernel_last_resume( kernelTLS.this_processor );
 	mainThread->self_cor.state = Halted;
 
@@ -322,13 +321,13 @@
 		__stats_t local_stats;
 		__init_stats( &local_stats );
-		__cfaabi_tls.this_stats = &local_stats;
+		kernelTLS.this_stats = &local_stats;
 	#endif
 
 	processor * proc = (processor *) arg;
-	__cfaabi_tls.this_processor = proc;
-	__cfaabi_tls.this_proc_id = (__processor_id_t*)proc;
-	__cfaabi_tls.this_thread = 0p;
-	__cfaabi_tls.preemption_state.[enabled, disable_count] = [false, 1];
+	kernelTLS.this_processor = proc;
+	kernelTLS.this_proc_id = (__processor_id_t*)proc;
+	kernelTLS.this_thread = 0p;
+	kernelTLS.preemption_state.[enabled, disable_count] = [false, 1];
 	// SKULLDUGGERY: We want to create a context for the processor coroutine
 	// which is needed for the 2-step context switch. However, there is no reason
@@ -341,5 +340,5 @@
 
 	//Set global state
-	__cfaabi_tls.this_thread = 0p;
+	kernelTLS.this_thread = 0p;
 
 	//We now have a proper context from which to schedule threads
@@ -371,11 +370,11 @@
 	$coroutine * dst = get_coroutine(this->runner);
 
-	/* paranoid */ verify( ! __preemption_enabled() );
-
-	__cfaabi_tls.this_thread->curr_cor = dst;
+	verify( ! kernelTLS.preemption_state.enabled );
+
+	kernelTLS.this_thread->curr_cor = dst;
 	__stack_prepare( &dst->stack, 65000 );
 	__cfactx_start(main, dst, this->runner, __cfactx_invoke_coroutine);
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	verify( ! kernelTLS.preemption_state.enabled );
 
 	dst->last = &src->self_cor;
@@ -395,4 +394,4 @@
 	/* paranoid */ verify(src->state == Active);
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	verify( ! kernelTLS.preemption_state.enabled );
 }
@@ -403,7 +402,7 @@
 	$coroutine * dst = get_coroutine(this->runner);
 
-	/* paranoid */ verify( ! __preemption_enabled() );
-	/* paranoid */ verify( dst->starter == src );
-	/* paranoid */ verify( dst->context.SP );
+	verify( ! kernelTLS.preemption_state.enabled );
+	verify( dst->starter == src );
+	verify( dst->context.SP );
 
 	// SKULLDUGGERY in debug the processors check that the
@@ -547,4 +546,4 @@
 
 	P( terminated );
-	/* paranoid */ verify( active_processor() != &this);
+	verify( kernelTLS.this_processor != &this);
 }
@@ -697,5 +696,5 @@
 #if defined(__CFA_WITH_VERIFY__)
 static bool verify_fwd_bck_rng(void) {
-	__cfaabi_tls.ready_rng.fwd_seed = 25214903917_l64u * (rdtscl() ^ (uintptr_t)&verify_fwd_bck_rng);
+	kernelTLS.ready_rng.fwd_seed = 25214903917_l64u * (rdtscl() ^ (uintptr_t)&verify_fwd_bck_rng);
 
 	unsigned values[10];
libcfa/src/concurrency/kernel_private.hfa
--- r54dcab1
+++ r231b18f
@@ -38,6 +38,4 @@
 #endif
 ;
-
-extern bool __preemption_enabled();
 
 //release/wake-up the following resources
@@ -183,9 +181,8 @@
 // creating/destroying queues
 static inline void ready_schedule_lock(void) with(*__scheduler_lock) {
-	/* paranoid */ verify( ! __preemption_enabled() );
-	/* paranoid */ verify( kernelTLS().this_proc_id );
-
-	unsigned iproc = kernelTLS().this_proc_id->id;
-	/*paranoid*/ verify(data[iproc].handle == kernelTLS().this_proc_id);
+	/*paranoid*/ verify( kernelTLS.this_proc_id );
+
+	unsigned iproc = kernelTLS.this_proc_id->id;
+	/*paranoid*/ verify(data[iproc].handle == kernelTLS.this_proc_id);
 	/*paranoid*/ verify(iproc < ready);
 
@@ -210,9 +207,8 @@
 
 static inline void ready_schedule_unlock(void) with(*__scheduler_lock) {
-	/* paranoid */ verify( ! __preemption_enabled() );
-	/* paranoid */ verify( kernelTLS().this_proc_id );
-
-	unsigned iproc = kernelTLS().this_proc_id->id;
-	/*paranoid*/ verify(data[iproc].handle == kernelTLS().this_proc_id);
+	/*paranoid*/ verify( kernelTLS.this_proc_id );
+
+	unsigned iproc = kernelTLS.this_proc_id->id;
+	/*paranoid*/ verify(data[iproc].handle == kernelTLS.this_proc_id);
 	/*paranoid*/ verify(iproc < ready);
 	/*paranoid*/ verify(data[iproc].lock);
@@ -227,7 +223,6 @@
 #ifdef __CFA_WITH_VERIFY__
 	static inline bool ready_schedule_islocked(void) {
-		/* paranoid */ verify( ! __preemption_enabled() );
-		/*paranoid*/ verify( kernelTLS().this_proc_id );
-		__processor_id_t * proc = kernelTLS().this_proc_id;
+		/*paranoid*/ verify( kernelTLS.this_proc_id );
+		__processor_id_t * proc = kernelTLS.this_proc_id;
 		return __scheduler_lock->data[proc->id].owned;
 	}
libcfa/src/concurrency/monitor.cfa
--- r54dcab1
+++ r231b18f
@@ -82,8 +82,8 @@
 // Enter single monitor
 static void __enter( $monitor * this, const __monitor_group_t & group ) {
-	$thread * thrd = active_thread();
-
 	// Lock the monitor spinlock
 	lock( this->lock __cfaabi_dbg_ctx2 );
+	// Interrupts disable inside critical section
+	$thread * thrd = kernelTLS.this_thread;
 
 	__cfaabi_dbg_print_safe( "Kernel : %10p Entering mon %p (%p)\n", thrd, this, this->owner);
@@ -126,5 +126,5 @@
 		__cfaabi_dbg_print_safe( "Kernel : %10p Entered mon %p\n", thrd, this);
 
-		/* paranoid */ verifyf( active_thread() == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+		/* paranoid */ verifyf( kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 		return;
 	}
@@ -132,5 +132,5 @@
 	__cfaabi_dbg_print_safe( "Kernel : %10p Entered mon %p\n", thrd, this);
 
-	/* paranoid */ verifyf( active_thread() == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+	/* paranoid */ verifyf( kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 	/* paranoid */ verify( this->lock.lock );
 
@@ -141,8 +141,8 @@
 
 static void __dtor_enter( $monitor * this, fptr_t func, bool join ) {
-	$thread * thrd = active_thread();
-
 	// Lock the monitor spinlock
 	lock( this->lock __cfaabi_dbg_ctx2 );
+	// Interrupts disable inside critical section
+	$thread * thrd = kernelTLS.this_thread;
 
 	__cfaabi_dbg_print_safe( "Kernel : %10p Entering dtor for mon %p (%p)\n", thrd, this, this->owner);
@@ -155,5 +155,5 @@
 		__set_owner( this, thrd );
 
-		verifyf( active_thread() == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+		verifyf( kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 
 		unlock( this->lock );
@@ -174,5 +174,5 @@
 		this->owner = thrd;
 
-		verifyf( active_thread() == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+		verifyf( kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 
 		unlock( this->lock );
@@ -200,5 +200,5 @@
 
 		// Release the next thread
-		/* paranoid */ verifyf( urgent->owner->waiting_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+		/* paranoid */ verifyf( urgent->owner->waiting_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 		unpark( urgent->owner->waiting_thread );
 
@@ -207,5 +207,5 @@
 
 		// Some one was waiting for us, enter
-		/* paranoid */ verifyf( active_thread() == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+		/* paranoid */ verifyf( kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 	}
 	else {
@@ -224,5 +224,5 @@
 	park();
 
-	/* paranoid */ verifyf( active_thread() == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+	/* paranoid */ verifyf( kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 	return;
 }
@@ -237,7 +237,7 @@
 	lock( this->lock __cfaabi_dbg_ctx2 );
 
-	__cfaabi_dbg_print_safe( "Kernel : %10p Leaving mon %p (%p)\n", active_thread(), this, this->owner);
+	__cfaabi_dbg_print_safe( "Kernel : %10p Leaving mon %p (%p)\n", kernelTLS.this_thread, this, this->owner);
 
-	/* paranoid */ verifyf( active_thread() == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+	/* paranoid */ verifyf( kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 
 	// Leaving a recursion level, decrement the counter
@@ -270,6 +270,6 @@
 void __dtor_leave( $monitor * this, bool join ) {
 	__cfaabi_dbg_debug_do(
-		if( active_thread() != this->owner ) {
-			abort( "Destroyed monitor %p has inconsistent owner, expected %p got %p.\n", this, active_thread(), this->owner);
+		if( TL_GET( this_thread ) != this->owner ) {
+			abort( "Destroyed monitor %p has inconsistent owner, expected %p got %p.\n", this, TL_GET( this_thread ), this->owner);
 		}
 		if( this->recursion != 1 && !join ) {
@@ -287,5 +287,5 @@
 	/* paranoid */ verify( this->lock.lock );
 	/* paranoid */ verifyf( thrd == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", thrd, this->owner, this->recursion, this );
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	/* paranoid */ verify( thrd->state == Halted );
 	/* paranoid */ verify( this->recursion == 1 );
@@ -303,5 +303,5 @@
 	// Unpark the next owner if needed
 	/* paranoid */ verifyf( !new_owner || new_owner == this->owner, "Expected owner to be %p, got %p (m: %p)", new_owner, this->owner, this );
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	/* paranoid */ verify( thrd->state == Halted );
 	unpark( new_owner );
@@ -327,5 +327,5 @@
 // Sorts monitors before entering
 void ?{}( monitor_guard_t & this, $monitor * m [], __lock_size_t count, fptr_t func ) {
-	$thread * thrd = active_thread();
+	$thread * thrd = TL_GET( this_thread );
 
 	// Store current array
@@ -362,5 +362,5 @@
 
 	// Restore thread context
-	active_thread()->monitors = this.prev;
+	TL_GET( this_thread )->monitors = this.prev;
 }
 
@@ -369,5 +369,5 @@
 void ?{}( monitor_dtor_guard_t & this, $monitor * m [], fptr_t func, bool join ) {
 	// optimization
-	$thread * thrd = active_thread();
+	$thread * thrd = TL_GET( this_thread );
 
 	// Store current array
@@ -392,5 +392,5 @@
 
 	// Restore thread context
-	active_thread()->monitors = this.prev;
+	TL_GET( this_thread )->monitors = this.prev;
 }
 
@@ -432,5 +432,5 @@
 
 	// Create the node specific to this wait operation
-	wait_ctx( active_thread(), user_info );
+	wait_ctx( TL_GET( this_thread ), user_info );
 
 	// Append the current wait operation to the ones already queued on the condition
@@ -483,5 +483,5 @@
 	//Some more checking in debug
 	__cfaabi_dbg_debug_do(
-		$thread * this_thrd = active_thread();
+		$thread * this_thrd = TL_GET( this_thread );
 		if ( this.monitor_count != this_thrd->monitors.size ) {
 			abort( "Signal on condition %p made with different number of monitor(s), expected %zi got %zi", &this, this.monitor_count, this_thrd->monitors.size );
@@ -531,5 +531,5 @@
 
 	// Create the node specific to this wait operation
-	wait_ctx_primed( active_thread(), 0 )
+	wait_ctx_primed( kernelTLS.this_thread, 0 )
 
 	//save contexts
@@ -630,5 +630,5 @@
 
 	// Create the node specific to this wait operation
-	wait_ctx_primed( active_thread(), 0 );
+	wait_ctx_primed( kernelTLS.this_thread, 0 );
 
 	// Save monitor states
@@ -682,5 +682,5 @@
 
 	// Create the node specific to this wait operation
-	wait_ctx_primed( active_thread(), 0 );
+	wait_ctx_primed( kernelTLS.this_thread, 0 );
 
 	monitor_save;
@@ -688,5 +688,5 @@
 
 	for( __lock_size_t i = 0; i < count; i++) {
-		verify( monitors[i]->owner == active_thread() );
+		verify( monitors[i]->owner == kernelTLS.this_thread );
 	}
 
@@ -724,10 +724,10 @@
 static inline void __set_owner( $monitor * monitors [], __lock_size_t count, $thread * owner ) {
 	/* paranoid */ verify ( monitors[0]->lock.lock );
-	/* paranoid */ verifyf( monitors[0]->owner == active_thread(), "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), monitors[0]->owner, monitors[0]->recursion, monitors[0] );
+	/* paranoid */ verifyf( monitors[0]->owner == kernelTLS.this_thread, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, monitors[0]->owner, monitors[0]->recursion, monitors[0] );
 	monitors[0]->owner = owner;
 	monitors[0]->recursion = 1;
 	for( __lock_size_t i = 1; i < count; i++ ) {
 		/* paranoid */ verify ( monitors[i]->lock.lock );
-		/* paranoid */ verifyf( monitors[i]->owner == active_thread(), "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), monitors[i]->owner, monitors[i]->recursion, monitors[i] );
+		/* paranoid */ verifyf( monitors[i]->owner == kernelTLS.this_thread, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, monitors[i]->owner, monitors[i]->recursion, monitors[i] );
 		monitors[i]->owner = owner;
 		monitors[i]->recursion = 0;
@@ -755,4 +755,4 @@
 		//regardless of if we are ready to baton pass,
 		//we need to set the monitor as in use
-		/* paranoid */ verifyf( !this->owner || active_thread() == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+		/* paranoid */ verifyf( !this->owner || kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 		__set_owner( this, urgent->owner->waiting_thread );
@@ -764,5 +764,5 @@
 	// Get the next thread in the entry_queue
 	$thread * new_owner = pop_head( this->entry_queue );
-	/* paranoid */ verifyf( !this->owner || active_thread() == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", active_thread(), this->owner, this->recursion, this );
+	/* paranoid */ verifyf( !this->owner || kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
 	/* paranoid */ verify( !new_owner || new_owner->link.next == 0p );
 	__set_owner( this, new_owner );
@@ -892,5 +892,5 @@
 
 static inline void brand_condition( condition & this ) {
-	$thread * thrd = active_thread();
+	$thread * thrd = TL_GET( this_thread );
 	if( !this.monitors ) {
 		// __cfaabi_dbg_print_safe( "Branding\n" );
libcfa/src/concurrency/preemption.cfa
--- r54dcab1
+++ r231b18f
@@ -163,17 +163,18 @@
 // Kernel Signal Tools
 //=============================================================================================
 
-//
+// In a user-level threading system, there are handful of thread-local variables where this problem occurs on the ARM.
+//
 // For each kernel thread running user-level threads, there is a flag variable to indicate if interrupts are
 // enabled/disabled for that kernel thread. Therefore, this variable is made thread local.
 //
 // For example, this code fragment sets the state of the "interrupt" variable in thread-local memory.
 //
 //    _Thread_local volatile int interrupts;
 //    int main() {
 //        interrupts = 0; // disable interrupts }
 //
 // which generates the following code on the ARM
 //
 // (gdb) disassemble main
 // Dump of assembler code for function main:
@@ -184,5 +185,5 @@
 //    0x0000000000000620 <+16>: str wzr, [x1]
 //    0x0000000000000624 <+20>: ret
 //
 // The mrs moves a pointer from coprocessor register tpidr_el0 into register x1. Register w0 is set to 0. The two adds
 // increase the TLS pointer with the displacement (offset) 0x10, which is the location in the TSL of variable
@@ -192,22 +193,22 @@
 // the user-level ready-queue it is run on kernel thread M. It now stores 0 into "interrupts" back on kernel thread N,
 // turning off interrupt on the wrong kernel thread.
 //
 // On the x86, the following code is generated for the same code fragment.
 //
 // (gdb) disassemble main
 // Dump of assembler code for function main:
 //    0x0000000000400420 <+0>:  movl $0x0,%fs:0xfffffffffffffffc
 //    0x000000000040042c <+12>: xor %eax,%eax
 //    0x000000000040042e <+14>: retq
 //
 // and there is base-displacement addressing used to atomically reset variable "interrupts" off of the TSL pointer in
 // register "fs".
 //
 // Hence, the ARM has base-displacement address for the general purpose registers, BUT not to the coprocessor
 // registers. As a result, generating the address for the write into variable "interrupts" is no longer atomic.
 //
 // Note this problem does NOT occur when just using multiple kernel threads because the preemption ALWAYS restarts the
 // thread on the same kernel thread.
 //
 // The obvious question is why does ARM use a coprocessor register to store the TSL pointer given that coprocessor
 // registers are second-class registers with respect to the instruction set. One possible answer is that they did not
@@ -215,36 +216,5 @@
 // available.
 
-//----------
-// special case for preemption since used often
-bool __preemption_enabled() {
-	// create a assembler label before
-	// marked as clobber all to avoid movement
-	asm volatile("__cfaasm_check_before:":::"memory");
-
-	// access tls as normal
-	bool enabled = __cfaabi_tls.preemption_state.enabled;
-
-	// create a assembler label after
-	// marked as clobber all to avoid movement
-	asm volatile("__cfaasm_check_after:":::"memory");
-	return enabled;
-}
-
-//----------
-// Get data from the TLS block
-uintptr_t __cfatls_get( unsigned long int offset ) __attribute__((__noinline__)); //no inline to avoid problems
-uintptr_t __cfatls_get( unsigned long int offset ) {
-	// create a assembler label before
-	// marked as clobber all to avoid movement
-	asm volatile("__cfaasm_get_before:":::"memory");
-
-	// access tls as normal (except for pointer arithmetic)
-	uintptr_t val = *(uintptr_t*)((uintptr_t)&__cfaabi_tls + offset);
-
-	// create a assembler label after
-	// marked as clobber all to avoid movement
-	asm volatile("__cfaasm_get_after:":::"memory");
-	return val;
-}
+__cfaabi_dbg_debug_do( static thread_local void * last_interrupt = 0; )
 
 extern "C" {
@@ -251,8 +221,4 @@
 	// Disable interrupts by incrementing the counter
 	void disable_interrupts() {
-		// create a assembler label before
-		// marked as clobber all to avoid movement
-		asm volatile("__cfaasm_disable_before:":::"memory");
-
-		with( __cfaabi_tls.preemption_state ) {
+		with( kernelTLS.preemption_state ) {
 			#if GCC_VERSION > 50000
@@ -272,8 +238,4 @@
 			verify( new_val < 65_000u ); // If this triggers someone is disabling interrupts without enabling them
 		}
-
-		// create a assembler label after
-		// marked as clobber all to avoid movement
-		asm volatile("__cfaasm_disable_after:":::"memory");
 	}
 
@@ -281,12 +243,8 @@
 	// If counter reaches 0, execute any pending __cfactx_switch
 	void enable_interrupts( __cfaabi_dbg_ctx_param ) {
-		// create a assembler label before
-		// marked as clobber all to avoid movement
-		asm volatile("__cfaasm_enable_before:":::"memory");
-
-		processor * proc = __cfaabi_tls.this_processor; // Cache the processor now since interrupts can start happening after the atomic store
+		processor * proc = kernelTLS.this_processor; // Cache the processor now since interrupts can start happening after the atomic store
 		/* paranoid */ verify( proc );
 
-		with( __cfaabi_tls.preemption_state ){
+		with( kernelTLS.preemption_state ){
 			unsigned short prev = disable_count;
 			disable_count -= 1;
@@ -315,8 +273,4 @@
 			// For debugging purposes : keep track of the last person to enable the interrupts
 			__cfaabi_dbg_debug_do( proc->last_enable = caller; )
-
-		// create a assembler label after
-		// marked as clobber all to avoid movement
-		asm volatile("__cfaasm_enable_after:":::"memory");
 	}
 
@@ -324,10 +278,6 @@
 	// Don't execute any pending __cfactx_switch even if counter reaches 0
 	void enable_interrupts_noPoll() {
-		// create a assembler label before
-		// marked as clobber all to avoid movement
-		asm volatile("__cfaasm_nopoll_before:":::"memory");
-
-		unsigned short prev = __cfaabi_tls.preemption_state.disable_count;
-		__cfaabi_tls.preemption_state.disable_count -= 1;
+		unsigned short prev = kernelTLS.preemption_state.disable_count;
+		kernelTLS.preemption_state.disable_count -= 1;
 		verifyf( prev != 0u, "Incremented from %u\n", prev ); // If this triggers someone is enabled already enabled interrupts
 		if( prev == 1 ) {
@@ -334,10 +288,10 @@
 			#if GCC_VERSION > 50000
-			static_assert(__atomic_always_lock_free(sizeof(__cfaabi_tls.preemption_state.enabled), &__cfaabi_tls.preemption_state.enabled), "Must be lock-free");
+			static_assert(__atomic_always_lock_free(sizeof(kernelTLS.preemption_state.enabled), &kernelTLS.preemption_state.enabled), "Must be lock-free");
 			#endif
 			// Set enabled flag to true
 			// should be atomic to avoid preemption in the middle of the operation.
 			// use memory order RELAXED since there is no inter-thread on this variable requirements
-			__atomic_store_n(&__cfaabi_tls.preemption_state.enabled, true, __ATOMIC_RELAXED);
+			__atomic_store_n(&kernelTLS.preemption_state.enabled, true, __ATOMIC_RELAXED);
 
 			// Signal the compiler that a fence is needed but only for signal handlers
 			__atomic_signal_fence(__ATOMIC_RELEASE);
@@ -344,7 +294,3 @@
 		}
-
-		// create a assembler label after
-		// marked as clobber all to avoid movement
-		asm volatile("__cfaasm_nopoll_after:":::"memory");
 	}
 }
@@ -381,5 +327,5 @@
 static void timeout( $thread * this ) {
 	#if !defined( __CFA_NO_STATISTICS__ )
-		kernelTLS().this_stats = this->curr_cluster->stats;
+		kernelTLS.this_stats = this->curr_cluster->stats;
 	#endif
 	unpark( this );
@@ -392,8 +338,8 @@
 static inline bool preemption_ready() {
 	// Check if preemption is safe
-	bool ready = __cfaabi_tls.preemption_state.enabled && ! __cfaabi_tls.preemption_state.in_progress;
+	bool ready = kernelTLS.preemption_state.enabled && ! kernelTLS.preemption_state.in_progress;
 
 	// Adjust the pending flag accordingly
-	__cfaabi_tls.this_processor->pending_preemption = !ready;
+	kernelTLS.this_processor->pending_preemption = !ready;
 	return ready;
 }
@@ -409,6 +355,6 @@
 
 	// Start with preemption disabled until ready
-	__cfaabi_tls.preemption_state.enabled = false;
-	__cfaabi_tls.preemption_state.disable_count = 1;
+	kernelTLS.preemption_state.enabled = false;
+	kernelTLS.preemption_state.disable_count = 1;
 
 	// Initialize the event kernel
@@ -468,44 +414,3 @@
 // Kernel Signal Handlers
 //=============================================================================================
-struct asm_region {
-	void * before;
-	void * after;
-};
-
-//-----------------------------------------------------------------------------
-// Some assembly required
-#if defined( __i386 )
-	#define __cfaasm_label( label ) \
-		({ \
-			struct asm_region region; \
-			asm( \
-				"movl $__cfaasm_" #label "_before, %[vb]\n\t" \
-				"movl $__cfaasm_" #label "_after , %[va]\n\t" \
-				: [vb]"=r"(region.before), [vb]"=r"(region.before) \
-			); \
-			region; \
-		});
-#elif defined( __x86_64 )
-	#ifdef __PIC__
-		#define PLT "@PLT"
-	#else
-		#define PLT ""
-	#endif
-	#define __cfaasm_label( label ) \
-		({ \
-			struct asm_region region; \
-			asm( \
-				"movq $__cfaasm_" #label "_before" PLT ", %[vb]\n\t" \
-				"movq $__cfaasm_" #label "_after" PLT ", %[va]\n\t" \
-				: [vb]"=r"(region.before), [va]"=r"(region.after) \
-			); \
-			region; \
-		});
-#elif defined( __aarch64__ )
-	#error __cfaasm_label undefined for arm
-#else
-	#error unknown hardware architecture
-#endif
-
-__cfaabi_dbg_debug_do( static thread_local void * last_interrupt = 0; )
 
@@ -512,7 +417,6 @@
 // Context switch signal handler
 // Receives SIGUSR1 signal and causes the current thread to yield
 static void sigHandler_ctxSwitch( __CFA_SIGPARMS__ ) {
-	void * ip = (void *)(cxt->uc_mcontext.CFA_REG_IP);
-	__cfaabi_dbg_debug_do( last_interrupt = ip; )
+	__cfaabi_dbg_debug_do( last_interrupt = (void *)(cxt->uc_mcontext.CFA_REG_IP); )
 
 	// SKULLDUGGERY: if a thread creates a processor and the immediately deletes it,
@@ -520,9 +424,9 @@
 	// before the kernel thread has even started running. When that happens, an interrupt
 	// with a null 'this_processor' will be caught, just ignore it.
-	if(! __cfaabi_tls.this_processor ) return;
+	if(! kernelTLS.this_processor ) return;
 
 	choose(sfp->si_value.sival_int) {
 		case PREEMPT_NORMAL : ;// Normal case, nothing to do here
-		case PREEMPT_TERMINATE: verify( __atomic_load_n( &__cfaabi_tls.this_processor->do_terminate, __ATOMIC_SEQ_CST ) );
+		case PREEMPT_TERMINATE: verify( __atomic_load_n( &kernelTLS.this_processor->do_terminate, __ATOMIC_SEQ_CST ) );
 		default:
 			abort( "internal error, signal value is %d", sfp->si_value.sival_int );
@@ -532,15 +436,8 @@
 	// Check if it is safe to preempt here
 	if( !preemption_ready() ) { return; }
 
-	struct asm_region region;
-	region = __cfaasm_label( get     ); if( ip >= region.before && ip <= region.after ) return;
-	region = __cfaasm_label( check   ); if( ip >= region.before && ip <= region.after ) return;
-	region = __cfaasm_label( disable ); if( ip >= region.before && ip <= region.after ) return;
-	region = __cfaasm_label( enable  ); if( ip >= region.before && ip <= region.after ) return;
-	region = __cfaasm_label( nopoll  ); if( ip >= region.before && ip <= region.after ) return;
-
-	__cfaabi_dbg_print_buffer_decl( " KERNEL: preempting core %p (%p @ %p).\n", __cfaabi_tls.this_processor, __cfaabi_tls.this_thread, (void *)(cxt->uc_mcontext.CFA_REG_IP) );
+	__cfaabi_dbg_print_buffer_decl( " KERNEL: preempting core %p (%p @ %p).\n", kernelTLS.this_processor, kernelTLS.this_thread, (void *)(cxt->uc_mcontext.CFA_REG_IP) );
 
 	// Sync flag : prevent recursive calls to the signal handler
-	__cfaabi_tls.preemption_state.in_progress = true;
+	kernelTLS.preemption_state.in_progress = true;
 
 	// Clear sighandler mask before context switching.
@@ -552,6 +449,7 @@
 	}
 
+	// TODO: this should go in finish action
 	// Clear the in progress flag
-	__cfaabi_tls.preemption_state.in_progress = false;
+	kernelTLS.preemption_state.in_progress = false;
 
 	// Preemption can occur here
@@ -570,5 +468,5 @@
 	id.full_proc = false;
 	id.id = doregister(&id);
-	__cfaabi_tls.this_proc_id = &id;
+	kernelTLS.this_proc_id = &id;
 
 	// Block sigalrms to control when they arrive
@@ -638,5 +536,5 @@
 
 void __cfaabi_check_preemption() {
-	bool ready = __preemption_enabled();
+	bool ready = kernelTLS.preemption_state.enabled;
 	if(!ready) { abort("Preemption should be ready"); }
 
@@ -661,5 +559,5 @@
 #ifdef __CFA_WITH_VERIFY__
 bool __cfaabi_dbg_in_kernel() {
-	return ! __preemption_enabled();
+	return !kernelTLS.preemption_state.enabled;
 }
 #endif
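The __cfaasm_label machinery removed on the right side of this diff exists precisely because of the ARM TLS problem described in the long comment: every TLS access in the preemption path is bracketed by assembler labels, and the signal handler refuses to preempt when the interrupted instruction pointer falls inside a bracketed range. A minimal sketch of the technique in GCC-style C for non-PIC x86-64, with hypothetical label names:

    #include <stdint.h>

    struct asm_region { void *before, *after; };

    static _Thread_local volatile int interrupts_enabled;

    // noinline so the labels are emitted exactly once.
    __attribute__((noinline))
    int read_interrupt_flag(void) {
        asm volatile("sketch_check_before:" ::: "memory"); // label + code barrier
        int enabled = interrupts_enabled;                  // the guarded TLS access
        asm volatile("sketch_check_after:"  ::: "memory");
        return enabled;
    }

    static struct asm_region check_region(void) {
        struct asm_region r;
        asm("movq $sketch_check_before, %[b]\n\t"          // non-PIC form; the CFA
            "movq $sketch_check_after , %[a]\n\t"          // code adds @PLT under PIC
            : [b] "=r"(r.before), [a] "=r"(r.after));
        return r;
    }

    // In the signal handler, `ip` comes from the interrupted ucontext.
    int ip_in_unsafe_region(void *ip) {
        struct asm_region r = check_region();
        uintptr_t p = (uintptr_t)ip;
        return p >= (uintptr_t)r.before && p <= (uintptr_t)r.after; // defer if true
    }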
libcfa/src/concurrency/ready_queue.cfa
--- r54dcab1
+++ r231b18f
@@ -150,5 +150,5 @@
 // queues or removing them.
 uint_fast32_t ready_mutate_lock( void ) with(*__scheduler_lock) {
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 
 	// Step 1 : lock global lock
@@ -166,10 +166,10 @@
 	}
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 	return s;
 }
 
 void ready_mutate_unlock( uint_fast32_t last_s ) with(*__scheduler_lock) {
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 
 	// Step 1 : release local locks
@@ -188,4 +188,4 @@
 	__atomic_store_n(&lock, (bool)false, __ATOMIC_RELEASE);
 
-	/* paranoid */ verify( ! __preemption_enabled() );
+	/* paranoid */ verify( ! kernelTLS.preemption_state.enabled );
 }
@@ -252,5 +252,5 @@
 		preferred =
 			//*
-			kernelTLS().this_processor ? kernelTLS().this_processor->id * 4 : -1;
+			kernelTLS.this_processor ? kernelTLS.this_processor->id * 4 : -1;
 			/*/
 			thrd->link.preferred * 4;
@@ -331,5 +331,5 @@
 			// Don't bother trying locally too much
 			int local_tries = 8;
-			preferred = kernelTLS().this_processor->id * 4;
+			preferred = kernelTLS.this_processor->id * 4;
 
 
tools/stat.py
--- r54dcab1
+++ r231b18f
@@ -1,3 +1,3 @@
-#!/usr/bin/python3
+#!/usr/bin/python
 
 import sys
@@ -17,5 +17,5 @@
 	avg = numpy.mean (content)
 	std = numpy.std  (content)
-	print ("median {0:.1f} avg {1:.1f} stddev {2:.1f}".format( med, avg, std ))
+	print "median {0:.1f} avg {1:.1f} stddev {2:.1f}".format( med, avg, std )
 
 