source: src/libcfa/concurrency/monitor.c @ 97e3296

aaron-thesisarm-ehcleanup-dtorsdeferred_resndemanglerenumforall-pointer-decayjacob/cs343-translationjenkins-sandboxnew-astnew-ast-unique-exprnew-envno_listpersistent-indexerpthread-emulationqualifiedEnumresolv-newwith_gc
Last change on this file since 97e3296 was 97e3296, checked in by Thierry Delisle <tdelisle@…>, 6 years ago

First working implementation of external scheduling... Still lots of testing to do

  • Property mode set to 100644
File size: 20.2 KB
Line 
1//
2// Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo
3//
4// The contents of this file are covered under the licence agreement in the
5// file "LICENCE" distributed with Cforall.
6//
7// monitor_desc.c --
8//
9// Author           : Thierry Delisle
10// Created On       : Thd Feb 23 12:27:26 2017
11// Last Modified By : Peter A. Buhr
12// Last Modified On : Mon Jul 31 14:59:05 2017
13// Update Count     : 3
14//
15
16#include "monitor"
17
18#include <stdlib>
19
20#include "libhdr.h"
21#include "kernel_private.h"
22
23//-----------------------------------------------------------------------------
24// Forward declarations
25static inline void set_owner( monitor_desc * this, thread_desc * owner );
26static inline thread_desc * next_thread( monitor_desc * this );
27static inline int is_accepted( thread_desc * owner, monitor_desc * this, monitor_desc ** group, int group_cnt, void (*func)() );
28
29static inline void lock_all( spinlock ** locks, unsigned short count );
30static inline void lock_all( monitor_desc ** source, spinlock ** /*out*/ locks, unsigned short count );
31static inline void unlock_all( spinlock ** locks, unsigned short count );
32static inline void unlock_all( monitor_desc ** locks, unsigned short count );
33
34static inline void save_recursion   ( monitor_desc ** ctx, unsigned int * /*out*/ recursions, unsigned short count );
35static inline void restore_recursion( monitor_desc ** ctx, unsigned int * /*in */ recursions, unsigned short count );
36
37static inline void init     ( int count, monitor_desc ** monitors, __condition_node_t * waiter, __condition_criterion_t * criteria );
38static inline void init_push( int count, monitor_desc ** monitors, __condition_node_t * waiter, __condition_criterion_t * criteria );
39
40static inline thread_desc * check_condition( __condition_criterion_t * );
41static inline void brand_condition( condition * );
42static inline unsigned short insert_unique( thread_desc ** thrds, unsigned short end, thread_desc * val );
43
44static inline thread_desc * search_entry_queue( __acceptable_t * acceptables, int acc_count, monitor_desc ** monitors, int count );
45
46//-----------------------------------------------------------------------------
47// Useful defines
48#define wait_ctx(thrd, user_info)                               /* Create the necessary information to use the signaller stack       */ \
49        __condition_node_t waiter = { thrd, count, user_info };   /* Create the node specific to this wait operation                   */ \
50        __condition_criterion_t criteria[count];                  /* Create the creteria this wait operation needs to wake up          */ \
51        init( count, monitors, &waiter, criteria );               /* Link everything together                                          */ \
52
53#define wait_ctx_primed(thrd, user_info)                        /* Create the necessary information to use the signaller stack       */ \
54        __condition_node_t waiter = { thrd, count, user_info };   /* Create the node specific to this wait operation                   */ \
55        __condition_criterion_t criteria[count];                  /* Create the creteria this wait operation needs to wake up          */ \
56        init_push( count, monitors, &waiter, criteria );          /* Link everything together and push it to the AS-Stack              */ \
57
58#define monitor_ctx( mons, cnt )              /* Define that create the necessary struct for internal/external scheduling operations */ \
59        monitor_desc ** monitors = mons;        /* Save the targeted monitors                                                          */ \
60        unsigned short count = cnt;             /* Save the count to a local variable                                                  */ \
61        unsigned int recursions[ count ];       /* Save the current recursion levels to restore them later                             */ \
62        spinlock *   locks     [ count ];       /* We need to pass-in an array of locks to BlockInternal                               */ \
63
64//-----------------------------------------------------------------------------
65// Enter/Leave routines
66
67
68extern "C" {
69        // Enter single monitor
70        static void __enter_monitor_desc( monitor_desc * this, monitor_desc ** group, int group_cnt, void (*func)() ) {
71                // Lock the monitor spinlock, lock_yield to reduce contention
72                lock_yield( &this->lock DEBUG_CTX2 );
73                thread_desc * thrd = this_thread;
74
75                this->accepted_index = -1;
76                if( !this->owner ) {
77                        // No one has the monitor, just take it
78                        set_owner( this, thrd );
79                }
80                else if( this->owner == thrd) {
81                        // We already have the monitor, just not how many times we took it
82                        verify( this->recursion > 0 );
83                        this->recursion += 1;
84                }
85                else if( (this->accepted_index = is_accepted( thrd, this, group, group_cnt, func)) >= 0 ) {
86                        // Some one was waiting for us, enter
87                        set_owner( this, thrd );
88                }
89                else {
90                        // Some one else has the monitor, wait in line for it
91                        append( &this->entry_queue, thrd );
92                        BlockInternal( &this->lock );
93
94                        // BlockInternal will unlock spinlock, no need to unlock ourselves
95                        return;
96                }
97
98                // Release the lock and leave
99                unlock( &this->lock );
100                return;
101        }
102
103        // Leave single monitor
104        void __leave_monitor_desc( monitor_desc * this ) {
105                // Lock the monitor spinlock, lock_yield to reduce contention
106                lock_yield( &this->lock DEBUG_CTX2 );
107
108                verifyf( this_thread == this->owner, "Expected owner to be %p, got %p (r: %i)", this_thread, this->owner, this->recursion );
109
110                // Leaving a recursion level, decrement the counter
111                this->recursion -= 1;
112
113                // If we haven't left the last level of recursion
114                // it means we don't need to do anything
115                if( this->recursion != 0) {
116                        unlock( &this->lock );
117                        return;
118                }
119
120                // Get the next thread, will be null on low contention monitor
121                thread_desc * new_owner = next_thread( this );
122
123                // We can now let other threads in safely
124                unlock( &this->lock );
125
126                //We need to wake-up the thread
127                WakeThread( new_owner );
128        }
129
130        // Leave the thread monitor
131        // last routine called by a thread.
132        // Should never return
133        void __leave_thread_monitor( thread_desc * thrd ) {
134                monitor_desc * this = &thrd->mon;
135
136                // Lock the monitor now
137                lock_yield( &this->lock DEBUG_CTX2 );
138
139                disable_interrupts();
140
141                thrd->cor.state = Halted;
142
143                verifyf( thrd == this->owner, "Expected owner to be %p, got %p (r: %i)", thrd, this->owner, this->recursion );
144
145                // Leaving a recursion level, decrement the counter
146                this->recursion -= 1;
147
148                // If we haven't left the last level of recursion
149                // it must mean there is an error
150                if( this->recursion != 0) { abortf("Thread internal monitor has unbalanced recursion"); }
151
152                // Fetch the next thread, can be null
153                thread_desc * new_owner = next_thread( this );
154
155                // Leave the thread, this will unlock the spinlock
156                // Use leave thread instead of BlockInternal which is
157                // specialized for this case and supports null new_owner
158                LeaveThread( &this->lock, new_owner );
159
160                // Control flow should never reach here!
161        }
162}
163
164// Enter multiple monitor
165// relies on the monitor array being sorted
166static inline void enter(monitor_desc ** monitors, int count, void (*func)() ) {
167        for(int i = 0; i < count; i++) {
168                __enter_monitor_desc( monitors[i], monitors, count, func );
169        }
170
171        int acc_idx = monitors[0]->accepted_index;
172        if( acc_idx >= 0 && monitors[0]->acceptables[ acc_idx ].run_preaccept ) {
173                assert( monitors[0]->pre_accept );
174                monitors[0]->pre_accept();
175        }
176}
177
178// Leave multiple monitor
179// relies on the monitor array being sorted
180static inline void leave(monitor_desc ** monitors, int count) {
181        for(int i = count - 1; i >= 0; i--) {
182                __leave_monitor_desc( monitors[i] );
183        }
184}
185
186// Ctor for monitor guard
187// Sorts monitors before entering
188void ?{}( monitor_guard_t * this, monitor_desc ** m, int count, void (*func)() ) {
189        // Store current array
190        this->m = m;
191        this->count = count;
192
193        // Sort monitors based on address -> TODO use a sort specialized for small numbers
194        qsort(this->m, count);
195
196        // Enter the monitors in order
197        enter( this->m, this->count, func );
198
199        // Save previous thread context
200        this->prev_mntrs = this_thread->current_monitors;
201        this->prev_count = this_thread->current_monitor_count;
202
203        // Update thread context (needed for conditions)
204        this_thread->current_monitors      = m;
205        this_thread->current_monitor_count = count;
206}
207
208// Dtor for monitor guard
209void ^?{}( monitor_guard_t * this ) {
210        // Leave the monitors in order
211        leave( this->m, this->count );
212
213        // Restore thread context
214        this_thread->current_monitors      = this->prev_mntrs;
215        this_thread->current_monitor_count = this->prev_count;
216}
217
218//-----------------------------------------------------------------------------
219// Internal scheduling types
220
221void ?{}(__condition_node_t * this, thread_desc * waiting_thread, unsigned short count, uintptr_t user_info ) {
222        this->waiting_thread = waiting_thread;
223        this->count = count;
224        this->next = NULL;
225        this->user_info = user_info;
226}
227
228void ?{}(__condition_criterion_t * this ) {
229        this->ready  = false;
230        this->target = NULL;
231        this->owner  = NULL;
232        this->next   = NULL;
233}
234
235void ?{}(__condition_criterion_t * this, monitor_desc * target, __condition_node_t * owner ) {
236        this->ready  = false;
237        this->target = target;
238        this->owner  = owner;
239        this->next   = NULL;
240}
241
242//-----------------------------------------------------------------------------
243// Internal scheduling
244void wait( condition * this, uintptr_t user_info = 0 ) {
245        brand_condition( this );
246
247        // Check that everything is as expected
248        assertf( this->monitors != NULL, "Waiting with no monitors (%p)", this->monitors );
249        verifyf( this->monitor_count != 0, "Waiting with 0 monitors (%i)", this->monitor_count );
250        verifyf( this->monitor_count < 32u, "Excessive monitor count (%i)", this->monitor_count );
251
252        // Create storage for monitor context
253        monitor_ctx( this->monitors, this->monitor_count );
254
255        // Create the node specific to this wait operation
256        wait_ctx( this_thread, user_info );
257
258        // Append the current wait operation to the ones already queued on the condition
259        // We don't need locks for that since conditions must always be waited on inside monitor mutual exclusion
260        append( &this->blocked, &waiter );
261
262        // Lock all monitors (aggregates the lock them as well)
263        lock_all( monitors, locks, count );
264
265        // DON'T unlock, ask the kernel to do it
266
267        // Save monitor state
268        save_recursion( monitors, recursions, count );
269
270        // Find the next thread(s) to run
271        unsigned short thread_count = 0;
272        thread_desc * threads[ count ];
273        for(int i = 0; i < count; i++) {
274                threads[i] = 0;
275        }
276
277        // Remove any duplicate threads
278        for( int i = 0; i < count; i++) {
279                thread_desc * new_owner = next_thread( monitors[i] );
280                thread_count = insert_unique( threads, thread_count, new_owner );
281        }
282
283        // Everything is ready to go to sleep
284        BlockInternal( locks, count, threads, thread_count );
285
286
287        // WE WOKE UP
288
289
290        // We are back, restore the owners and recursions
291        lock_all( locks, count );
292        restore_recursion( monitors, recursions, count );
293        unlock_all( locks, count );
294}
295
296bool signal( condition * this ) {
297        if( is_empty( this ) ) { return false; }
298
299        //Check that everything is as expected
300        verify( this->monitors );
301        verify( this->monitor_count != 0 );
302
303        //Some more checking in debug
304        LIB_DEBUG_DO(
305                thread_desc * this_thrd = this_thread;
306                if ( this->monitor_count != this_thrd->current_monitor_count ) {
307                        abortf( "Signal on condition %p made with different number of monitor(s), expected %i got %i", this, this->monitor_count, this_thrd->current_monitor_count );
308                }
309
310                for(int i = 0; i < this->monitor_count; i++) {
311                        if ( this->monitors[i] != this_thrd->current_monitors[i] ) {
312                                abortf( "Signal on condition %p made with different monitor, expected %p got %i", this, this->monitors[i], this_thrd->current_monitors[i] );
313                        }
314                }
315        );
316
317        unsigned short count = this->monitor_count;
318
319        // Lock all monitors
320        lock_all( this->monitors, NULL, count );
321
322        //Pop the head of the waiting queue
323        __condition_node_t * node = pop_head( &this->blocked );
324
325        //Add the thread to the proper AS stack
326        for(int i = 0; i < count; i++) {
327                __condition_criterion_t * crit = &node->criteria[i];
328                assert( !crit->ready );
329                push( &crit->target->signal_stack, crit );
330        }
331
332        //Release
333        unlock_all( this->monitors, count );
334
335        return true;
336}
337
338bool signal_block( condition * this ) {
339        if( !this->blocked.head ) { return false; }
340
341        //Check that everything is as expected
342        verifyf( this->monitors != NULL, "Waiting with no monitors (%p)", this->monitors );
343        verifyf( this->monitor_count != 0, "Waiting with 0 monitors (%i)", this->monitor_count );
344
345        // Create storage for monitor context
346        monitor_ctx( this->monitors, this->monitor_count );
347
348        // Lock all monitors (aggregates the locks them as well)
349        lock_all( monitors, locks, count );
350
351        // Create the node specific to this wait operation
352        wait_ctx_primed( this_thread, 0 )
353
354        //save contexts
355        save_recursion( monitors, recursions, count );
356
357        //Find the thread to run
358        thread_desc * signallee = pop_head( &this->blocked )->waiting_thread;
359        for(int i = 0; i < count; i++) {
360                set_owner( monitors[i], signallee );
361        }
362
363        //Everything is ready to go to sleep
364        BlockInternal( locks, count, &signallee, 1 );
365
366
367        // WE WOKE UP
368
369
370        //We are back, restore the owners and recursions
371        lock_all( locks, count );
372        restore_recursion( monitors, recursions, count );
373        unlock_all( locks, count );
374
375        return true;
376}
377
378// Access the user_info of the thread waiting at the front of the queue
379uintptr_t front( condition * this ) {
380        verifyf( !is_empty(this),
381                "Attempt to access user data on an empty condition.\n"
382                "Possible cause is not checking if the condition is empty before reading stored data."
383        );
384        return this->blocked.head->user_info;
385}
386
387//-----------------------------------------------------------------------------
388// Internal scheduling
389int __accept_internal( unsigned short acc_count, __acceptable_t * acceptables ) {
390        thread_desc * thrd = this_thread;
391
392        // Create storage for monitor context
393        monitor_ctx( acceptables->monitors, acceptables->count );
394
395        // Lock all monitors (aggregates the lock them as well)
396        lock_all( monitors, locks, count );
397
398        // Create the node specific to this wait operation
399        wait_ctx_primed( thrd, 0 );
400
401        // Check if the entry queue
402        thread_desc * next = search_entry_queue( acceptables, acc_count, monitors, count );
403
404        if( !next ) {
405                // Update acceptables on the current monitors
406                for(int i = 0; i < count; i++) {
407                        monitors[i]->acceptables = acceptables;
408                        monitors[i]->acceptable_count = acc_count;
409                }
410        }
411
412        save_recursion( monitors, recursions, count );
413
414        // Everything is ready to go to sleep
415        BlockInternal( locks, count, &next, next ? 1 : 0 );
416
417
418        //WE WOKE UP
419
420
421        //We are back, restore the owners and recursions
422        lock_all( locks, count );
423        restore_recursion( monitors, recursions, count );
424        int acc_idx = monitors[0]->accepted_index;
425        unlock_all( locks, count );
426
427        return acc_idx;
428}
429
430//-----------------------------------------------------------------------------
431// Utilities
432
433static inline void set_owner( monitor_desc * this, thread_desc * owner ) {
434        //Pass the monitor appropriately
435        this->owner = owner;
436
437        //We are passing the monitor to someone else, which means recursion level is not 0
438        this->recursion = owner ? 1 : 0;
439}
440
441static inline thread_desc * next_thread( monitor_desc * this ) {
442        //Check the signaller stack
443        __condition_criterion_t * urgent = pop( &this->signal_stack );
444        if( urgent ) {
445                //The signaller stack is not empty,
446                //regardless of if we are ready to baton pass,
447                //we need to set the monitor as in use
448                set_owner( this,  urgent->owner->waiting_thread );
449
450                return check_condition( urgent );
451        }
452
453        // No signaller thread
454        // Get the next thread in the entry_queue
455        thread_desc * new_owner = pop_head( &this->entry_queue );
456        set_owner( this, new_owner );
457
458        return new_owner;
459}
460
461static inline int is_accepted( thread_desc * owner, monitor_desc * this, monitor_desc ** group, int group_cnt, void (*func)() ) {
462        __acceptable_t* accs = this->acceptables; // Optim
463        int acc_cnt = this->acceptable_count;
464
465        // Check if there are any acceptable functions
466        if( !accs ) return -1;
467
468        // If this isn't the first monitor to test this, there is no reason to repeat the test.
469        if( this != group[0] ) return group[0]->accepted_index;
470
471        // For all acceptable functions check if this is the current function.
472        OUT_LOOP:
473        for( int i = 0; i < acc_cnt; i++ ) {
474                __acceptable_t * acc = &accs[i];
475
476                // if function matches, check the monitors
477                if( acc->func == func ) {
478
479                        // If the group count is different then it can't be a match
480                        if( acc->count != group_cnt ) return -1;
481
482                        // Check that all the monitors match
483                        for( int j = 0; j < group_cnt; j++ ) {
484                                // If not a match, check next function
485                                if( acc->monitors[j] != group[j] ) continue OUT_LOOP;
486                        }
487
488                        // It's a complete match, accept the call
489                        return i;
490                }
491        }
492
493        // No function matched
494        return -1;
495}
496
497static inline void init( int count, monitor_desc ** monitors, __condition_node_t * waiter, __condition_criterion_t * criteria ) {
498        for(int i = 0; i < count; i++) {
499                (&criteria[i]){ monitors[i], waiter };
500        }
501
502        waiter->criteria = criteria;
503}
504
505static inline void init_push( int count, monitor_desc ** monitors, __condition_node_t * waiter, __condition_criterion_t * criteria ) {
506        for(int i = 0; i < count; i++) {
507                (&criteria[i]){ monitors[i], waiter };
508                push( &criteria[i].target->signal_stack, &criteria[i] );
509        }
510
511        waiter->criteria = criteria;
512}
513
514static inline void lock_all( spinlock ** locks, unsigned short count ) {
515        for( int i = 0; i < count; i++ ) {
516                lock_yield( locks[i] DEBUG_CTX2 );
517        }
518}
519
520static inline void lock_all( monitor_desc ** source, spinlock ** /*out*/ locks, unsigned short count ) {
521        for( int i = 0; i < count; i++ ) {
522                spinlock * l = &source[i]->lock;
523                lock_yield( l DEBUG_CTX2 );
524                if(locks) locks[i] = l;
525        }
526}
527
528static inline void unlock_all( spinlock ** locks, unsigned short count ) {
529        for( int i = 0; i < count; i++ ) {
530                unlock( locks[i] );
531        }
532}
533
534static inline void unlock_all( monitor_desc ** locks, unsigned short count ) {
535        for( int i = 0; i < count; i++ ) {
536                unlock( &locks[i]->lock );
537        }
538}
539
540
541static inline void save_recursion   ( monitor_desc ** ctx, unsigned int * /*out*/ recursions, unsigned short count ) {
542        for( int i = 0; i < count; i++ ) {
543                recursions[i] = ctx[i]->recursion;
544        }
545}
546
547static inline void restore_recursion( monitor_desc ** ctx, unsigned int * /*in */ recursions, unsigned short count ) {
548        for( int i = 0; i < count; i++ ) {
549                ctx[i]->recursion = recursions[i];
550        }
551}
552
553// Function has 2 different behavior
554// 1 - Marks a monitors as being ready to run
555// 2 - Checks if all the monitors are ready to run
556//     if so return the thread to run
557static inline thread_desc * check_condition( __condition_criterion_t * target ) {
558        __condition_node_t * node = target->owner;
559        unsigned short count = node->count;
560        __condition_criterion_t * criteria = node->criteria;
561
562        bool ready2run = true;
563
564        for(    int i = 0; i < count; i++ ) {
565
566                // LIB_DEBUG_PRINT_SAFE( "Checking %p for %p\n", &criteria[i], target );
567                if( &criteria[i] == target ) {
568                        criteria[i].ready = true;
569                        // LIB_DEBUG_PRINT_SAFE( "True\n" );
570                }
571
572                ready2run = criteria[i].ready && ready2run;
573        }
574
575        // LIB_DEBUG_PRINT_SAFE( "Runing %i\n", ready2run );
576        return ready2run ? node->waiting_thread : NULL;
577}
578
579static inline void brand_condition( condition * this ) {
580        thread_desc * thrd = this_thread;
581        if( !this->monitors ) {
582                // LIB_DEBUG_PRINT_SAFE("Branding\n");
583                assertf( thrd->current_monitors != NULL, "No current monitor to brand condition %p", thrd->current_monitors );
584                this->monitor_count = thrd->current_monitor_count;
585
586                this->monitors = malloc( this->monitor_count * sizeof( *this->monitors ) );
587                for( int i = 0; i < this->monitor_count; i++ ) {
588                        this->monitors[i] = thrd->current_monitors[i];
589                }
590        }
591}
592
593static inline unsigned short insert_unique( thread_desc ** thrds, unsigned short end, thread_desc * val ) {
594        if( !val ) return end;
595
596        for(int i = 0; i <= end; i++) {
597                if( thrds[i] == val ) return end;
598        }
599
600        thrds[end] = val;
601        return end + 1;
602}
603
604static inline thread_desc * search_entry_queue( __acceptable_t * acceptables, int acc_count, monitor_desc ** monitors, int count ) {
605        return NULL;
606}
607
608void ?{}( __condition_blocked_queue_t * this ) {
609        this->head = NULL;
610        this->tail = &this->head;
611}
612
613void append( __condition_blocked_queue_t * this, __condition_node_t * c ) {
614        verify(this->tail != NULL);
615        *this->tail = c;
616        this->tail = &c->next;
617}
618
619__condition_node_t * pop_head( __condition_blocked_queue_t * this ) {
620        __condition_node_t * head = this->head;
621        if( head ) {
622                this->head = head->next;
623                if( !head->next ) {
624                        this->tail = &this->head;
625                }
626                head->next = NULL;
627        }
628        return head;
629}
630
631// Local Variables: //
632// mode: c //
633// tab-width: 4 //
634// End: //
Note: See TracBrowser for help on using the repository browser.