source: libcfa/src/concurrency/kernel.hfa @ d3ab183

Branches: ADT, arm-eh, ast-experimental, enum, forall-pointer-decay, jacob/cs343-translation, new-ast, new-ast-unique-expr, pthread-emulation, qualifiedEnum
Last change on this file since d3ab183 was f6660520, checked in by Thierry Delisle <tdelisle@…>, 4 years ago

Added new implementation of io_uring that uses user-thread

  • Property mode set to 100644
File size: 6.6 KB
RevLine 
[8118303]1//
2// Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo
3//
4// The contents of this file are covered under the licence agreement in the
5// file "LICENCE" distributed with Cforall.
6//
[75a17f1]7// kernel --
[8118303]8//
9// Author           : Thierry Delisle
[75f3522]10// Created On       : Tue Jan 17 12:27:26 2017
[6b0b624]11// Last Modified By : Peter A. Buhr
[e3fea42]12// Last Modified On : Tue Feb  4 12:29:26 2020
13// Update Count     : 22
[8118303]14//
15
[6b0b624]16#pragma once
[8118303]17
[c84e80a]18#include <stdbool.h>
[92976d9]19#include <stdint.h>
[8118303]20
[bd98b58]21#include "invoke.h"
[73abe95]22#include "time_t.hfa"
[d76bd79]23#include "coroutine.hfa"
[bd98b58]24
[8def349]25extern "C" {
26#include <pthread.h>
[6b4cdd3]27#include <semaphore.h>
[8def349]28}
29
[db6f06a]30//-----------------------------------------------------------------------------
31// Locks
// Semaphore built from a spinlock, a signed counter and a queue of waiting $thread.
// NOTE(review): the lock presumably guards count and waiting — confirm in the implementation.
[bdeba0b]32struct semaphore {
[ea7d2b0]33        __spinlock_t lock;
[bdeba0b]34        int count;
[ac2b598]35        __queue_t($thread) waiting;
[9c31349]36};
37
// Semaphore interface (declarations only; no definitions are visible in this header):
// constructor (count defaults to 1), destructor, P, and two V overloads.
// NOTE(review): the meaning of the bool returned by V is not stated here —
// presumably it reports whether a waiting thread was released; confirm in the implementation.
[242a902]38void  ?{}(semaphore & this, int count = 1);
39void ^?{}(semaphore & this);
[4cedd9f]40void   P (semaphore & this);
[f0ce5f4]41bool   V (semaphore & this);
[d384787]42bool   V (semaphore & this, unsigned count);
[9c31349]43
[db6f06a]44
[bd98b58]45//-----------------------------------------------------------------------------
[de94a60]46// Processor
// Cluster that the processor convenience constructors in this header fall back to
// when the caller does not supply one. Only declared here; defined elsewhere.
[de6319f]47extern struct cluster * mainCluster;
[bd98b58]48
[e60e0dc]49// Processor
// Coroutine type embedded in struct processor as its `runner` field.
// It carries a pointer to a processor (presumably the one embedding it — confirm).
[094476d]50coroutine processorCtx_t {
51        struct processor * proc;
52};
53
[e60e0dc]54// Wrapper around kernel threads: groups the runner coroutine, the owning cluster,
// the pthread handle and stack, preemption/idle/termination state, and list links.
[c84e80a]55struct processor {
[e60e0dc]56        // Main state
[025278e]57        // Coroutine context that keeps the state of the processor
[094476d]58        struct processorCtx_t runner;
[025278e]59
60        // Cluster from which to get threads
[de94a60]61        struct cluster * cltr;
[025278e]62
[de6319f]63        // Name of the processor
64        const char * name;
65
[025278e]66        // Handle to the underlying pthread
67        pthread_t kernel_thread;
[2ac095d]68
[e60e0dc]69        // RunThread data
[025278e]70        // Action to do after a thread is run
        // NOTE(review): the field is a $thread pointer named `destroyer`, so the
        // "action" wording above may be stale — confirm against the scheduler code.
[ac2b598]71        $thread * destroyer;
[c81ebf9]72
[e60e0dc]73        // Preemption data
[025278e]74        // Node which is added in the discrete event simulation
75        struct alarm_node_t * preemption_alarm;
76
77        // If true, a preemption was triggered in an unsafe region; the processor must preempt as soon as possible
78        bool pending_preemption;
[c81ebf9]79
[92e7631]80        // Idle lock (kernel semaphore)
81        __bin_sem_t idle;
[85b1deb]82
83        // Termination
84        // Set to true to notify the processor that it should terminate
85        volatile bool do_terminate;
86
[92e7631]87        // Termination synchronisation (user semaphore)
[85b1deb]88        semaphore terminated;
[de94a60]89
[27f5f71]90        // pthread stack
91        void * stack;
92
[de94a60]93        // Linked-list fields (exposed as a [next, prev] tuple by __get)
[ea8b2f7]94        struct __dbg_node_proc {
[de94a60]95                struct processor * next;
96                struct processor * prev;
97        } node;
[14a61b5]98
[e60e0dc]99#ifdef __CFA_DEBUG__
[025278e]100        // Last function to enable preemption on this processor (debug builds only)
[cdbfab0]101        const char * last_enable;
[e60e0dc]102#endif
[c84e80a]103};
104
// Primary processor constructor and destructor (declarations only; no definitions
// are visible in this header).
[e3fea42]105void  ?{}(processor & this, const char name[], struct cluster & cltr);
[242a902]106void ^?{}(processor & this);
[c84e80a]107
// Convenience constructors: each forwards to the primary constructor, substituting
// "Anonymous Processor" for a missing name and *mainCluster for a missing cluster.
[de6319f]108static inline void  ?{}(processor & this)                    { this{ "Anonymous Processor", *mainCluster}; }
[de94a60]109static inline void  ?{}(processor & this, struct cluster & cltr)    { this{ "Anonymous Processor", cltr}; }
[e3fea42]110static inline void  ?{}(processor & this, const char name[]) { this{name, *mainCluster }; }
[de6319f]111
// Returns references to this processor's node.next and node.prev link pointers as a tuple.
[c7a900a]112static inline [processor *&, processor *& ] __get( processor & this ) __attribute__((const)) { return this.node.[next, prev]; }
[de94a60]113
[92976d9]114//-----------------------------------------------------------------------------
115// I/O
116#if defined(HAVE_LINUX_IO_URING_H)
// Submission-queue side of an io_uring instance: pointers into the mapped ring
// (ring_ptr / ring_sz), a separate buffer of sqes, and local bookkeeping
// (alloc, ready, lock) that the comments below say is not seen by the kernel.
117struct io_uring_sq {
[2d8f7b0]118        // Head and tail of the ring (associated with array)
119        volatile uint32_t * head;
120        volatile uint32_t * tail;
121
122        // The actual kernel ring which uses head/tail
123        // indexes into the sqes array
124        uint32_t * array;
125
126        // number of entries and mask to go with it
127        const uint32_t * num;
128        const uint32_t * mask;
129
130        // Submission flags.
        // NOTE(review): in the Linux io_uring ABI the SQ ring flags word is where the
        // kernel publishes IORING_SQ_NEED_WAKEUP — confirm this pointer maps that word.
[92976d9]131        uint32_t * flags;
[2d8f7b0]132
133        // number of sqes not submitted.
        // NOTE(review): in the Linux io_uring ABI the SQ ring's dropped counter counts
        // invalid entries discarded by the kernel — confirm this pointer maps that counter.
[92976d9]134        uint32_t * dropped;
135
[2d8f7b0]136        // Like head/tail but not seen by the kernel
137        volatile uint32_t alloc;
[f6660520]138        volatile uint32_t ready;
[92976d9]139
[2d8f7b0]140        __spinlock_t lock;
141
142        // A buffer of sqes (not the actual ring)
143        struct io_uring_sqe * sqes;
144
145        // The location and size of the mmapped area
[92976d9]146        void * ring_ptr;
[2d8f7b0]147        size_t ring_sz;
[d384787]148
149        // Statistics (compiled out when __CFA_NO_STATISTICS__ is defined)
[038be32]150        #if !defined(__CFA_NO_STATISTICS__)
[d384787]151                struct {
                        // NOTE(review): val/cnt look like a running total and a sample
                        // count used to compute an average — confirm where they are updated.
[038be32]152                        struct {
153                                unsigned long long int val;
154                                unsigned long long int cnt;
155                        } submit_avg;
156                } stats;
157        #endif
[92976d9]158};
159
// Completion-queue side of an io_uring instance: pointers into the mapped ring
// (ring_ptr / ring_sz) plus optional statistics.
160struct io_uring_cq {
[2d8f7b0]161        // Head and tail of the ring
[92976d9]162        volatile uint32_t * head;
163        volatile uint32_t * tail;
[2d8f7b0]164
165        // number of entries and mask to go with it
        // (declared mask-then-num here, the reverse of io_uring_sq)
166        const uint32_t * mask;
167        const uint32_t * num;
168
169        // Overflow counter.
        // NOTE(review): in the Linux io_uring ABI the CQ ring's overflow counter counts
        // completions lost because the ring was full; the earlier wording
        // "cqes not submitted" looks inaccurate — confirm.
[92976d9]170        uint32_t * overflow;
[2d8f7b0]171
172        // the kernel ring
[92976d9]173        struct io_uring_cqe * cqes;
174
[2d8f7b0]175        // The location and size of the mmapped area
[92976d9]176        void * ring_ptr;
[2d8f7b0]177        size_t ring_sz;
[d384787]178
179        // Statistics (compiled out when __CFA_NO_STATISTICS__ is defined)
[038be32]180        #if !defined(__CFA_NO_STATISTICS__)
[d384787]181                struct {
                        // NOTE(review): val/cnt look like a running total and a sample
                        // count used to compute an average — confirm where they are updated.
[038be32]182                        struct {
183                                unsigned long long int val;
184                                unsigned long long int cnt;
185                        } completed_avg;
186                } stats;
187        #endif
[92976d9]188};
189
// Only compiled when __CFA_IO_POLLING_USER__ is defined: pairs a $thread with a
// pointer to an io_ring. Embedded in io_ring.poller as the `fast` field.
// NOTE(review): presumably the user-level thread that polls the ring — confirm.
[f6660520]190#if defined(__CFA_IO_POLLING_USER__)
191        struct __io_poller_fast {
192                struct io_ring * ring;
193                $thread thrd;
194        };
195#endif
196
// I/O state embedded in struct cluster as the `io` field: the submission and
// completion queues, a flags word, a file descriptor, a semaphore, a done flag,
// and the poller state.
[92976d9]197struct io_ring {
198        struct io_uring_sq submit_q;
199        struct io_uring_cq completion_q;
200        uint32_t flags;
        // NOTE(review): presumably the io_uring file descriptor — confirm at the setup site.
201        int fd;
[2d8f7b0]202        semaphore submit;
        // NOTE(review): presumably set to tell the poller(s) to stop — confirm.
[f6660520]203        volatile bool done;
204        struct {
                // Poller backed by a pthread (handle and stack pointer)
205                struct {
206                        void * stack;
207                        pthread_t kthrd;
208                } slow;
                // Additional $thread-based poller and a binary semaphore, only present
                // when __CFA_IO_POLLING_USER__ is defined
209                #if defined(__CFA_IO_POLLING_USER__)
210                        __io_poller_fast fast;
211                        __bin_sem_t sem;
212                #endif
213        } poller;
[92976d9]214};
215#endif
216
[de94a60]217//-----------------------------------------------------------------------------
218// Cluster
// A cluster groups a ready queue of threads, lists of processors and threads,
// a preemption rate, and optional I/O and statistics state.
219struct cluster {
220        // Ready queue lock
221        __spinlock_t ready_queue_lock;
222
223        // Ready queue for threads
[ac2b598]224        __queue_t($thread) ready_queue;
[de94a60]225
226        // Name of the cluster
227        const char * name;
228
229        // Preemption rate on this cluster
230        Duration preemption_rate;
231
232        // Lists of processors (all and idle) and the processor count
        // NOTE(review): idle_lock presumably guards these lists — confirm.
[92e7631]233        __spinlock_t idle_lock;
[de94a60]234        __dllist_t(struct processor) procs;
235        __dllist_t(struct processor) idles;
[d4e68a6]236        unsigned int nprocessors;
[de94a60]237
[d4e68a6]238        // List of threads and the thread count
[a1a17a7]239        __spinlock_t thread_list_lock;
[ac2b598]240        __dllist_t(struct $thread) threads;
[d4e68a6]241        unsigned int nthreads;
[a1a17a7]242
[de94a60]243        // Linked-list fields (exposed as a [next, prev] tuple by __get)
[ea8b2f7]244        struct __dbg_node_cltr {
[de94a60]245                cluster * next;
246                cluster * prev;
247        } node;
[92976d9]248
        // io_uring state, only present when HAVE_LINUX_IO_URING_H is defined
249        #if defined(HAVE_LINUX_IO_URING_H)
250                struct io_ring io;
251        #endif
[038be32]252
        // Flag set by print_stats_at_exit; absent when __CFA_NO_STATISTICS__ is defined
253        #if !defined(__CFA_NO_STATISTICS__)
254                bool print_stats;
255        #endif
[de94a60]256};
// Supplies the preemption rate used by the convenience constructors below when the
// caller gives none. Only declared here; defined elsewhere.
257extern Duration default_preemption();
258
// Primary cluster constructor and destructor (declarations only; no definitions
// are visible in this header).
[e3fea42]259void ?{} (cluster & this, const char name[], Duration preemption_rate);
[de94a60]260void ^?{}(cluster & this);
261
// Convenience constructors: each forwards to the primary constructor, substituting
// "Anonymous Cluster" for a missing name and default_preemption() for a missing rate.
262static inline void ?{} (cluster & this)                           { this{"Anonymous Cluster", default_preemption()}; }
263static inline void ?{} (cluster & this, Duration preemption_rate) { this{"Anonymous Cluster", preemption_rate}; }
[e3fea42]264static inline void ?{} (cluster & this, const char name[])        { this{name, default_preemption()}; }
[de94a60]265
// Returns references to this cluster's node.next and node.prev link pointers as a tuple.
[c7a900a]266static inline [cluster *&, cluster *& ] __get( cluster & this ) __attribute__((const)) { return this.node.[next, prev]; }
[de94a60]267
// Accessors built on TL_GET( this_processor ): the first returns that processor
// pointer, the second returns its cltr field. The pointer is dereferenced without a
// null check in active_cluster. The original author marks active_processor UNSAFE.
// NOTE(review): the reason is not stated here; presumably the calling thread can be
// preempted or migrated after the read — confirm.
[0f2c555]268static inline struct processor * active_processor() { return TL_GET( this_processor ); } // UNSAFE
269static inline struct cluster   * active_cluster  () { return TL_GET( this_processor )->cltr; }
[d4e68a6]270
// Only available when statistics are compiled in: sets the cluster's print_stats flag.
// NOTE(review): the name implies the statistics are printed when the cluster is
// destroyed or the program exits; the code that reads the flag is not in this header — confirm.
[038be32]271#if !defined(__CFA_NO_STATISTICS__)
272        static inline void print_stats_at_exit( cluster & this ) {
273                this.print_stats = true;
274        }
275#endif
276
[8118303]277// Local Variables: //
[6b0b624]278// mode: c //
279// tab-width: 4 //
[8118303]280// End: //
Note: See TracBrowser for help on using the repository browser.