Diff [7d0a3bad9fc8d744d49f01cae7de8f1f09578156:358cba0900eb921a7db399e9c3784420b68b4090] for / – Cforall

Jenkinsfile

-              r7d0a3ba
+              r358cba0
                 def install_dir = pwd tmp: true
+                //Output compiler version to help with debug
+                echo """C++ Compiler :"""
+                sh "which ${compiler.cpp_cc} && ${compiler.cpp_cc} --version"
+                echo """C   Compiler :"""
+                sh "which ${compiler.cfa_cc} && ${compiler.cfa_cc} --version"
                 //Configure the compilation (Output is not relevant)
+                //Use the current directory as the installation target so nothing
+                //escapes the sandbox
+                //Use the current directory as the installation target so nothing escapes the sandbox
                 //Also specify the compiler by hand
                 sh "./configure CXX=${compiler.cpp_cc} ${architecture} --with-backend-compiler=${compiler.cfa_cc} --prefix=${install_dir} --enable-silent-rules --quiet"

doc/bibliography/pl.bib

-              r7d0a3ba
+              r358cba0
     howpublished= {\href{http://www.boost.org/doc/libs/1_61_0/libs/coroutine/doc/html/index.html}
                   {{http://www.boost.org/\-doc/\-libs/1\_61\_0/\-libs/\-coroutine/\-doc/\-html/\-index.html}}},
     note        = {Accessed: 2016-09},
+    optnote     = {Accessed: 2016-09},
+}
 …
     keywords    = {ANSI C 89},
     contributer = {gjditchfield@plg},
+    title       = {American National Standard for Information Systems -- Programming Language -- {C}},
+    author      = {C90},
+    title       = {Programming Languages -- {C}},
     organization= {American National Standards Institute},
+    address     = {1430 Broadway, New York, New York  10018},
+    month       = dec,
+    year        = 1989,
+    note        = {X3.159-1989}
+    address     = {New York, NY, U.S.A.},
+    year        = 1990,
+    note        = {ANSI/ISO 9899-1990}
+}
 …
     title       = {\textsf{C}{$\mathbf{\forall}$} Features},
     howpublished= {\url{https://plg.uwaterloo.ca/~cforall/features}},
     note        = {Accessed: 2018-01-01},
+    optnote     = {Accessed: 2018-01-01},
+}
 …
     address     = {Waterloo, Ontario, Canada, N2L 3G1},
     note        = {\href{http://plg.uwaterloo.ca/theses/EstevesThesis.pdf}{http://\-plg.uwaterloo.ca/\-theses/\-EstevesThesis.pdf}},
+}
+@misc{CFAStackEvaluation,
+    author      = {Aaron Moss},
+    title       = {\textsf{C}$\mathbf{\forall}$ Stack Evaluation Programs},
+    year        = 2018,
+    howpublished= {\href{https://plg.uwaterloo.ca/~cforall/evaluation.zip}{https://plg.uwaterloo.ca/\-\-$\sim$cforall/\-StackEvaluation.zip}},
+    optnote     = {[Accessed May 2018]},
+}
 …
+}
+@misc{Taylor10,
+    keywords    = {const, poisoning},
+    contributer = {pabuhr@plg},
+    author      = {Ian Lance Taylor},
+    title       = {const},
+    month       = oct,
+    year        = 2010,
+    howpublished= {\href{https://www.airs.com/blog/archives/428}
+                  {https://www.airs.com/\-blog/\-archives/\-428}},
+    optnote     = {Accessed: 2018-05},
+}
 @phdthesis{Ditchfield92,
     keywords    = {C, parametric polymorphism, overloading},
 …
 @misc{GCCExtensions,
     contributer = {a3moss@uwaterloo.ca},
     key         = {{GNU}},
+    key         = {C Extensions},
     author      = {{C Extensions}},
     title       = {Extensions to the {C} Language Family},
     year        = 2014,
     howpublished= {\href{https://gcc.gnu.org/onlinedocs/gcc-4.7.2/gcc/C-Extensions.html}{https://\-gcc.gnu.org/\-onlinedocs/\-gcc-4.7.2/\-gcc/\-C\-Extensions.html}},
     note        = {Accessed: 2017-04-02},
+    optnote     = {Accessed: 2017-04-02},
+}
 …
     month       = jul, year = 1987,
     volume      = 4, number = 4, pages = {9-16}
+}
+@misc{Sutter05c,
+    contributer = {pabuhr@plg},
+    title       = {The Free Lunch Is Over: A Fundamental Turn Toward Concurrency in Software},
+    author      = {Herb Sutter},
+    howpublished= {\url{http://www.gotw.ca/publications/concurrency-ddj.htm}},
+    year        = {2005},
+    note        = {originally Dr. Dobb's Journal 30(3)},
+}
 …
     year        = 2014,
     howpublished= {https://developer.gnome.org/gobject/stable/},
     note        = {Accessed: 2017-04},
+    optnote     = {Accessed: 2017-04},
+}
 …
 % H
+@manual{Haskell10,
+    keywords    = {Haskell},
+    contributer = {pabuhr@plg},
+    author      = {Haskell},
+    title       = {Haskell 2010 Language Report},
+    edition     = {{S}imon {M}arlow},
+    year        = 2010,
+    note        = {\href{https://haskell.org/definition/haskell2010.pdf}{https://haskell.org/\-definition/\-haskell2010.pdf}},
+}
 @article{Michael04a,
 …
     keywords    = {concurrency, critical section},
     contributer = {pabuhr@plg},
     author      = {Dominic Duggan and Gordon V. Cormack and John Ophel},
+    author      = {Dominic Duggan and G. V. Cormack and John Ophel},
     title       = {Kinded Type Inference for Parametric Overloading},
     journal     = acta,
 …
     year        = 2015,
     howpublished= {\href{https://developer.apple.com/library/content/documentation/General/Conceptual/DevPedia-CocoaCore/ObjectiveC.html}{https://developer.apple.com/\-library/\-content/\-documentation/\-General/\-Conceptual/\-DevPedia-\-CocoaCore/\-ObjectiveC.html}},
     note        = {Accessed: 2018-03}
+    optnote     = {Accessed: 2018-03}
+}
 …
     year        = 2015,
     howpublished= {\href{https://developer.apple.com/library/content/documentation/Xcode/Conceptual/RN-Xcode-Archive/Chapters/xc7_release_notes.html}{https://developer.apple.com/\-library/\-content/\-documentation/\-Xcode/\-Conceptual/\-RN-Xcode-Archive/\-Chapters/\-xc7\_release\_notes.html}},
     note        = {Accessed: 2017-04}
+    optnote     = {Accessed: 2017-04}
+}
 …
     keywords    = {Cyclone, existential types, polymorphism, type variables},
     contributer = {a3moss@plg},
     author      = {Dan Grossman},
+    author      = {D. Grossman},
     title       = {Quantified Types in an Imperative Language},
     journal     = toplas,
 …
     title       = {{TIOBE} Index},
     howpublished= {\href{http://www.tiobe.com/tiobe_index}{http://\-www.tiobe.com/\-tiobe\_index}},
     note        = {Accessed: 2018-09},
+    optnote     = {Accessed: 2018-09},
+}
 …
     year        = 2017,
     howpublished= {\url{https://wiki.gnome.org/Projects/Vala/Manual}},
     note        = {Accessed: 2017-04}
+    optnote     = {Accessed: 2017-04}
+}

doc/papers/AMA/AMA-stix/Documents/README.txt

-              r7d0a3ba
+              r358cba0
 %   NJDnatbib.sty --> NJD natbib reference package.
 %   Stix-Fonts (folder) -->   Stix font files
+%   MiKTeX 2.9 (Freeware software) is required to install STIX/LATO fonts
+%   Download MiKTeX installer & instructions from the below URLs
+        https://miktex.org/download
+        Instructions to install the basic MiKTeX installer
+        https://miktex.org/howto/install-miktex
+%   Execute(double click) --> Windows-Stix-fontinstaller.exe from Stix-Fonts folder (This EXE file will install fonts to local drive) (please rename Windows-Stix-fontinstaller.e_xe to Windows-Stix-fontinstaller.exe)
+%   Execute(double click) --> Windows-Stix-fontinstaller.exe from Stix-Fonts folder (This EXE file will install fonts to local drive)
 %   Still shows font error, please do the following
 %   Start-->run--> type "mo_admin.exe" and press enter

doc/papers/AMA/AMA-stix/ama/WileyNJD-AMA.bst

-              r7d0a3ba
+              r358cba0
       editor empty$
       { booktitle emphasize * }
       { " " * format.editors * " " * booktitle emphasize * ", " * }
+    { " " * format.editors * " " * booktitle emphasize * ", " * }
       if$
+    }
 …
     { format.journal emphasize "journal" output.check
       format.date add.semicolon "year" output.check
+      blank.sep
       format.volume output
       format.number output
 …
       new.block
       format.pages output
+      new.block
       organization output
+      new.block
       publisher output
       inproformat.date "year" output.check
 …
     { new.block organization new.block address new.block.checkb
       organization output
+      new.block
       address output
+    }
 …
   new.block
   school "school" output.check
+  new.block
   address output
   format.date "year" output.check
 …
   "PhD thesis" format.thesis.type output.nonnull
   school "school" output.check
+  new.block
   address output
   format.date "year" output.check

doc/papers/AMA/AMA-stix/ama/WileyNJD-v2.cls

-              r7d0a3ba
+              r358cba0
 \if@STIXLargeOneCol%
 \RequirePackage[not1,notextcomp,lcgreekalpha]{stix}%
-%\usepackage[scaled]{helvet}
-%\renewcommand\familydefault{\sfdefault}
 \usepackage[T1]{fontenc}
 \BXhsize=170mm%
 …
 %\RequirePackage[not1,notextcomp,lcgreekalpha]{stix}%
 \captionsetup[figure]{labelformat=simple, labelsep=space, skip=10pt, labelfont=bf}
 \captionsetup[table]{labelformat=simple, labelsep=space, skip=10pt, labelfont=bf}
 \renewcommand{\thefigure}{\arabic{figure}}
 \renewcommand{\thetable}{\arabic{table}}
+\captionsetup[figure]{labelformat=simple, labelsep=none, skip=10pt, labelfont=bf}
+\captionsetup[table]{labelformat=simple, labelsep=none, skip=10pt, labelfont=bf}
+\renewcommand{\thefigure}{\arabic{figure}\enspace }
+\renewcommand{\thetable}{\arabic{table}\enspace }
 \renewcommand\figurename{\textbf{FIGURE}}%%
 …
 \gdef\@stix@font@defn{%
+  %
 %  \def\infoboxfont{\fontfamily{tim}\fontsize{8}{8}\selectfont}%
+  \def\infoboxfont{\fontfamily{tim}\fontsize{8}{8}\selectfont}%
+  %
 %  \def\watermarkfont{\reset@font\fontfamily{\ffdefault}\fontsize{45}{45}\bfseries\selectfont}
+  \def\watermarkfont{\reset@font\fontfamily{\ffdefault}\fontsize{45}{45}\bfseries\selectfont}
+  %
   \def\pagenumfont{\rmfamily\fontsize{7}{9}\bfseries\selectfont}%
 …
   \def\arttypefont{\rmfamily\fontsize{9}{9}\fontseries{b}\selectfont}%
   \def\SParttypefont{\rmfamily\fontsize{9}{12}\fontseries{b}\selectfont}%
   \def\titlefont{\rmfamily\fontsize{18}{23}\bfseries\selectfont\leftskip\z@\rightskip\z@ plus1fil}%
+  \def\titlefont{\rmfamily\fontsize{18}{23}\bfseries\selectfont\leftskip\z@\rightskip\z@ plus1fil\let\mathbcal\titmathbcal}%
   \def\subtitlefont{\rmfamily\fontsize{16}{21}\bfseries\selectfont\leftskip\z@\rightskip\z@ plus1fil}%
   \def\Authorfont{\rmfamily\fontsize{12}{18}\selectfont\leftskip\z@\rightskip\z@ plus1fil}%
 …
 \gdef\@lato@font@defn{%
+  %
 %  \def\infoboxfont{\fontfamily{tim}\fontsize{8}{8}\selectfont}%
+  \def\infoboxfont{\fontfamily{tim}\fontsize{8}{8}\selectfont}%
+  %
 %  \def\watermarkfont{\reset@font\fontfamily{\ffdefault}\fontsize{45}{45}\bfseries\selectfont}
+  \def\watermarkfont{\reset@font\fontfamily{\ffdefault}\fontsize{45}{45}\bfseries\selectfont}
+  %
   \def\pagenumfont{\rmfamily\fontsize{7}{9}\bfseries\selectfont}%
 …
     \fi
   \fi%
   \renewcommand\thefigure{\@Alph\c@section\arabic{figure}}%
   \renewcommand\thetable{\@Alph\c@section\arabic{table}}%
+  \renewcommand\thefigure{\@Alph\c@section\arabic{figure}\enspace }%
+  \renewcommand\thetable{\@Alph\c@section\arabic{table}\enspace }%
   \renewcommand\theequation{\@Alph\c@section\arabic{equation}}%
 }{%

doc/papers/general/.gitignore

r7d0a3ba	r358cba0
8	8	Paper.out.ps
9	9	WileyNJD-AMA.bst
	10	evaluation.zip

doc/papers/general/Makefile

-              r7d0a3ba
+              r358cba0
         @rm -frv ${DOCUMENT} ${BASE}.ps WileyNJD-AMA.bst ${BASE}.out.ps ${Build}
+Paper.zip :
+        zip -x general/.gitignore -x general/"*AMA*" -x general/Paper.out.ps -x general/Paper.tex.plain -x general/evaluation.zip -x general/mail -x general/response -x general/test.c -x general/evaluation.zip -x general/Paper.tex.plain -x general/Paper.ps -x general/Paper.pdf -x general/"*build*" -x general/evaluation/.gitignore -x general/evaluation/timing.xlsx -r Paper.zip general
+evaluation.zip :
+        zip -x evaluation/.gitignore  -x evaluation/timing.xlsx -x evaluation/timing.dat -r evaluation.zip evaluation
 # File Dependencies #
 …
 ## Define the default recipes.
 ${Build}:
+${Build} :
         mkdir -p ${Build}
 ${BASE}.out.ps: ${Build}
+${BASE}.out.ps : ${Build}
         ln -fs ${Build}/Paper.out.ps .
 WileyNJD-AMA.bst:
+WileyNJD-AMA.bst :
         ln -fs ../AMA/AMA-stix/ama/WileyNJD-AMA.bst .

doc/papers/general/Paper.tex

-              r7d0a3ba
+              r358cba0
 %\DeclareTextCommandDefault{\textunderscore}{\leavevmode\makebox[1.2ex][c]{\rule{1ex}{0.1ex}}}
 \renewcommand{\textunderscore}{\leavevmode\makebox[1.2ex][c]{\rule{1ex}{0.075ex}}}
+\renewcommand*{\thefootnote}{\Alph{footnote}} % hack because fnsymbol does not work
+%\renewcommand*{\thefootnote}{\fnsymbol{footnote}}
 \makeatletter
 …
 \lstMakeShortInline@%
+\let\OLDthebibliography\thebibliography
+\renewcommand\thebibliography[1]{
+  \OLDthebibliography{#1}
+  \setlength{\parskip}{0pt}
+  \setlength{\itemsep}{4pt plus 0.3ex}
+}
 \title{\texorpdfstring{\protect\CFA : Adding Modern Programming Language Features to C}{Cforall : Adding Modern Programming Language Features to C}}
 …
 The C programming language is a foundational technology for modern computing with millions of lines of code implementing everything from commercial operating-systems to hobby projects.
 This installation base and the programmers producing it represent a massive software-engineering investment spanning decades and likely to continue for decades more.
+Nevertheless, C, first standardized over thirty years ago, lacks many features that make programming in more modern languages safer and more productive.
+The goal of the \CFA project is to create an extension of C that provides modern safety and productivity features while still ensuring strong backwards compatibility with C and its programmers.
+Nevertheless, C, first standardized almost forty years ago, lacks many features that make programming in more modern languages safer and more productive.
+The goal of the \CFA project (pronounced ``C-for-all'') is to create an extension of C that provides modern safety and productivity features while still ensuring strong backwards compatibility with C and its programmers.
 Prior projects have attempted similar goals but failed to honour C programming-style; for instance, adding object-oriented or functional programming with garbage collection is a non-starter for many C developers.
 Specifically, \CFA is designed to have an orthogonal feature-set based closely on the C programming paradigm, so that \CFA features can be added \emph{incrementally} to existing C code-bases, and C programmers can learn \CFA extensions on an as-needed basis, preserving investment in existing code and programmers.
 …
 Love it or hate it, C is extremely popular, highly used, and one of the few systems languages.
 In many cases, \CC is used solely as a better C.
 Nevertheless, C, first standardized over thirty years ago, lacks many features that make programming in more modern languages safer and more productive.
+Nevertheless, C, first standardized almost forty years ago~\cite{ANSI89:C}, lacks many features that make programming in more modern languages safer and more productive.
 \CFA (pronounced ``C-for-all'', and written \CFA or Cforall) is an evolutionary extension of the C programming language that adds modern language-features to C, while maintaining both source and runtime compatibility with C and a familiar programming model for programmers.
 …
 All language features discussed in this paper are working, except some advanced exception-handling features.
 Not discussed in this paper are the integrated concurrency-constructs and user-level threading-library~\cite{Delisle18}.
 \CFA is an \emph{open-source} project implemented as an source-to-source translator from \CFA to the gcc-dialect of C~\cite{GCCExtensions}, allowing it to leverage the portability and code optimizations provided by gcc, meeting goals (1)--(3).
+\CFA is an \emph{open-source} project implemented as a source-to-source translator from \CFA to the gcc-dialect of C~\cite{GCCExtensions}, allowing it to leverage the portability and code optimizations provided by gcc, meeting goals (1)--(3).
 Ultimately, a compiler is necessary for advanced features and optimal performance.
 % @plg2[9]% cd cfa-cc/src; cloc ArgTweak CodeGen CodeTools Common Concurrency ControlStruct Designators GenPoly InitTweak MakeLibCfa.cc MakeLibCfa.h Parser ResolvExpr SymTab SynTree Tuples driver prelude main.cc
 …
 The \CFA tests are 290+ files and 27,000+ lines of code.
 The tests illustrate syntactic and semantic features in \CFA, plus a growing number of runtime benchmarks.
 The tests check for correctness and are used for daily regression testing of commits (3800+).
+The tests check for correctness and are used for daily regression testing of 3800+ commits.
 Finally, it is impossible to describe a programming language without usages before definitions.
 …
 There are only two hard things in Computer Science: cache invalidation and \emph{naming things} -- Phil Karlton
 \end{quote}
 \vspace{-10pt}
+\vspace{-9pt}
 C already has a limited form of ad-hoc polymorphism in the form of its basic arithmetic operators, which apply to a variety of different types using identical syntax.
 \CFA extends the built-in operator overloading by allowing users to define overloads for any function, not just operators, and even any variable;
 …
 int max( int a, int b ) { return a < b ? b : a; }  $\C{// (3)}$
 double max( double a, double b ) { return a < b ? b : a; }  $\C{// (4)}\CRT$
 max( 7, -max );                                         $\C[2.75in]{// uses (3) and (1), by matching int from constant 7}$
+max( 7, -max );                                         $\C{// uses (3) and (1), by matching int from constant 7}$
 max( max, 3.14 );                                       $\C{// uses (4) and (2), by matching double from constant 3.14}$
 max( max, -max );                                       $\C{// ERROR: ambiguous}$
 int m = max( max, -max );                       $\C{// uses (3) and (1) twice, by matching return type}\CRT$
+max( max, -max );                                       $\C{// ERROR, ambiguous}$
+int m = max( max, -max );                       $\C{// uses (3) and (1) twice, by matching return type}$
 \end{cfa}
 …
 As is shown later, there are a number of situations where \CFA takes advantage of available type information to disambiguate, where other programming languages generate ambiguities.
 \Celeven added @_Generic@ expressions, which is used in preprocessor macros to provide a form of ad-hoc polymorphism;
+\Celeven added @_Generic@ expressions~\cite[\S~6.5.1.1]{C11}, which are used with preprocessor macros to provide ad-hoc polymorphism;
 however, this polymorphism is both functionally and ergonomically inferior to \CFA name overloading.
 The macro wrapping the generic expression imposes some limitations;
 \eg, it cannot implement the example above, because the variables @max@ are ambiguous with the functions @max@.
 Ergonomic limitations of @_Generic@ include the necessity to put a fixed list of supported types in a single place and manually dispatch to appropriate overloads, as well as possible namespace pollution from the dispatch functions, which must all have distinct names.
 For backwards compatibility, \CFA supports @_Generic@ expressions, but it is an unnecessary mechanism. \TODO{actually implement that}
+\CFA supports @_Generic@ expressions for backwards compatibility, but it is an unnecessary mechanism. \TODO{actually implement that}
 % http://fanf.livejournal.com/144696.html
 …
 \begin{cfa}
 forall( otype T `| { T ?+?(T, T); }` ) T twice( T x ) { return x `+` x; }  $\C{// ? denotes operands}$
 int val = twice( twice( 3.7 ) );
+int val = twice( twice( 3.7 ) );  $\C{// val == 14}$
 \end{cfa}
 which works for any type @T@ with a matching addition operator.
 The polymorphism is achieved by creating a wrapper function for calling @+@ with @T@ bound to @double@, then passing this function to the first call of @twice@.
 There is now the option of using the same @twice@ and converting the result to @int@ on assignment, or creating another @twice@ with type parameter @T@ bound to @int@ because \CFA uses the return type~\cite{Cormack81,Baker82,Ada} in its type analysis.
 The first approach has a late conversion from @double@ to @int@ on the final assignment, while the second has an eager conversion to @int@.
+The first approach has a late conversion from @double@ to @int@ on the final assignment, while the second has an early conversion to @int@.
 \CFA minimizes the number of conversions and their potential to lose information, so it selects the first approach, which corresponds with C-programmer intuition.
 …
 \begin{cfa}
 forall( otype T | { int ?<?( T, T ); } ) void qsort( const T * arr, size_t size ) { /* use C qsort */ }
+{
+int main() {
         int ?<?( double x, double y ) { return x `>` y; } $\C{// locally override behaviour}$
         qsort( vals, size );                                    $\C{// descending sort}$
+        qsort( vals, 10 );                                                      $\C{// descending sort}$
+}
 \end{cfa}
 …
 Hence, programmers can easily form local environments, adding and modifying appropriate functions, to maximize reuse of other existing functions and types.
 To reducing duplication, it is possible to distribute a group of @forall@ (and storage-class qualifiers) over functions/types, so each block declaration is prefixed by the group (see example in Appendix~\ref{s:CforallStack}).
+To reduce duplication, it is possible to distribute a group of @forall@ (and storage-class qualifiers) over functions/types, so each block declaration is prefixed by the group (see example in Appendix~\ref{s:CforallStack}).
 \begin{cfa}
 forall( otype `T` ) {                                                   $\C{// distribution block, add forall qualifier to declarations}$
 …
 \end{cquote}
+In fact, the set of @summable@ trait operators is incomplete, as it is missing assignment for type @T@, but @otype@ is syntactic sugar for the following implicit trait:
+Note, the @sumable@ trait does not include a copy constructor needed for the right side of @?+=?@ and return;
+it is provided by @otype@, which is syntactic sugar for the following trait:
 \begin{cfa}
 trait otype( dtype T | sized(T) ) {  // sized is a pseudo-trait for types with known size and alignment
 …
 Instead, each polymorphic function (or generic type) defines the structural type needed for its execution (polymorphic type-key), and this key is fulfilled at each call site from the lexical environment, which is similar to Go~\cite{Go} interfaces.
 Hence, new lexical scopes and nested functions are used extensively to create local subtypes, as in the @qsort@ example, without having to manage a nominal-inheritance hierarchy.
 (Nominal inheritance can be approximated with traits using marker variables or functions, as is done in Go.)
+% (Nominal inheritance can be approximated with traits using marker variables or functions, as is done in Go.)
 % Nominal inheritance can be simulated with traits using marker variables or functions:
 …
-\vspace*{-2pt}
 \section{Generic Types}
 …
 \begin{cquote}
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l|@{\hspace{2\parindentlnth}}l@{}}
 \begin{cfa}
 forall( otype R, otype S ) struct pair {
+\begin{tabular}{@{}l|@{\hspace{\parindentlnth}}l@{}}
+\begin{cfa}
+`forall( otype R, otype S )` struct pair {
         R first;        S second;
 };
 …
 Concrete types have a fixed memory layout regardless of type parameters, while dynamic types vary in memory layout depending on their type parameters.
 A \newterm{dtype-static} type has polymorphic parameters but is still concrete.
+Polymorphic pointers are an example of dtype-static types, \eg @forall(dtype T) T *@ is a polymorphic type, but for any @T@, @T *@  is a fixed-sized pointer, and therefore, can be represented by a @void *@ in code generation.
+Polymorphic pointers are an example of dtype-static types;
+given some type variable @T@, @T@ is a polymorphic type, as is @T *@, but @T *@ has a fixed size and can therefore be represented by @void *@ in code generation.
 \CFA generic types also allow checked argument-constraints.
 …
 \begin{cfa}
 struct _pair_conc0 {
+        const char * first;
+        int second;
+        const char * first;  int second;
 };
 \end{cfa}
 …
 \begin{cfa}
 struct _pair_conc1 {
+        void * first;
+        void * second;
+        void * first, * second;
 };
 \end{cfa}
 …
 \begin{cquote}
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
+\begin{tabular}{@{}l|@{\hspace{\parindentlnth}}l@{}}
 \begin{cfa}
 forall( dtype Unit ) struct scalar { unsigned long value; };
 …
                                                         half_marathon;
 scalar(litres) two_pools = pool + pool;
 `marathon + pool;`      // compilation ERROR
+`marathon + pool;`      // ERROR, mismatched types
 \end{cfa}
 \end{tabular}
 …
+}
 \end{cfa}
 One more step permits the summation of any summable type with all arguments of the same type:
 \begin{cfa}
 trait summable( otype T ) {
+One more step permits the summation of any sumable type with all arguments of the same type:
+\begin{cfa}
+trait sumable( otype T ) {
         T ?+?( T, T );
 };
 forall( otype R | summable( R ) ) R sum( R x, R y ) {
+forall( otype R | sumable( R ) ) R sum( R x, R y ) {
         return x + y;
+}
 forall( otype R, ttype Params | summable(R) | { R sum(R, Params); } ) R sum(R x, R y, Params rest) {
+forall( otype R, ttype Params | sumable(R) | { R sum(R, Params); } ) R sum(R x, R y, Params rest) {
         return sum( x + y, rest );
+}
 …
 \begin{cfa}
 forall( dtype T0, dtype T1 | sized(T0) | sized(T1) ) struct _tuple2 {
+        T0 field_0;                                                             $\C{// generated before the first 2-tuple}$
+        T1 field_1;
+        T0 field_0;  T1 field_1;                                        $\C{// generated before the first 2-tuple}$
 };
 _tuple2(int, int) f() {
         _tuple2(double, double) x;
         forall( dtype T0, dtype T1, dtype T2 | sized(T0) | sized(T1) | sized(T2) ) struct _tuple3 {
+                T0 field_0;                                                     $\C{// generated before the first 3-tuple}$
+                T1 field_1;
+                T2 field_2;
+                T0 field_0;  T1 field_1;  T2 field_2;   $\C{// generated before the first 3-tuple}$
         };
         _tuple3(int, double, int) y;
+}
 \end{cfa}
+{\sloppy
+Tuple expressions are then simply converted directly into compound literals, \eg @[5, 'x', 1.24]@ becomes @(_tuple3(int, char, double)){ 5, 'x', 1.24 }@.
+\par}%
+Tuple expressions are then converted directly into compound literals, \eg @[5, 'x', 1.24]@ becomes @(_tuple3(int, char,@ @double)){ 5, 'x', 1.24 }@.
 \begin{comment}
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 case 2, 10, 34, 42:
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 case 2~42:
 …
 \centering
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\begin{tabular}{@{}l|@{\hspace{\parindentlnth}}l@{}}
+\multicolumn{1}{@{}c|@{\hspace{\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 `choose` ( day ) {
   case Mon~Thu:  // program
   case Fri:  // program
+  case Fri:    // program
         wallet += pay;
         `fallthrough;`
   case Sat:  // party
+  case Sat:   // party
         wallet -= party;
   case Sun:  // rest
   default:  // error
+  default:    // print error
+}
 \end{cfa}
 …
   case Mon: case Tue: case Wed: case Thu:  // program
         `break;`
   case Fri:  // program
+  case Fri:    // program
         wallet += pay;
   case Sat:  // party
+  case Sat:   // party
         wallet -= party;
         `break;`
   case Sun:  // rest
         `break;`
   default:  // error
+  default:    // print error
+}
 \end{cfa}
 …
 \centering
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{non-terminator}}  & \multicolumn{1}{c}{\textbf{target label}}     \\
+\begin{tabular}{@{}l|@{\hspace{\parindentlnth}}l@{}}
+\multicolumn{1}{@{}c|@{\hspace{\parindentlnth}}}{\textbf{non-terminator}}       & \multicolumn{1}{c@{}}{\textbf{target label}}  \\
 \begin{cfa}
 choose ( ... ) {
 …
 \begin{figure}
 \lstDeleteShortInline@%
 \begin{tabular}{@{\hspace{\parindentlnth}}l@{\hspace{\parindentlnth}}l@{\hspace{\parindentlnth}}l@{}}
 \multicolumn{1}{@{\hspace{\parindentlnth}}c@{\hspace{\parindentlnth}}}{\textbf{\CFA}}   & \multicolumn{1}{@{\hspace{\parindentlnth}}c}{\textbf{C}}      \\
+\begin{tabular}{@{\hspace{\parindentlnth}}l|@{\hspace{\parindentlnth}}l@{\hspace{\parindentlnth}}l@{}}
+\multicolumn{1}{@{\hspace{\parindentlnth}}c|@{\hspace{\parindentlnth}}}{\textbf{\CFA}}  & \multicolumn{1}{@{\hspace{\parindentlnth}}c@{}}{\textbf{C}}   \\
 \begin{cfa}
 `LC:` {
 …
 \subsection{Exception Handling}
 The following framework for \CFA exception handling is in place, excluding some runtime type-information and virtual functions.
+The following framework for \CFA exception-handling is in place, excluding some runtime type-information and virtual functions.
 \CFA provides two forms of exception handling: \newterm{fix-up} and \newterm{recovery} (see Figure~\ref{f:CFAExceptionHandling})~\cite{Buhr92b,Buhr00a}.
 Both mechanisms provide dynamic call to a handler using dynamic name-lookup, where fix-up has dynamic return and recovery has static return from the handler.
 …
 \begin{cquote}
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{Resumption}}      & \multicolumn{1}{c}{\textbf{Termination}}      \\
+\begin{tabular}{@{}l|@{\hspace{\parindentlnth}}l@{}}
+\multicolumn{1}{@{}c|@{\hspace{\parindentlnth}}}{\textbf{Resumption}}   & \multicolumn{1}{c@{}}{\textbf{Termination}}   \\
 \begin{cfa}
 `exception R { int fix; };`
 …
 If an exception is raised and caught, the handler is run before the finally clause.
 Like a destructor (see Section~\ref{s:ConstructorsDestructors}), a finally clause can raise an exception but not if there is an exception being propagated.
 Mimicking the @finally@ clause with mechanisms like RAII is non-trivially when there are multiple types and local accesses.
+Mimicking the @finally@ clause with mechanisms like RAII is non-trivial when there are multiple types and local accesses.
 …
 with ( s, t ) {
         j + k;                                                                  $\C{// unambiguous, s.j + t.k}$
         m = 5.0;                                                                $\C{// unambiguous, t.m = 5.0}$
         m = 1;                                                                  $\C{// unambiguous, s.m = 1}$
         int a = m;                                                              $\C{// unambiguous, a = s.i }$
         double b = m;                                                   $\C{// unambiguous, b = t.m}$
+        m = 5.0;                                                                $\C{// unambiguous, s.m = 5.0}$
+        m = 1;                                                                  $\C{// unambiguous, t.m = 1}$
+        int a = m;                                                              $\C{// unambiguous, a = t.m }$
+        double b = m;                                                   $\C{// unambiguous, b = s.m}$
         int c = s.i + t.i;                                              $\C{// unambiguous, qualification}$
         (double)m;                                                              $\C{// unambiguous, cast}$
+        (double)m;                                                              $\C{// unambiguous, cast s.m}$
+}
 \end{cfa}
 …
 and implicitly opened \emph{after} a function-body open, to give them higher priority:
 \begin{cfa}
 void ?{}( S & s, int `i` ) with ( s ) `with( $\emph{\color{red}params}$ )` {
+void ?{}( S & s, int `i` ) with ( s ) `{` `with( $\emph{\color{red}params}$ )` {
         s.i = `i`; j = 3; m = 5.5;
+}
+} `}`
 \end{cfa}
 Finally, a cast may be used to disambiguate among overloaded variables in a @with@ expression:
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 `[5] *` int x1;
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 `*` int x, y;
 int y;
 \end{cfa}
+&
 \begin{cfa}
 int `*`x, `*`y;
+int z;
+\end{cfa}
+&
+\begin{cfa}
+int `*`x, `*`y, z;
 \end{cfa}
 …
 \lstMakeShortInline@%
 \end{cquote}
+The downside of the \CFA semantics is the need to separate regular and pointer declarations.
+% The downside of the \CFA semantics is the need to separate regular and pointer declarations.
+The separation of regular and pointer declarations by \CFA declarations enforces greater clarity with only slightly more syntax.
 \begin{comment}
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{C}}     \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{C}}     \\
 \begin{cfa}
 [ 5 ] int z;
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{C}}     \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{C}}     \\
 \begin{cfa}
 extern const * const int x;
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 y = (* int)x;
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 [double] foo(), foo( int ), foo( double ) {...}
 …
 * [ * int ] ( int y ) gp;               $\C{// pointer to function returning pointer to int with int parameter}$
 * [ ] ( int, char ) hp;                 $\C{// pointer to function returning no result with int and char parameters}$
+* [ * int, int ] ( int ) jp;    $\C{// pointer to function returning pointer to int and int with int parameter}$
+\end{cfa}
+Note, a function name cannot be specified:
+\begin{cfa}
+* [ int x ] f () fp;                    $\C{// function name "f" is disallowed}\CRT$
+\end{cfa}
+* [ * int, int ] ( int ) jp;    $\C{// pointer to function returning pointer to int and int with int parameter}\CRT$
+\end{cfa}
+Note, the name of the function pointer is specified last, as for other variable declarations.
 Finally, new \CFA declarations may appear together with C declarations in the same program block, but cannot be mixed within a specific declaration.
 …
 This provides a much more orthogonal design for library implementors, obviating the need for workarounds such as @std::reference_wrapper@.
 Secondly, \CFA references are rebindable, whereas \CC references have a fixed address.
-\newsavebox{\LstBox}
-\begin{lrbox}{\LstBox}
-\lstset{basicstyle=\footnotesize\linespread{0.9}\sf}
-\begin{cfa}
-int & r = *new( int );
-...                                                                                     $\C{// non-null reference}$
-delete &r;                                                                      $\C{// unmanaged (programmer) memory-management}$
-r += 1;                                                                         $\C{// undefined reference}$
-\end{cfa}
-\end{lrbox}
 Rebinding allows \CFA references to be default-initialized (\eg to a null pointer\footnote{
+While effort has been put into non-null reference checking in \CC and Java, the exercise seems moot for any non-managed language (C/\CC), given that it only handles one of many different error situations:
+\begin{cquote}
+\usebox{\LstBox}
+\end{cquote}
+}%
+) and point to different addresses throughout their lifetime, like pointers.
+While effort has been put into non-null reference checking in \CC and Java, the exercise seems moot for any non-managed language (C/\CC), given that it only handles one of many different error situations, \eg using a pointer after its storage is deleted.}) and point to different addresses throughout their lifetime, like pointers.
 Rebinding is accomplished by extending the existing syntax and semantics of the address-of operator in C.
 …
 \begin{itemize}
 \item
 if @R@ is an rvalue of type {@T &@$_1 \cdots$@ &@$_r$} where $r \ge 1$ references (@&@ symbols) than @&R@ has type {@T `*`&@$_{\color{red}2} \cdots$@ &@$_{\color{red}r}$}, \\ \ie @T@ pointer with $r-1$ references (@&@ symbols).
+if @R@ is an rvalue of type {@T &@$_1 \cdots$@ &@$_r$} where $r \ge 1$ references (@&@ symbols) then @&R@ has type {@T `*`&@$_{\color{red}2} \cdots$@ &@$_{\color{red}r}$}, \\ \ie @T@ pointer with $r-1$ references (@&@ symbols).
 \item
 …
 \end{cfa}
 This allows complex values to be succinctly and efficiently passed to functions, without the syntactic overhead of explicit definition of a temporary variable or the runtime cost of pass-by-value.
 \CC allows a similar binding, but only for @const@ references; the more general semantics of \CFA are an attempt to avoid the \newterm{const hell} problem, in which addition of a @const@ qualifier to one reference requires a cascading chain of added qualifiers.
+\CC allows a similar binding, but only for @const@ references; the more general semantics of \CFA are an attempt to avoid the \newterm{const poisoning} problem~\cite{Taylor10}, in which addition of a @const@ qualifier to one reference requires a cascading chain of added qualifiers.
 …
 \begin{tabular}{@{}l@{\hspace{3em}}l|l@{}}
 \multicolumn{1}{c@{\hspace{3em}}}{\textbf{C Type Nesting}}      & \multicolumn{1}{c|}{\textbf{C Implicit Hoisting}}     & \multicolumn{1}{c}{\textbf{\CFA}}     \\
-\hline
 \begin{cfa}
 struct S {
 …
 The symbol \lstinline+^+ is used for the destructor name because it was the last binary operator that could be used in a unary context.}.
 The name @{}@ comes from the syntax for the initializer: @struct S { int i, j; } s = `{` 2, 3 `}`@.
 Like other \CFA operators, these names represent the syntax used to call the constructor or destructor, \eg @?{}(x, ...)@ or @^{}(x, ...)@.
+Like other \CFA operators, these names represent the syntax used to explicitly call the constructor or destructor, \eg @s{...}@ or @^s{...}@.
 The constructor and destructor have return type @void@, and the first parameter is a reference to the object type to be constructed or destructed.
 While the first parameter is informally called the @this@ parameter, as in object-oriented languages, any variable name may be used.
 Both constructors and destructors allow additional parametes after the @this@ parameter for specifying values for initialization/de-initialization\footnote{
+Both constructors and destructors allow additional parameters after the @this@ parameter for specifying values for initialization/de-initialization\footnote{
 Destruction parameters are useful for specifying storage-management actions, such as de-initialize but not deallocate.}.
 \begin{cfa}
 …
 void ^?{}( VLA & vla ) with ( vla ) { free( data ); } $\C{// destructor}$
+{
         VLA x;                                                                  $\C{// implicit:  ?\{\}( x );}$
 }                                                                                       $\C{// implicit:  ?\^{}\{\}( x );}$
+        VLA x;                                                                  $\C{// implicit:\ \ x\{\};}$
+}                                                                                       $\C{// implicit:\ \textasciicircum{}x\{\};}$
 \end{cfa}
 @VLA@ is a \newterm{managed type}\footnote{
 …
 appropriate care is taken to not recursively call the copy constructor when initializing the second parameter.
 \CFA constructors may be explicitly call, like Java, and destructors may be explicitly called, like \CC.
+\CFA constructors may be explicitly called, like Java, and destructors may be explicitly called, like \CC.
 Explicit calls to constructors double as a \CC-style \emph{placement syntax}, useful for construction of member fields in user-defined constructors and reuse of existing storage allocations.
 While existing call syntax works for explicit calls to constructors and destructors, \CFA also provides a more concise \newterm{operator syntax} for both:
+Like the other operators in \CFA, there is a concise syntax for constructor/destructor function calls:
 \begin{cfa}
+{
         VLA  x,            y = { 20, 0x01 },     z = y; $\C{// z points to y}$
         //      ?{}( x );   ?{}( y, 20, 0x01 );   ?{}( z, y );
+        //    x{};         y{ 20, 0x01 };          z{ y };
         ^x{};                                                                   $\C{// deallocate x}$
         x{};                                                                    $\C{// reallocate x}$
 …
         y{ x };                                                                 $\C{// reallocate y, points to x}$
         x{};                                                                    $\C{// reallocate x, not pointing to y}$
         // ^?{}(z);  ^?{}(y);  ^?{}(x);
+        //  ^z{};  ^y{};  ^x{};
+}
 \end{cfa}
 …
 In these cases, \CFA provides the initialization syntax \lstinline|S x `@=` {}|, and the object becomes unmanaged, so implicit constructor and destructor calls are not generated.
 Any C initializer can be the right-hand side of an \lstinline|@=| initializer, \eg \lstinline|VLA a @= { 0, 0x0 }|, with the usual C initialization semantics.
 The same syntax can be used in a compound literal, \eg \lstinline|a = VLA`@`{ 0, 0x0 }|, to create a C-style literal.
+The same syntax can be used in a compound literal, \eg \lstinline|a = (VLA)`@`{ 0, 0x0 }|, to create a C-style literal.
 The point of \lstinline|@=| is to provide a migration path from legacy C code to \CFA, by providing a mechanism to incrementally convert to implicit initialization.
 …
 In C, @0@ has the special property that it is the only ``false'' value;
 from the standard, any value that compares equal to @0@ is false, while any value that compares unequal to @0@ is true.
+by the standard, any value that compares equal to @0@ is false, while any value that compares unequal to @0@ is true.
 As such, an expression @x@ in any boolean context (such as the condition of an @if@ or @while@ statement, or the arguments to @&&@, @||@, or @?:@\,) can be rewritten as @x != 0@ without changing its semantics.
 Operator overloading in \CFA provides a natural means to implement this truth-value comparison for arbitrary types, but the C type system is not precise enough to distinguish an equality comparison with @0@ from an equality comparison with an arbitrary integer or pointer.
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{\hspace{2\parindentlnth}}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{postfix function}}        & \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{constant}}      & \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{variable/expression}}   & \multicolumn{1}{c}{\textbf{postfix pointer}}  \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{postfix function}}     & \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{constant}}      & \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{variable/expression}}   & \multicolumn{1}{c@{}}{\textbf{postfix pointer}}       \\
 \begin{cfa}
 int |?`h|( int s );
 …
 \lstset{language=CFA,moredelim=**[is][\color{red}]{|}{|},deletedelim=**[is][]{`}{`}}
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{\CC}}      \\
+\begin{tabular}{@{}l@{\hspace{1.25\parindentlnth}}l@{}}
+\multicolumn{1}{@{}c@{\hspace{1.25\parindentlnth}}}{\textbf{\CFA}}      & \multicolumn{1}{c@{}}{\textbf{\CC}}   \\
 \begin{cfa}
 struct W {
 …
         W w, heavy = { 20 };
         w = 155|_lb|;
         w = 0b1111|_lb|;       // error, binary unsupported
+        // binary unsupported
         w = 0${\color{red}\LstBasicStyle{'}}$233|_lb|;          // quote separator
         w = 0x9b|_kg|;
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{Definition}}      & \multicolumn{1}{c}{\textbf{Usage}}    \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{Definition}}   & \multicolumn{1}{c@{}}{\textbf{Usage}} \\
 \begin{cfa}
 const short int `MIN` = -32768;
 …
 \begin{cquote}
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\begin{tabular}{@{}l@{\hspace{\parindentlnth}}l@{}}
+\multicolumn{1}{@{}c@{\hspace{\parindentlnth}}}{\textbf{\CFA}}  & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 MIN
 MAX
 PI
+E
 …
+&
 \begin{cfa}
+SCHAR_MIN, CHAR_MIN, SHRT_MIN, INT_MIN, LONG_MIN,
+        LLONG_MIN, FLT_MIN, DBL_MIN, LDBL_MIN
+SCHAR_MAX, UCHAR_MAX, SHRT_MAX, INT_MAX, LONG_MAX,
+        LLONG_MAX, FLT_MAX, DBL_MAX, LDBL_MAX
+CHAR_MIN, SHRT_MIN, INT_MIN, LONG_MIN, LLONG_MIN, FLT_MIN, DBL_MIN, LDBL_MIN
+UCHAR_MAX, SHRT_MAX, INT_MAX, LONG_MAX, LLONG_MAX, FLT_MAX, DBL_MAX, LDBL_MAX
 M_PI, M_PIl
 M_E, M_El
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{Definition}}      & \multicolumn{1}{c}{\textbf{Usage}}    \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{Definition}}   & \multicolumn{1}{c@{}}{\textbf{Usage}} \\
 \begin{cfa}
 float `log`( float x );
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 log
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{Definition}}      & \multicolumn{1}{c}{\textbf{Usage}}    \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{Definition}}   & \multicolumn{1}{c@{}}{\textbf{Usage}} \\
 \begin{cfa}
 unsigned int `abs`( int );
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 abs
 …
 an allocation with a specified character.
 \item[resize]
 an existing allocation to decreased or increased its size.
+an existing allocation to decrease or increase its size.
 In either case, new storage may or may not be allocated and, if there is a new allocation, as much data as possible from the existing allocation is copied.
 For an increase in storage size, new storage after the copied data may be filled.
 …
 \begin{table}
+\caption{Storage-Management Operations}
+\label{t:StorageManagementOperations}
 \centering
 \lstDeleteShortInline@%
 …
 \lstDeleteShortInline~%
 \lstMakeShortInline@%
-\caption{Storage-Management Operations}
-\label{t:StorageManagementOperations}
 \end{table}
 \begin{figure}
 \centering
+\begin{cquote}
+\begin{cfa}[aboveskip=0pt]
+\begin{cfa}[aboveskip=0pt,xleftmargin=0pt]
 size_t  dim = 10;                                                       $\C{// array dimension}$
 char fill = '\xff';                                                     $\C{// initialization fill value}$
 …
 \end{cfa}
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{C}}        \\
 \begin{cfa}
+\begin{tabular}{@{}l@{\hspace{\parindentlnth}}l@{}}
+\multicolumn{1}{@{}c@{\hspace{\parindentlnth}}}{\textbf{\CFA}}  & \multicolumn{1}{c@{}}{\textbf{C}}     \\
+\begin{cfa}[xleftmargin=-10pt]
 ip = alloc();
 ip = alloc( fill );
 …
+&
 \begin{cfa}
+ip = (int *)malloc( sizeof( int ) );
+ip = (int *)malloc( sizeof( int ) ); memset( ip, fill, sizeof( int ) );
+ip = (int *)malloc( dim * sizeof( int ) );
+ip = (int *)malloc( dim * sizeof( int ) ); memset( ip, fill, dim * sizeof( int ) );
+ip = (int *)realloc( ip, 2 * dim * sizeof( int ) );
+ip = (int *)realloc( ip, 4 * dim * sizeof( int ) );
+                        memset( ip, fill, 4 * dim * sizeof( int ) );
+ip = memalign( 16, sizeof( int ) );
+ip = memalign( 16, sizeof( int ) ); memset( ip, fill, sizeof( int ) );
+ip = memalign( 16, dim * sizeof( int ) );
+ip = memalign( 16, dim * sizeof( int ) ); memset( ip, fill, dim * sizeof( int ) );
+\end{cfa}
+\end{tabular}
+\lstMakeShortInline@%
+\end{cquote}
+ip = (int *)malloc( sizeof(int) );
+ip = (int *)malloc( sizeof(int) ); memset( ip, fill, sizeof(int) );
+ip = (int *)malloc( dim * sizeof(int) );
+ip = (int *)malloc( dim * sizeof(int) ); memset( ip, fill, dim * sizeof(int) );
+ip = (int *)realloc( ip, 2 * dim * sizeof(int) );
+ip = (int *)realloc( ip, 4 * dim * sizeof(int) ); memset( ip, fill, 4 * dim * sizeof(int));
+ip = memalign( 16, sizeof(int) );
+ip = memalign( 16, sizeof(int) ); memset( ip, fill, sizeof(int) );
+ip = memalign( 16, dim * sizeof(int) );
+ip = memalign( 16, dim * sizeof(int) ); memset( ip, fill, dim * sizeof(int) );
+\end{cfa}
+\end{tabular}
+\lstMakeShortInline@%
 \caption{\CFA versus C Storage-Allocation}
 \label{f:StorageAllocation}
 …
 S * as = anew( dim, 2, 3 );                                     $\C{// each array element initialized to 2, 3}$
 \end{cfa}
 Note, \CC can only initialization array elements via the default constructor.
+Note, \CC can only initialize array elements via the default constructor.
 Finally, the \CFA memory-allocator has \newterm{sticky properties} for dynamic storage: fill and alignment are remembered with an object's storage in the heap.
 …
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{c}{\textbf{\CC}}      \\
+\multicolumn{1}{@{}c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{\CC}}   \\
 \begin{cfa}
 int x = 1, y = 2, z = 3;
 …
 \end{cquote}
 There is a weak similarity between the \CFA logical-or operator and the Shell pipe-operator for moving data, where data flows in the correct direction for input but the opposite direction for output.
+\begin{comment}
 The implicit separator character (space/blank) is a separator not a terminator.
 The rules for implicitly adding the separator are:
 …
 }%
 \end{itemize}
+\end{comment}
 There are functions to set and get the separator string, and manipulators to toggle separation on and off in the middle of output.
 …
 \centering
 \lstDeleteShortInline@%
 \begin{tabular}{@{}l@{\hspace{2\parindentlnth}}@{\hspace{2\parindentlnth}}l@{}}
 \multicolumn{1}{c@{\hspace{2\parindentlnth}}}{\textbf{\CFA}}    & \multicolumn{1}{@{\hspace{2\parindentlnth}}c}{\textbf{C}}     \\
+\begin{tabular}{@{}l@{\hspace{3\parindentlnth}}l@{}}
+\multicolumn{1}{@{}c@{\hspace{3\parindentlnth}}}{\textbf{\CFA}} & \multicolumn{1}{c@{}}{\textbf{C}}     \\
 \begin{cfa}
 #include <gmp>
 …
 \section{Evaluation}
+\section{Polymorphism Evaluation}
 \label{sec:eval}
+Though \CFA provides significant added functionality over C, these features have a low runtime penalty.
+In fact, \CFA's features for generic programming can enable faster runtime execution than idiomatic @void *@-based C code.
+This claim is demonstrated through a set of generic-code-based micro-benchmarks in C, \CFA, and \CC (see stack implementations in Appendix~\ref{sec:BenchmarkStackImplementations}).
+\CFA adds parametric polymorphism to C.
+A runtime evaluation is performed to compare the cost of alternative styles of polymorphism.
+The goal is to compare just the underlying mechanism for implementing different kinds of polymorphism.
+% Though \CFA provides significant added functionality over C, these features have a low runtime penalty.
+% In fact, it is shown that \CFA's generic programming can enable faster runtime execution than idiomatic @void *@-based C code.
+The experiment is a set of generic-stack micro-benchmarks~\cite{CFAStackEvaluation} in C, \CFA, and \CC (see implementations in Appendix~\ref{sec:BenchmarkStackImplementations}).
 Since all these languages share a subset essentially comprising standard C, maximal-performance benchmarks should show little runtime variance, differing only in length and clarity of source code.
 A more illustrative comparison measures the costs of idiomatic usage of each language's features.
 …
 \end{figure}
 The structure of each benchmark implemented is: C with @void *@-based polymorphism, \CFA with the presented features, \CC with templates, and \CC using only class inheritance for polymorphism, called \CCV.
+The structure of each benchmark implemented is: C with @void *@-based polymorphism, \CFA with parametric polymorphism, \CC with templates, and \CC using only class inheritance for polymorphism, called \CCV.
 The \CCV variant illustrates an alternative object-oriented idiom where all objects inherit from a base @object@ class, mimicking a Java-like interface;
 hence runtime checks are necessary to safely down-cast objects.
 The most notable difference among the implementations is in memory layout of generic types: \CFA and \CC inline the stack and pair elements into corresponding list and pair nodes, while C and \CCV lack such a capability and instead must store generic objects via pointers to separately-allocated objects.
 Note that the C benchmark uses unchecked casts as there is no runtime mechanism to perform such checks, while \CFA and \CC provide type-safety statically.
+Note, the C benchmark uses unchecked casts as C has no runtime mechanism to perform such checks, while \CFA and \CC provide type-safety statically.
 Figure~\ref{fig:eval} and Table~\ref{tab:eval} show the results of running the benchmark in Figure~\ref{fig:BenchmarkTest} and its C, \CC, and \CCV equivalents.
 …
 \begin{table}
-\centering
 \caption{Properties of benchmark code}
 \label{tab:eval}
+\centering
 \newcommand{\CT}[1]{\multicolumn{1}{c}{#1}}
 \begin{tabular}{rrrrr}
 …
 The C and \CCV variants are generally the slowest with the largest memory footprint, because of their less-efficient memory layout and the pointer-indirection necessary to implement generic types;
 this inefficiency is exacerbated by the second level of generic types in the pair benchmarks.
 By contrast, the \CFA and \CC variants run in roughly equivalent time for both the integer and pair of @short@ and @char@ because the storage layout is equivalent, with the inlined libraries (\ie no separate compilation) and greater maturity of the \CC compiler contributing to its lead.
+By contrast, the \CFA and \CC variants run in roughly equivalent time for both the integer and pair because of equivalent storage layout, with the inlined libraries (\ie no separate compilation) and greater maturity of the \CC compiler contributing to its lead.
 \CCV is slower than C largely due to the cost of runtime type-checking of down-casts (implemented with @dynamic_cast@).
+The outlier in the graph for \CFA, pop @pair@, results from the complexity of the generated-C polymorphic code.
+The gcc compiler is unable to optimize some dead code and condense nested calls; a compiler designed for \CFA could easily perform these optimizations.
+The outlier for \CFA, pop @pair@, results from the complexity of the generated-C polymorphic code.
+The gcc compiler is unable to optimize some dead code and condense nested calls;
+a compiler designed for \CFA could easily perform these optimizations.
 Finally, the binary size for \CFA is larger because of static linking with the \CFA libraries.
 …
 Line-count is a fairly rough measure of code complexity;
 another important factor is how much type information the programmer must specify manually, especially where that information is not compiler-checked.
 Such unchecked type information produces a heavier documentation burden and increased potential for runtime bugs, and is much less common in \CFA than C, with its manually specified function pointer arguments and format codes, or \CCV, with its extensive use of untype-checked downcasts, \eg @object@ to @integer@ when popping a stack.
+Such unchecked type information produces a heavier documentation burden and increased potential for runtime bugs, and is much less common in \CFA than C, with its manually specified function pointer arguments and format codes, or \CCV, with its extensive use of un-type-checked downcasts, \eg @object@ to @integer@ when popping a stack.
 To quantify this manual typing, the ``redundant type annotations'' line in Table~\ref{tab:eval} counts the number of lines on which the type of a known variable is respecified, either as a format specifier, explicit downcast, type-specific function, or by name in a @sizeof@, struct literal, or @new@ expression.
 The \CC benchmark uses two redundant type annotations to create new stack nodes, while the C and \CCV benchmarks have several such annotations spread throughout their code.
 The \CFA benchmark is able to eliminate all redundant type annotations through use of the polymorphic @alloc@ function discussed in Section~\ref{sec:libraries}.
+We conjecture these results scale across most generic data-types as the underlying polymorphism implementation is constant.
 \section{Related Work}
 …
 \subsection{Polymorphism}
+ML~\cite{ML} was the first language to support parametric polymorphism.
+Like \CFA, it supports universal type parameters, but not the use of assertions and traits to constrain type arguments.
+Haskell~\cite{Haskell10} combines ML-style polymorphism, polymorphic data types, and type inference with the notion of type classes, collections of overloadable methods that correspond in intent to traits in \CFA.
+Unlike \CFA, Haskell requires an explicit association between types and their classes that specifies the implementation of operations.
+These associations determine the functions that are assertion arguments for particular combinations of class and type, in contrast to \CFA where the assertion arguments are selected at function call sites based upon the set of operations in scope at that point.
+Haskell also severely restricts the use of overloading: an overloaded name can only be associated with a single class, and methods with overloaded names can only be defined as part of instance declarations.
 \CC provides three disjoint polymorphic extensions to C: overloading, inheritance, and templates.
 …
 Go does not have tuples but supports MRVF.
 Java's variadic functions appear similar to C's but are type-safe using homogeneous arrays, which are less useful than \CFA's heterogeneously-typed variadic functions.
 Tuples are a fundamental abstraction in most functional programming languages, such as Standard ML~\cite{sml} and~\cite{Scala}, which decompose tuples using pattern matching.
+Tuples are a fundamental abstraction in most functional programming languages, such as Standard ML~\cite{sml}, Haskell, and Scala~\cite{Scala}, which decompose tuples using pattern matching.
 …
 Finally, we demonstrate that \CFA performance for some idiomatic cases is better than C and close to \CC, showing the design is practically applicable.
+There is ongoing work on a wide range of \CFA features, including arrays with size, runtime type-information, virtual functions, user-defined conversions, concurrent primitives, and modules.
+While all examples in the paper compile and run, a public beta-release of \CFA will take another 8--12 months to finalize these extensions.
+There are also interesting future directions for the polymorphism design.
+Notably, \CC template functions trade compile time and code bloat for optimal runtime of individual instantiations of polymorphic functions.
+\CFA polymorphic functions use dynamic virtual-dispatch;
+the runtime overhead of this approach is low, but not as low as inlining, and it may be beneficial to provide a mechanism for performance-sensitive code.
+While all examples in the paper compile and run, a public beta-release of \CFA will take 6--8 months to reduce compilation time, provide better debugging, and add a few more libraries.
+There is also new work on a number of \CFA features, including arrays with size, runtime type-information, virtual functions, user-defined conversions, and modules.
+While \CFA polymorphic functions use dynamic virtual-dispatch with low runtime overhead (see Section~\ref{sec:eval}), it is not as low as \CC template-inlining.
+Hence it may be beneficial to provide a mechanism for performance-sensitive code.
 Two promising approaches are an @inline@ annotation at polymorphic function call sites to create a template-specialization of the function (provided the code is visible) or placing an @inline@ annotation on polymorphic function-definitions to instantiate a specialized version for some set of types (\CC template specialization).
 These approaches are not mutually exclusive and allow performance optimizations to be applied only when necessary, without suffering global code-bloat.
 …
 The authors would like to recognize the design assistance of Glen Ditchfield, Richard Bilson, Thierry Delisle, Andrew Beach and Brice Dobry on the features described in this paper, and thank Magnus Madsen for feedback on the writing.
+This work is supported by a corporate partnership with Huawei Ltd.\ (\url{http://www.huawei.com}), and Aaron Moss and Peter Buhr are partially funded by the Natural Sciences and Engineering Research Council of Canada.
+Funding for this project has been provided by Huawei Ltd.\ (\url{http://www.huawei.com}), and Aaron Moss and Peter Buhr are partially funded by the Natural Sciences and Engineering Research Council of Canada.
+{%
+\fontsize{9bp}{12bp}\selectfont%
 \bibliography{pl}
+}%
 \appendix

doc/papers/general/evaluation/timing.gp

r7d0a3ba	r358cba0
25	25
26	26	set label "23.9" at 7.125,10.5
27
	27	set style fill pattern 4 border lt -1
28	28	# set datafile separator ","
29	29	plot for [COL=2:5] 'evaluation/timing.dat' using (column(COL)/SCALE):xticlabels(1) title columnheader

src/CodeGen/CodeGenerator.cc

-              r7d0a3ba
+              r358cba0
 // Created On       : Mon May 18 07:44:20 2015
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Sun Sep  3 20:42:52 2017
 // Update Count     : 490
+// Last Modified On : Sat May  5 09:08:32 2018
+// Update Count     : 494
 //
 #include "CodeGenerator.h"
 …
         void CodeGenerator::postvisit( Constant * constant ) {
                 output << constant->get_value() ;
+                output << constant->get_value();
+        }
 …
                 output << "(";
                 if ( castExpr->get_result()->isVoid() ) {
                         output << "(void)" ;
+                        output << "(void)";
                 } else {
                         // at least one result type of cast.
 …
                         } // for
                 } // if
                 output << " );" ;
+                output << " );";
+        }
 …
                 output << "( ";
                 if ( asmStmt->get_instruction() ) asmStmt->get_instruction()->accept( *visitor );
                 output << " )" ;
+                output << " )";
+        }
         void CodeGenerator::postvisit( DirectiveStmt * dirStmt ) {
                 output << dirStmt->directive;
+                output << endl << dirStmt->directive;                   // endl prevents spaces before directive
+        }
 …
         void CodeGenerator::postvisit( SwitchStmt * switchStmt ) {
                 output << "switch ( " ;
+                output << "switch ( ";
                 switchStmt->get_condition()->accept( *visitor );
                 output << " ) ";
 …
                 ++indent;
                 for ( std::list<Statement *>::iterator i = sts.begin(); i != sts.end();  i++) {
                         output << indent << printLabels( (*i)->get_labels() )  ;
+                        output << indent << printLabels( (*i)->get_labels() ) ;
                         (*i)->accept( *visitor );
                         output << endl;
 …
         void CodeGenerator::postvisit( WhileStmt * whileStmt ) {
                 if ( whileStmt->get_isDoWhile() ) {
                         output << "do" ;
                 } else {
                         output << "while (" ;
+                        output << "do";
+                } else {
+                        output << "while (";
                         whileStmt->get_condition()->accept( *visitor );
                         output << ")";
 …
                 if ( whileStmt->get_isDoWhile() ) {
                         output << " while (" ;
+                        output << " while (";
                         whileStmt->get_condition()->accept( *visitor );
                         output << ");";

src/CodeGen/FixNames.cc

-              r7d0a3ba
+              r358cba0
                 auto && name = SymTab::Mangler::mangle( mainDecl.get() );
                 // std::cerr << name << std::endl;
                 return name;
+                return std::move(name);
+        }
         std::string mangle_main_args() {
 …
                 auto&& name = SymTab::Mangler::mangle( mainDecl.get() );
                 // std::cerr << name << std::endl;
                 return name;
+                return std::move(name);
+        }

src/Common/Heap.cc

-              r7d0a3ba
+              r358cba0
 // Heap.cc --
 //
 // Author           : Peter A. Buhr
 // Created On       :
+// Author           : Thierry Delisle
+// Created On       : Thu May  3 16:16:10 2018
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Thu May  3 16:16:10 2018
 // Update Count     : 2
+// Last Modified On : Fri May  4 17:27:31 2018
+// Update Count     : 28
 //
+namespace HeapStats{
+  void newPass( const char * const name ) {}
+  void printStats() {}
+#include <cassert>
+#include <cmath>
+#include <cstddef>
+#include <cstring>
+#include <iomanip>
+#include <iostream>
+//#define WITH_HEAP_STATISTICS
+namespace HeapStats {
+#if !defined( WITH_HEAP_STATISTICS )
+        void newPass( const char * const ) {}                   // WITH_HEAP_STATISTICS undefined: registering a pass does nothing
+        void printStats() {}                                    // WITH_HEAP_STATISTICS undefined: nothing is printed
+#else
+        struct StatBlock {                                      // allocation counters kept for one named pass
+                const char * name = nullptr;                    // label printed in the "Pass" column of the report
+                size_t mallocs    = 0;                          // bumped by the malloc/calloc/realloc wrappers while this pass is the latest
+                size_t frees      = 0;                          // bumped by the free/realloc wrappers while this pass is the latest
+        };
+        StatBlock    passes[100] = {{ "Pre-Parse", 0, 0 }};     // slot 0 is pre-populated as the "Pre-Parse" pass
+        const size_t passes_size = sizeof(passes) / sizeof(passes[0]); // capacity of the passes table
+        size_t       passes_cnt = 1;                            // slots in use; starts at 1 because slot 0 is already filled
+        void newPass( const char * const name ) {
+                passes[passes_cnt].name    = name;
+                passes[passes_cnt].mallocs = 0;
+                passes[passes_cnt].frees   = 0;
+                passes_cnt++;
+                assertf(passes_cnt < passes_size, "Too many passes for HeapStats, increase the size of the array in Heap.h");
+        }
+        // Write `value` right-aligned in 12 columns, followed by its percentage of `total` as "(NNN%) | ".
+        void print(size_t value, size_t total) {
+                // a zero value is reported as 0% without touching `total`
+                const size_t percent = value == 0 ? 0 : value * 100 / total;
+                std::cerr << std::setw(12) << value
+                          << "(" << std::setw(3) << percent
+                          << "%) | ";
+        }
+        // Write one table row: the pass name padded to `nc` columns, then its malloc and free cells.
+        void print(const StatBlock& stat, size_t nc, size_t total_mallocs, size_t total_frees) {
+                std::cerr << std::setw(nc) << stat.name << " | ";
+                print(stat.mallocs, total_mallocs);             // malloc count and share of all mallocs
+                print(stat.frees, total_frees);                 // free count and share of all frees
+                std::cerr << "\n";
+        }
+        // Write a horizontal rule: `nc` copies of `c` followed by a newline.
+        void print(char c, size_t nc) {
+                for ( size_t remaining = nc; remaining != 0; --remaining ) {
+                        std::cerr << c;
+                }
+                std::cerr << '\n';
+        }
+        void printStats() {                                     // print the per-pass malloc/free table to std::cerr
+                size_t nc = 0;                                  // width of the name column = longest pass name
+                size_t total_mallocs = 0;
+                size_t total_frees   = 0;
+                for(size_t i = 0; i < passes_cnt; i++) {        // first sweep: column width and grand totals
+                        nc = std::max(nc, std::strlen(passes[i].name));
+                        total_mallocs += passes[i].mallocs;
+                        total_frees   += passes[i].frees;
+                }
+                size_t nct = nc + 44;                           // full table width: name column plus the 44 characters of the two count columns
+                const char * const title = "Heap Usage Statistic";
+                print('=', nct);
+                for(size_t i = 0; i < (nct - std::strlen(title)) / 2; i++) std::cerr << ' '; // centre the title
+                std::cerr << title << std::endl;
+                print('-', nct);
+                std::cerr << std::setw(nc) << "Pass";
+                std::cerr << " |       Malloc Count |         Free Count |" << std::endl;
+                print('-', nct);
+                for(size_t i = 0; i < passes_cnt; i++) {        // second sweep: one row per pass
+                        print(passes[i], nc, total_mallocs, total_frees);
+                }
+                print('-', nct);
+                print({"Sum", total_mallocs, total_frees}, nc, total_mallocs, total_frees); // summary row; its percentages are relative to the totals themselves
+        }
+#include <stdarg.h>
+#include <stddef.h>
+#include <stdio.h>
+#include <string.h>
+#include <unistd.h>
+#include <signal.h>
+        extern "C" {
+#include <dlfcn.h>
+#include <execinfo.h>
+        }
+//=============================================================================================
+// Interposing helpers
+//=============================================================================================
+        typedef void (* generic_fptr_t)(void);
+        generic_fptr_t interpose_symbol( const char * symbol, const char * version ) {
+                const char * error;
+                static void * library;
+                if ( ! library ) {
+#if defined( RTLD_NEXT )
+                        library = RTLD_NEXT;
+#else
+                        // missing RTLD_NEXT => must hard-code library name, assuming libstdc++
+                        library = dlopen( "libc.so.6", RTLD_LAZY );
+                        error = dlerror();
+                        if ( error ) {
+                                std::cerr << "interpose_symbol : failed to open libc, " << error << std::endl;
+                                abort();
+                        }
+#endif // RTLD_NEXT
+                } // if
+                generic_fptr_t fptr;
+#if defined( _GNU_SOURCE )
+                if ( version ) {
+                        fptr = (generic_fptr_t)dlvsym( library, symbol, version );
+                } else {
+                        fptr = (generic_fptr_t)dlsym( library, symbol );
+                }
+#else
+                fptr = (generic_fptr_t)dlsym( library, symbol );
+#endif // _GNU_SOURCE
+                error = dlerror();
+                if ( error ) {
+                        std::cerr << "interpose_symbol : internal error, " << error << std::endl;
+                        abort();
+                }
+                return fptr;
+        }
+        extern "C" {
+                void * malloc( size_t size ) __attribute__((malloc));
+                void * malloc( size_t size ) {
+                        static auto __malloc = reinterpret_cast<void * (*)(size_t)>(interpose_symbol( "malloc", nullptr ));
+                        if( passes_cnt > 0 ) passes[passes_cnt - 1].mallocs++;
+                        return __malloc( size );
+                }
+                void free( void * ptr ) {
+                        static auto __free = reinterpret_cast<void   (*)(void *)>(interpose_symbol( "free", nullptr ));
+                        if( passes_cnt > 0 ) passes[passes_cnt - 1].frees++;
+                        return __free( ptr );
+                }
+                void * calloc( size_t nelem, size_t size ) {
+                        static auto __calloc = reinterpret_cast<void * (*)(size_t, size_t)>(interpose_symbol( "calloc", nullptr ));
+                        if( passes_cnt > 0 ) passes[passes_cnt - 1].mallocs++;
+                        return __calloc( nelem, size );
+                }
+                void * realloc( void * ptr, size_t size ) {
+                        static auto __realloc = reinterpret_cast<void * (*)(void *, size_t)>(interpose_symbol( "realloc", nullptr ));
+                        void * s = __realloc( ptr, size );
+                        if ( s != ptr && passes_cnt > 0 ) {                     // did realloc get new storage ?
+                                passes[passes_cnt - 1].mallocs++;
+                                passes[passes_cnt - 1].frees++;
+                        } // if
+                        return s;
+                }
+        }
+#endif
+}

src/Common/Heap.h

-              r7d0a3ba
+              r358cba0
 // Heap.h --
 //
 // Author           : Peter A. Buhr
 // Created On       :
+// Author           : Thierry Delisle
+// Created On       : Thu May  3 16:16:10 2018
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Thu May  3 16:16:10 2018
 // Update Count     : 2
+// Last Modified On : Fri May  4 14:34:08 2018
+// Update Count     : 3
 //
 …
 namespace HeapStats {
   void newPass( const char * const name );
   void printStats();
+        void newPass( const char * const name );
+        void printStats();
+}

src/Common/PassVisitor.proto.h

-              r7d0a3ba
+              r358cba0
         operator bool() { return m_ref ? *m_ref : true; }
         bool operator=( bool val ) { return *m_ref = val; }
+        bool operator=( bool val ) { assert(m_ref); return *m_ref = val; }
 private:
 …
         friend class ChildrenGuard;
         bool * set( bool & val ) {
+        bool * set( bool * val ) {
                 bool * prev = m_ref;
                 m_ref = &val;
+                m_ref = val;
                 return prev;
+        }
 …
         ChildrenGuard( bool_ref * ref )
                 : m_val ( true )
                 , m_prev( ref ? ref->set( m_val ) : nullptr )
+                , m_prev( ref ? ref->set( &m_val ) : nullptr )
                 , m_ref ( ref )
         {}
 …
         ~ChildrenGuard() {
                 if( m_ref ) {
                         m_ref->set( *m_prev );
+                        m_ref->set( m_prev );
+                }
+        }

src/Common/utility.h

-              r7d0a3ba
+              r358cba0
 // Created On       : Mon May 18 07:44:20 2015
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Thu May  3 12:18:31 2018
 // Update Count     : 39
+// Last Modified On : Sun May  6 22:24:16 2018
+// Update Count     : 40
 //
 …
 template<typename T>
 inline
 #if __GNUC__ > 4
+#if defined(__GNUC__) && __GNUC__ > 4
 constexpr
 #endif

src/Parser/parser.yy

-              r7d0a3ba
+              r358cba0
 // Created On       : Sat Sep  1 20:22:55 2001
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Thu May  3 08:20:09 2018
 // Update Count     : 3225
+// Last Modified On : Fri May 11 17:51:38 2018
+// Update Count     : 3261
 //
 …
 %type<decl> field_declaration field_declaration_list field_declarator field_declaring_list
 %type<en> field field_list field_name fraction_constants
+%type<en> field field_list field_name fraction_constants_opt
 %type<decl> external_function_definition function_definition function_array function_declarator function_no_ptr function_ptr
 …
         | type_name '.' no_attr_identifier                                      // CFA, nested type
                 { SemanticError( yylloc, "Qualified names are currently unimplemented." ); $$ = nullptr; }
+//              { $$ = nullptr; }
         | type_name '.' '[' push field_list pop ']'                     // CFA, nested type / tuple field selector
                 { SemanticError( yylloc, "Qualified names are currently unimplemented." ); $$ = nullptr; }
+//              { $$ = nullptr; }
         | GENERIC '(' assignment_expression ',' generic_assoc_list ')' // C11
                 { SemanticError( yylloc, "_Generic is currently unimplemented." ); $$ = nullptr; }
 …
         | postfix_expression '.' no_attr_identifier
                 { $$ = new ExpressionNode( build_fieldSel( $1, build_varref( $3 ) ) ); }
+        | postfix_expression '.' INTEGERconstant                        // CFA, tuple index
+                { $$ = new ExpressionNode( build_fieldSel( $1, build_constantInteger( *$3 ) ) ); }
+        | postfix_expression FLOATING_FRACTIONconstant          // CFA, tuple index
+                { $$ = new ExpressionNode( build_fieldSel( $1, build_field_name_FLOATING_FRACTIONconstant( *$2 ) ) ); }
         | postfix_expression '.' '[' push field_list pop ']' // CFA, tuple field selector
                 { $$ = new ExpressionNode( build_fieldSel( $1, build_tuple( $5 ) ) ); }
-        | postfix_expression FLOATING_FRACTIONconstant          // CFA, tuple index
-                { $$ = new ExpressionNode( build_fieldSel( $1, build_field_name_FLOATING_FRACTIONconstant( *$2 ) ) ); }
         | postfix_expression ARROW no_attr_identifier
+                {
                         $$ = new ExpressionNode( build_pfieldSel( $1, *$3 == "0" || *$3 == "1" ? build_constantInteger( *$3 ) : build_varref( $3 ) ) );
+                }
-        | postfix_expression ARROW '[' push field_list pop ']' // CFA, tuple field selector
-                        { $$ = new ExpressionNode( build_pfieldSel( $1, build_tuple( $5 ) ) ); }
         | postfix_expression ARROW INTEGERconstant                      // CFA, tuple index
                 { $$ = new ExpressionNode( build_pfieldSel( $1, build_constantInteger( *$3 ) ) ); }
+        | postfix_expression ARROW '[' push field_list pop ']' // CFA, tuple field selector
+                { $$ = new ExpressionNode( build_pfieldSel( $1, build_tuple( $5 ) ) ); }
         | postfix_expression ICR
                 { $$ = new ExpressionNode( build_unary_ptr( OperKinds::IncrPost, $1 ) ); }
 …
 field_name:
         INTEGERconstant fraction_constants
+        INTEGERconstant fraction_constants_opt
                 { $$ = new ExpressionNode( build_field_name_fraction_constants( build_constantInteger( *$1 ), $2 ) ); }
         | FLOATINGconstant fraction_constants
+        | FLOATINGconstant fraction_constants_opt
                 { $$ = new ExpressionNode( build_field_name_fraction_constants( build_field_name_FLOATINGconstant( *$1 ), $2 ) ); }
         | no_attr_identifier fraction_constants
+        | no_attr_identifier fraction_constants_opt
+                {
                         $$ = new ExpressionNode( build_field_name_fraction_constants( build_varref( $1 ), $2 ) );
 …
+        ;
 fraction_constants:
+fraction_constants_opt:
         // empty
                 { $$ = nullptr; }
         | fraction_constants FLOATING_FRACTIONconstant
+        | fraction_constants_opt FLOATING_FRACTIONconstant
+                {
                         Expression * constant = build_field_name_FLOATING_FRACTIONconstant( *$2 );
 …
 external_definition_list:
         external_definition
+        | external_definition_list { forall = xxx; } push external_definition
+        | external_definition_list
+                { forall = xxx; }
+          push external_definition
                 { $$ = $1 ? $1->appendList( $4 ) : $4; }
+        ;
 …
+                {
                         for ( DeclarationNode * iter = $5; iter != nullptr; iter = (DeclarationNode *)iter->get_next() ) {
+                                iter->addQualifiers( $1->clone() );
+                                if ( isMangled( iter->linkage ) ) {             // ignore extern "C"
+                                        iter->addQualifiers( $1->clone() );
+                                } // if
                         } // for
                         xxx = false;
 …
+                {
                         for ( DeclarationNode * iter = $5; iter != nullptr; iter = (DeclarationNode *)iter->get_next() ) {
+                                iter->addQualifiers( $1->clone() );
+                                if ( isMangled( iter->linkage ) ) {             // ignore extern "C"
+                                        iter->addQualifiers( $1->clone() );
+                                } // if
                         } // for
                         xxx = false;
 …
+                {
                         for ( DeclarationNode * iter = $6; iter != nullptr; iter = (DeclarationNode *)iter->get_next() ) {
+                                iter->addQualifiers( $1->clone() );
+                                iter->addQualifiers( $2->clone() );
+                                if ( isMangled( iter->linkage ) && isMangled( $2->linkage ) ) { // ignore extern "C"
+                                        iter->addQualifiers( $1->clone() );
+                                        iter->addQualifiers( $2->clone() );
+                                } // if
                         } // for
                         xxx = false;

src/benchmark/Makefile.am

r7d0a3ba	r358cba0
43	43
44	44	%.runquiet :
45		@+make $(basename $@)
	45	@+make $(basename $@) CFLAGS="-w"
46	46	@taskset -c 1 ./a.out
47	47	@rm -f a.out

src/benchmark/Makefile.in

r7d0a3ba	r358cba0
459	459
460	460	%.runquiet :
461		@+make $(basename $@)
	461	@+make $(basename $@) CFLAGS="-w"
462	462	@taskset -c 1 ./a.out
463	463	@rm -f a.out

src/driver/cc1.cc

-              r7d0a3ba
+              r358cba0
 // Created On       : Fri Aug 26 14:23:51 2005
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Wed Jan 18 08:14:21 2017
 // Update Count     : 81
+// Last Modified On : Sat May 12 16:11:53 2018
+// Update Count     : 94
 //
 …
 string compiler_name( CFA_BACKEND_CC );                                 // path/name of C compiler
+string D__GCC_X__( "-D__GCC_X__=" );
 string D__GCC_BPREFIX__( "-D__GCC_BPREFIX__=" );
 string D__CFA_FLAGPREFIX__( "-D__CFA_FLAG__=" );
 …
                                 cargs[ncargs] = ( *new string( string( argv[i + 1] ).substr( D__CFA_FLAGPREFIX__.size() - 2 ) ) ).c_str();
                                 ncargs += 1;
+                                i += 1;                                                                 // and the argument
+                        } else if ( prefix( arg, D__GCC_X__ ) ) {
+                                args[nargs] = "-x";
+                                nargs += 1;
+                                args[nargs] = ( *new string( arg.substr( D__GCC_X__.size() ) ) ).c_str(); // pass the flag along
+                                nargs += 1;
+                        } else if ( arg == "-D" && prefix( argv[i + 1], D__GCC_X__.substr(2) ) ) {
+                                args[nargs] = "-x";
+                                nargs += 1;
+                                args[nargs] = ( *new string( string( argv[i + 1] ).substr( D__GCC_X__.size() - 2 ) ) ).c_str(); // pass the flag along
+                                nargs += 1;
                                 i += 1;                                                                 // and the argument
                         } else if ( prefix( arg, D__GCC_BPREFIX__ ) ) {

src/driver/cfa.cc

-              r7d0a3ba
+              r358cba0
 // Created On       : Tue Aug 20 13:44:49 2002
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Wed May  2 17:57:43 2018
 // Update Count     : 224
+// Last Modified On : Mon May 14 07:52:50 2018
+// Update Count     : 243
 //
 …
                                 args[nargs] = argv[i];                                  // pass the argument along
                                 nargs += 1;
                         } else if ( prefix( arg, "-std=" ) ) {
+                        } else if ( prefix( arg, "-std=" ) || prefix( arg, "--std=" ) ) {
                                 std_flag = true;                                                // -std=XX provided
                                 args[nargs] = argv[i];                                  // pass the argument along
+                                nargs += 1;
+                        } else if ( arg == "-x" ) {                                     // lost so force along
+                                args[nargs] = argv[i];                                  // pass the argument along
+                                nargs += 1;
+                                i += 1;                                                                 // advance to argument
+                                args[nargs] = argv[i];                                  // pass the argument along
+                                nargs += 1;
+                                args[nargs] = ( *new string( string("-D__GCC_X__=") + argv[i] ) ).c_str(); // add the argument for -x
+                                nargs += 1;
+                        } else if ( prefix( arg, "-x" ) ) {                     // lost so force along
+                                args[nargs] = argv[i];                                  // pass the argument along
+                                nargs += 1;
+                                args[nargs] = ( *new string( string("-D__GCC_X__=") + arg.substr(2) ) ).c_str(); // add the argument for -x
                                 nargs += 1;
                         } else if ( arg == "-w" ) {
 …
         } // for
+#ifdef __x86_64__
+        args[nargs] = "-mcx16";                                                         // allow double-wide CAA
+        nargs += 1;
+#endif // __x86_64__
 #ifdef __DEBUG_H__
         cerr << "args:";
 …
         if ( link ) {
                 #if ! defined(HAVE_LIBCFA_RELEASE)
                         if( !debug ) {
+                        if ( ! debug ) {
                                 cerr << "error: Option -nodebug is unavailable, libcfa was not installed." << endl;
                                 exit( EXIT_FAILURE );
+                                }
+                        } // if
                 #endif
                 #if ! defined(HAVE_LIBCFA_DEBUG)
                         if( debug ) {
+                        if ( debug ) {
                                 cerr << "error: Option -debug is unavailable, libcfa-d was not installed." << endl;
                                 exit( EXIT_FAILURE );
+                                }
+                        } // if
                 #endif
 …
                 args[nargs] = "-L" CFA_LIBDIR;
                 nargs += 1;
                 if( debug ) {
+                if ( debug ) {
                         args[nargs] = "-lcfa-d";
                 } else {
                         args[nargs] = "-lcfa";
+                }
+                } // if
                 nargs += 1;
                 args[nargs] = "-lpthread";

src/libcfa/bits/containers.h

-              r7d0a3ba
+              r358cba0
 #endif
+//-----------------------------------------------------------------------------
+// Doubly Linked List
+//-----------------------------------------------------------------------------
+#ifdef __cforall // Cforall view: list is generic over the node type
+        forall(dtype TYPE | sized(TYPE))
+        #define T TYPE
+        #define __getter_t * [T * & next, T * & prev] ( T & )
+#else // plain C view: same layout with the node type and accessor type erased
+        typedef void (*__generit_c_getter_t)();
+        #define T void
+        #define __getter_t __generit_c_getter_t
+#endif
+struct __dllist {
+        T * head;                       // first node; set to NULL by remove() when the last node is taken out
+        __getter_t __get;               // accessor: given a node, yields references to its next and prev links
+};
+#undef T
+#undef __getter_t
+#ifdef __cforall // __dllist_t(T) spells the list type in whichever language includes this header
+#define __dllist_t(T) __dllist(T)
+#else
+#define __dllist_t(T) struct __dllist
+#endif
+#ifdef __cforall
+        forall(dtype T | sized(T))
+        static inline [void] ?{}( __dllist(T) & this, * [T * & next, T * & prev] ( T & ) __get ) { // constructor: empty list using the given link accessor
+                this.head{ NULL };      // no nodes yet
+                this.__get = __get;     // remember how to reach a node's next/prev links
+        }
+        #define _next .0 // first element of the tuple returned by __get
+        #define _prev .1 // second element of the tuple returned by __get
+        forall(dtype T | sized(T))
+        static inline void push_front( __dllist(T) & this, T & node ) with( this ) { // insert node before the current head and make it the new head
+                if ( head ) {           // non-empty list: splice node in between head's predecessor and head
+                        __get( node )_next = head;
+                        __get( node )_prev = __get( *head )_prev;
+                        // inserted node must be consistent before it is seen
+                        // prevent code movement across barrier
+                        asm( "" : : : "memory" );
+                        __get( *head )_prev = &node;            // old head now points back at node
+                        T & prev = *__get( node )_prev;         // node's predecessor (the old predecessor of head)
+                        __get( prev )_next = &node;             // predecessor now points forward at node
+                }
+                else {                  // empty list: a single node links to itself in both directions
+                        __get( node )_next = &node;
+                        __get( node )_prev = &node;
+                }
+                // prevent code movement across barrier
+                asm( "" : : : "memory" );
+                head = &node;           // publish node as the new head only after its links are set
+        }
+        forall(dtype T | sized(T))
+        static inline void remove( __dllist(T) & this, T & node ) with( this ) { // unlink node from the list and clear its link fields
+                if ( &node == head ) {  // removing the head: pick a replacement first
+                        if ( __get( *head )_next == head ) {    // head links to itself => it is the only node
+                                head = NULL;
+                        }
+                        else {
+                                head = __get( *head )_next;     // successor becomes the new head
+                        }
+                }
+                __get( *__get( node )_next )_prev = __get( node )_prev; // successor skips back over node
+                __get( *__get( node )_prev )_next = __get( node )_next; // predecessor skips forward over node
+                __get( node )_next = NULL;      // node no longer refers to the list
+                __get( node )_prev = NULL;
+        }
+        #undef _next
+        #undef _prev
+#endif
 //-----------------------------------------------------------------------------
 // Tools

src/libcfa/concurrency/coroutine

-              r7d0a3ba
+              r358cba0
 // Suspend implementation inlined for performance
 static inline void suspend() {
+        coroutine_desc * src = TL_GET( this_coroutine );                        // optimization
+        // optimization : read TLS once and reuse it
+        // Safety note: this is preemption safe since if
+        // preemption occurs after this line, the pointer
+        // will also migrate which means this value will
+        // stay in sync with the TLS
+        coroutine_desc * src = TL_GET( this_coroutine );
         assertf( src->last != 0,
 …
 forall(dtype T | is_coroutine(T))
 static inline void resume(T & cor) {
+        coroutine_desc * src = TL_GET( this_coroutine );                        // optimization
+        // optimization : read TLS once and reuse it
+        // Safety note: this is preemption safe since if
+        // preemption occurs after this line, the pointer
+        // will also migrate which means this value will
+        // stay in sync with the TLS
+        coroutine_desc * src = TL_GET( this_coroutine );
         coroutine_desc * dst = get_coroutine(cor);
 …
                 dst->last = src;
                 dst->starter = dst->starter ? dst->starter : src;
         } // if
+        }
         // always done for performance testing
 …
 static inline void resume(coroutine_desc * dst) {
+        coroutine_desc * src = TL_GET( this_coroutine );                        // optimization
+        // optimization : read TLS once and reuse it
+        // Safety note: this is preemption safe since if
+        // preemption occurs after this line, the pointer
+        // will also migrate which means this value will
+        // stay in sync with the TLS
+        coroutine_desc * src = TL_GET( this_coroutine );
         // not resuming self ?
 …
                 // set last resumer
                 dst->last = src;
         } // if
+        }
         // always done for performance testing

src/libcfa/concurrency/coroutine.c

-              r7d0a3ba
+              r358cba0
 // Wrapper for co
 void CoroutineCtxSwitch(coroutine_desc* src, coroutine_desc* dst) {
+      verify( TL_GET( preemption_state ).enabled || TL_GET( this_processor )->do_terminate );
+      // Safety note : This could cause some false positives due to preemption
+      verify( TL_GET( preemption_state.enabled ) || TL_GET( this_processor )->do_terminate );
       disable_interrupts();
 …
       // set new coroutine that task is executing
       TL_SET( this_coroutine, dst );
+      kernelTLS.this_coroutine = dst;
       // context switch to specified coroutine
 …
       enable_interrupts( __cfaabi_dbg_ctx );
+      verify( TL_GET( preemption_state ).enabled || TL_GET( this_processor )->do_terminate );
+      // Safety note : This could cause some false positives due to preemption
+      verify( TL_GET( preemption_state.enabled ) || TL_GET( this_processor )->do_terminate );
 } //ctxSwitchDirect

src/libcfa/concurrency/invoke.c

r7d0a3ba	r358cba0
69	69	// Fetch the thread handle from the user defined thread structure
70	70	struct thread_desc* thrd = get_thread( this );
	71	thrd->self_cor.last = NULL;
71	72
72	73	// Officially start the thread by enabling preemption

src/libcfa/concurrency/invoke.h

-              r7d0a3ba
+              r358cba0
 #include "bits/locks.h"
 #define TL_GET( member ) kernelThreadData.member
 #define TL_SET( member, value ) kernelThreadData.member = value;
+#define TL_GET( member ) kernelTLS.member
+#define TL_SET( member, value ) kernelTLS.member = value;
 #ifdef __cforall
 …
                                 volatile bool in_progress;
                         } preemption_state;
                 } kernelThreadData;
+                } kernelTLS;
+        }
         static inline struct coroutine_desc * volatile active_coroutine() { return TL_GET( this_coroutine ); }
         static inline struct thread_desc * volatile active_thread() { return TL_GET( this_thread ); }
         static inline struct processor * volatile active_processor() { return TL_GET( this_processor ); }
+        static inline struct thread_desc    * volatile active_thread   () { return TL_GET( this_thread    ); }
+        static inline struct processor      * volatile active_processor() { return TL_GET( this_processor ); } // UNSAFE
         #endif
 …
                 struct thread_desc * next;
+                __cfaabi_dbg_debug_do(
+                        // intrusive link fields for debugging
+                        struct thread_desc * dbg_next;
+                        struct thread_desc * dbg_prev;
+                )
+                struct {
+                        struct thread_desc * next;
+                        struct thread_desc * prev;
+                } node;
      };
 …
                 static inline thread_desc * & get_next( thread_desc & this ) {
                         return this.next;
+                }
+                static inline [thread_desc *&, thread_desc *& ] __get( thread_desc & this ) { // accessor for the thread's list-link fields
+                        return this.node.[next, prev]; // tuple of references to node.next and node.prev, in that order
+                }

src/libcfa/concurrency/kernel

-              r7d0a3ba
+              r358cba0
 //-----------------------------------------------------------------------------
+// Cluster
+struct cluster {
+        // Ready queue locks
+        __spinlock_t ready_queue_lock;
+// Processor
+extern struct cluster * mainCluster;
-        // Ready queue for threads
-        __queue_t(thread_desc) ready_queue;
-        // Name of the cluster
-        const char * name;
-        // Preemption rate on this cluster
-        Duration preemption_rate;
-};
-extern struct cluster * mainCluster;
-extern Duration default_preemption();
-void ?{} (cluster & this, const char * name, Duration preemption_rate);
-void ^?{}(cluster & this);
-static inline void ?{} (cluster & this)                           { this{"Anonymous Cluster", default_preemption()}; }
-static inline void ?{} (cluster & this, Duration preemption_rate) { this{"Anonymous Cluster", preemption_rate}; }
-static inline void ?{} (cluster & this, const char * name)        { this{name, default_preemption()}; }
-//-----------------------------------------------------------------------------
-// Processor
 enum FinishOpCode { No_Action, Release, Schedule, Release_Schedule, Release_Multi, Release_Multi_Schedule };
 …
         // Cluster from which to get threads
         cluster * cltr;
+        struct cluster * cltr;
         // Name of the processor
 …
         bool pending_preemption;
+        // Idle lock
+        // Link lists fields
+        struct {
+                struct processor * next;
+                struct processor * prev;
+        } node;
 #ifdef __CFA_DEBUG__
         // Last function to enable preemption on this processor
 …
 };
 void  ?{}(processor & this, const char * name, cluster & cltr);
+void  ?{}(processor & this, const char * name, struct cluster & cltr);
 void ^?{}(processor & this);
 static inline void  ?{}(processor & this)                    { this{ "Anonymous Processor", *mainCluster}; }
 static inline void  ?{}(processor & this, cluster & cltr)    { this{ "Anonymous Processor", cltr}; }
+static inline void  ?{}(processor & this, struct cluster & cltr)    { this{ "Anonymous Processor", cltr}; }
 static inline void  ?{}(processor & this, const char * name) { this{name, *mainCluster }; }
+static inline [processor *&, processor *& ] __get( processor & this ) { // accessor for the processor's list-link fields
+        return this.node.[next, prev]; // tuple of references to node.next and node.prev, in that order
+}
+//-----------------------------------------------------------------------------
+// Cluster
+struct cluster {
+        // Spinlock taken around accesses to ready_queue
+        __spinlock_t ready_queue_lock;
+        // Ready queue for threads
+        __queue_t(thread_desc) ready_queue;
+        // Name of the cluster
+        const char * name;
+        // Preemption rate on this cluster
+        Duration preemption_rate;
+        // Lists of processors (procs, idles); proc_list_lock presumably guards them -- TODO confirm, no live code takes the lock yet
+        __spinlock_t proc_list_lock;
+        __dllist_t(struct processor) procs;
+        __dllist_t(struct processor) idles;
+        // Intrusive doubly-linked-list fields, exposed by reference through __get( cluster & )
+        struct {
+                cluster * next;
+                cluster * prev;
+        } node;
+};
+extern Duration default_preemption(); // supplies the preemption rate when a constructor is not given one
+void ?{} (cluster & this, const char * name, Duration preemption_rate); // primary constructor; the inline overloads below forward to it
+void ^?{}(cluster & this); // destructor
+static inline void ?{} (cluster & this)                           { this{"Anonymous Cluster", default_preemption()}; } // default name, default rate
+static inline void ?{} (cluster & this, Duration preemption_rate) { this{"Anonymous Cluster", preemption_rate}; } // default name, explicit rate
+static inline void ?{} (cluster & this, const char * name)        { this{name, default_preemption()}; } // explicit name, default rate
+static inline [cluster *&, cluster *& ] __get( cluster & this ) { // accessor for the cluster's list-link fields
+        return this.node.[next, prev]; // tuple of references to node.next and node.prev, in that order
+}
 // Local Variables: //

src/libcfa/concurrency/kernel.c

-              r7d0a3ba
+              r358cba0
 thread_desc * mainThread;
+struct { __dllist_t(thread_desc) list; __spinlock_t lock; } global_threads ; // list of thread_desc plus a spinlock; both members are constructed in kernel_startup
+struct { __dllist_t(cluster    ) list; __spinlock_t lock; } global_clusters; // list of cluster plus a spinlock; both members are constructed in kernel_startup
 //-----------------------------------------------------------------------------
 // Global state
 …
 // volatile thread_local unsigned short disable_preempt_count = 1;
 thread_local struct KernelThreadData kernelThreadData = {
+thread_local struct KernelThreadData kernelTLS = {
         NULL,
         NULL,
 …
         self_mon_p = &self_mon;
         next = NULL;
+        __cfaabi_dbg_debug_do(
+                dbg_next = NULL;
+                dbg_prev = NULL;
+                __cfaabi_dbg_thread_register(&this);
+        )
+        node.next = NULL;
+        node.prev = NULL;
+        doregister(this);
         monitors{ &self_mon_p, 1, (fptr_t)0 };
 …
                 terminate(&this);
                 verify(this.do_terminate);
                 verify(TL_GET( this_processor ) != &this);
+                verify( kernelTLS.this_processor != &this);
                 P( terminated );
                 verify(TL_GET( this_processor ) != &this);
+                verify( kernelTLS.this_processor != &this);
                 pthread_join( kernel_thread, NULL );
+        }
 …
         ready_queue{};
         ready_queue_lock{};
+        procs{ __get };
+        idles{ __get };
+        doregister(this);
+}
 void ^?{}(cluster & this) {
+        unregister(this);
+}
 …
         __cfaabi_dbg_print_safe("Kernel : core %p starting\n", this);
+        doregister(this->cltr, this);
+        {
                 // Setup preemption data
 …
                         if(readyThread)
+                        {
                                 verify( ! TL_GET( preemption_state ).enabled );
+                                verify( ! kernelTLS.preemption_state.enabled );
                                 runThread(this, readyThread);
                                 verify( ! TL_GET( preemption_state ).enabled );
+                                verify( ! kernelTLS.preemption_state.enabled );
                                 //Some actions need to be taken from the kernel
 …
+        }
+        unregister(this->cltr, this);
         V( this->terminated );
 …
+}
+// KERNEL ONLY
 // runThread runs a thread by context switching
 // from the processor coroutine to the target thread
 …
         coroutine_desc * thrd_cor = dst->curr_cor;
         //Reset the terminating actions here
+        // Reset the terminating actions here
         this->finish.action_code = No_Action;
         //Update global state
         TL_SET( this_thread, dst );
+        // Update global state
+        kernelTLS.this_thread = dst;
         // Context Switch to the thread
 …
+}
+// KERNEL_ONLY
 void returnToKernel() {
         coroutine_desc * proc_cor = get_coroutine(TL_GET( this_processor )->runner);
         coroutine_desc * thrd_cor = TL_GET( this_thread )->curr_cor = TL_GET( this_coroutine );
+        coroutine_desc * proc_cor = get_coroutine(kernelTLS.this_processor->runner);
+        coroutine_desc * thrd_cor = kernelTLS.this_thread->curr_cor = kernelTLS.this_coroutine;
         ThreadCtxSwitch(thrd_cor, proc_cor);
+}
+// KERNEL_ONLY
 // Once a thread has finished running, some of
 // its final actions must be executed from the kernel
 void finishRunning(processor * this) with( this->finish ) {
         if( action_code == Release ) {
                 verify( ! TL_GET( preemption_state ).enabled );
+                verify( ! kernelTLS.preemption_state.enabled );
                 unlock( *lock );
+        }
 …
+        }
         else if( action_code == Release_Schedule ) {
                 verify( ! TL_GET( preemption_state ).enabled );
+                verify( ! kernelTLS.preemption_state.enabled );
                 unlock( *lock );
                 ScheduleThread( thrd );
+        }
         else if( action_code == Release_Multi ) {
                 verify( ! TL_GET( preemption_state ).enabled );
+                verify( ! kernelTLS.preemption_state.enabled );
                 for(int i = 0; i < lock_count; i++) {
                         unlock( *locks[i] );
 …
+}
+// KERNEL_ONLY
 // Context invoker for processors
 // This is the entry point for processors (kernel threads)
 …
 void * CtxInvokeProcessor(void * arg) {
         processor * proc = (processor *) arg;
         TL_SET( this_processor, proc );
         TL_SET( this_coroutine, NULL );
         TL_SET( this_thread, NULL );
         TL_GET( preemption_state ).[enabled, disable_count] = [false, 1];
+        kernelTLS.this_processor = proc;
+        kernelTLS.this_coroutine = NULL;
+        kernelTLS.this_thread    = NULL;
+        kernelTLS.preemption_state.[enabled, disable_count] = [false, 1];
         // SKULLDUGGERY: We want to create a context for the processor coroutine
         // which is needed for the 2-step context switch. However, there is no reason
 …
         //Set global state
         TL_SET( this_coroutine, get_coroutine(proc->runner) );
         TL_SET( this_thread, NULL );
+        kernelTLS.this_coroutine = get_coroutine(proc->runner);
+        kernelTLS.this_thread    = NULL;
         //We now have a proper context from which to schedule threads
 …
+}
+// KERNEL_ONLY
 void kernel_first_resume(processor * this) {
         coroutine_desc * src = TL_GET( this_coroutine );
+        coroutine_desc * src = kernelTLS.this_coroutine;
         coroutine_desc * dst = get_coroutine(this->runner);
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         create_stack(&dst->stack, dst->stack.size);
         CtxStart(&this->runner, CtxInvokeCoroutine);
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         dst->last = src;
 …
         // set new coroutine that task is executing
         TL_SET( this_coroutine, dst );
+        kernelTLS.this_coroutine = dst;
         // SKULLDUGGERY normally interrupts are enabled before leaving a coroutine ctxswitch.
 …
         src->state = Active;
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
+}
 //-----------------------------------------------------------------------------
 // Scheduler routines
+// KERNEL ONLY
 void ScheduleThread( thread_desc * thrd ) {
-        // if( ! thrd ) return;
         verify( thrd );
         verify( thrd->self_cor.state != Halted );
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         verifyf( thrd->next == NULL, "Expected null got %p", thrd->next );
 …
+        }
+        verify( ! TL_GET( preemption_state ).enabled );
+}
+        verify( ! kernelTLS.preemption_state.enabled );
+}
+// KERNEL ONLY
 thread_desc * nextThread(cluster * this) with( *this ) {
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         lock( ready_queue_lock __cfaabi_dbg_ctx2 );
         thread_desc * head = pop_head( ready_queue );
         unlock( ready_queue_lock );
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         return head;
+}
 …
 void BlockInternal() {
         disable_interrupts();
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         returnToKernel();
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         enable_interrupts( __cfaabi_dbg_ctx );
+}
 …
 void BlockInternal( __spinlock_t * lock ) {
         disable_interrupts();
         with( *TL_GET( this_processor ) ) {
+        with( *kernelTLS.this_processor ) {
                 finish.action_code = Release;
                 finish.lock        = lock;
+        }
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         returnToKernel();
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         enable_interrupts( __cfaabi_dbg_ctx );
 …
 void BlockInternal( thread_desc * thrd ) {
         disable_interrupts();
         with( *TL_GET( this_processor ) ) {
+        with( * kernelTLS.this_processor ) {
                 finish.action_code = Schedule;
                 finish.thrd        = thrd;
+        }
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         returnToKernel();
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         enable_interrupts( __cfaabi_dbg_ctx );
 …
         assert(thrd);
         disable_interrupts();
         with( *TL_GET( this_processor ) ) {
+        with( * kernelTLS.this_processor ) {
                 finish.action_code = Release_Schedule;
                 finish.lock        = lock;
 …
+        }
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         returnToKernel();
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         enable_interrupts( __cfaabi_dbg_ctx );
 …
 void BlockInternal(__spinlock_t * locks [], unsigned short count) {
         disable_interrupts();
         with( *TL_GET( this_processor ) ) {
+        with( * kernelTLS.this_processor ) {
                 finish.action_code = Release_Multi;
                 finish.locks       = locks;
 …
+        }
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         returnToKernel();
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         enable_interrupts( __cfaabi_dbg_ctx );
 …
 void BlockInternal(__spinlock_t * locks [], unsigned short lock_count, thread_desc * thrds [], unsigned short thrd_count) {
         disable_interrupts();
         with( *TL_GET( this_processor ) ) {
+        with( *kernelTLS.this_processor ) {
                 finish.action_code = Release_Multi_Schedule;
                 finish.locks       = locks;
 …
+        }
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         returnToKernel();
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         enable_interrupts( __cfaabi_dbg_ctx );
+}
+// KERNEL ONLY
 void LeaveThread(__spinlock_t * lock, thread_desc * thrd) {
         verify( ! TL_GET( preemption_state ).enabled );
         with( *TL_GET( this_processor ) ) {
+        verify( ! kernelTLS.preemption_state.enabled );
+        with( * kernelTLS.this_processor ) {
                 finish.action_code = thrd ? Release_Schedule : Release;
                 finish.lock        = lock;
 …
 // Kernel boot procedures
 void kernel_startup(void) {
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         __cfaabi_dbg_print_safe("Kernel : Starting\n");
+        global_threads. list{ __get };
+        global_threads. lock{};
+        global_clusters.list{ __get };
+        global_clusters.lock{};
         // Initialize the main cluster
 …
         //initialize the global state variables
         TL_SET( this_processor, mainProcessor );
         TL_SET( this_thread, mainThread );
         TL_SET( this_coroutine, &mainThread->self_cor );
+        kernelTLS.this_processor = mainProcessor;
+        kernelTLS.this_thread    = mainThread;
+        kernelTLS.this_coroutine = &mainThread->self_cor;
         // Enable preemption
 …
         // context. Hence, the main thread does not begin through CtxInvokeThread, like all other threads. The trick here is that
         // mainThread is on the ready queue when this call is made.
         kernel_first_resume( TL_GET( this_processor ) );
+        kernel_first_resume( kernelTLS.this_processor );
 …
         __cfaabi_dbg_print_safe("Kernel : Started\n--------------------------------------------------\n\n");
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         enable_interrupts( __cfaabi_dbg_ctx );
         verify( TL_GET( preemption_state ).enabled );
+        verify( TL_GET( preemption_state.enabled ) );
+}
 …
         __cfaabi_dbg_print_safe("\n--------------------------------------------------\nKernel : Shutting down\n");
         verify( TL_GET( preemption_state ).enabled );
+        verify( TL_GET( preemption_state.enabled ) );
         disable_interrupts();
         verify( ! TL_GET( preemption_state ).enabled );
+        verify( ! kernelTLS.preemption_state.enabled );
         // SKULLDUGGERY: Notify the mainProcessor it needs to terminate.
 …
 //=============================================================================================
+// Kernel Quiescing
+//=============================================================================================
+// void halt(processor * this) with( this ) {
+//      pthread_mutex_lock( &idle.lock );
+//      // SKULLDUGGERY: Even if spurious wake-up is a thing
+//      // spuriously waking up a kernel thread is not a big deal
+//      // if it is very rare.
+//      pthread_cond_wait( &idle.cond, &idle.lock);
+//      pthread_mutex_unlock( &idle.lock );
+// }
+// void wake(processor * this) with( this ) {
+//      pthread_mutex_lock  (&idle.lock);
+//      pthread_cond_signal (&idle.cond);
+//      pthread_mutex_unlock(&idle.lock);
+// }
+//=============================================================================================
 // Unexpected Terminating logic
 //=============================================================================================
 …
 static __spinlock_t kernel_abort_lock;
-static __spinlock_t kernel_debug_lock;
 static bool kernel_abort_called = false;
 void * kernel_abort    (void) __attribute__ ((__nothrow__)) {
+void * kernel_abort(void) __attribute__ ((__nothrow__)) {
         // abort cannot be recursively entered by the same or different processors because all signal handlers return when
         // the globalAbort flag is true.
 …
         // first task to abort ?
+        if ( ! kernel_abort_called ) {                  // not first task to abort ?
+        if ( kernel_abort_called ) {                    // not first task to abort ?
+                unlock( kernel_abort_lock );
+                sigset_t mask;
+                sigemptyset( &mask );
+                sigaddset( &mask, SIGALRM );            // block SIGALRM signals
+                sigsuspend( &mask );                    // block the processor to prevent further damage during abort
+                _exit( EXIT_FAILURE );                  // if processor unblocks before it is killed, terminate it
+        }
+        else {
                 kernel_abort_called = true;
                 unlock( kernel_abort_lock );
+        }
+        else {
+                unlock( kernel_abort_lock );
+                sigset_t mask;
+                sigemptyset( &mask );
+                sigaddset( &mask, SIGALRM );                    // block SIGALRM signals
+                sigaddset( &mask, SIGUSR1 );                    // block SIGUSR1 signals
+                sigsuspend( &mask );                            // block the processor to prevent further damage during abort
+                _exit( EXIT_FAILURE );                          // if processor unblocks before it is killed, terminate it
+        }
+        return TL_GET( this_thread );
+        return kernelTLS.this_thread;
+}
 …
         thread_desc * thrd = kernel_data;
+        int len = snprintf( abort_text, abort_text_size, "Error occurred while executing task %.256s (%p)", thrd->self_cor.name, thrd );
+        __cfaabi_dbg_bits_write( abort_text, len );
+        if ( get_coroutine(thrd) != TL_GET( this_coroutine ) ) {
+                len = snprintf( abort_text, abort_text_size, " in coroutine %.256s (%p).\n", TL_GET( this_coroutine )->name, TL_GET( this_coroutine ) );
+        if(thrd) {
+                int len = snprintf( abort_text, abort_text_size, "Error occurred while executing thread %.256s (%p)", thrd->self_cor.name, thrd );
                 __cfaabi_dbg_bits_write( abort_text, len );
+                if ( get_coroutine(thrd) != kernelTLS.this_coroutine ) {
+                        len = snprintf( abort_text, abort_text_size, " in coroutine %.256s (%p).\n", kernelTLS.this_coroutine->name, kernelTLS.this_coroutine );
+                        __cfaabi_dbg_bits_write( abort_text, len );
+                }
+                else {
+                        __cfaabi_dbg_bits_write( ".\n", 2 );
+                }
+        }
         else {
                 __cfaabi_dbg_bits_write( ".\n", 2 );
+                int len = snprintf( abort_text, abort_text_size, "Error occurred outside of any thread.\n" );
+        }
+}
 int kernel_abort_lastframe( void ) __attribute__ ((__nothrow__)) {
+        return get_coroutine(TL_GET( this_thread )) == get_coroutine(mainThread) ? 4 : 2;
+}
+        return get_coroutine(kernelTLS.this_thread) == get_coroutine(mainThread) ? 4 : 2;
+}
+static __spinlock_t kernel_debug_lock;
 extern "C" {
 …
         if ( count < 0 ) {
                 // queue current task
                 append( waiting, (thread_desc *)TL_GET( this_thread ) );
+                append( waiting, kernelTLS.this_thread );
                 // atomically release spin lock and block
 …
 //-----------------------------------------------------------------------------
+// Global Queues
+void doregister( thread_desc & thrd ) { // currently a no-op: the intended body below is disabled
+        // lock      ( global_threads.lock );
+        // push_front( global_threads.list, thrd );
+        // unlock    ( global_threads.lock );
+}
+void unregister( thread_desc & thrd ) { // currently a no-op: the intended body below is disabled
+        // lock  ( global_threads.lock );
+        // remove( global_threads.list, thrd );
+        // unlock( global_threads.lock );
+}
+void doregister( cluster     & cltr ) { // currently a no-op: the intended body below is disabled
+        // lock      ( global_clusters.lock );
+        // push_front( global_clusters.list, cltr );
+        // unlock    ( global_clusters.lock );
+}
+void unregister( cluster     & cltr ) { // currently a no-op: the intended body below is disabled
+        // lock  ( global_clusters.lock );
+        // remove( global_clusters.list, cltr );
+        // unlock( global_clusters.lock );
+}
+void doregister( cluster * cltr, processor * proc ) { // currently a no-op: the intended body below is disabled
+        // lock      (cltr->proc_list_lock __cfaabi_dbg_ctx2);
+        // push_front(cltr->procs, *proc);
+        // unlock    (cltr->proc_list_lock);
+}
+void unregister( cluster * cltr, processor * proc ) { // currently a no-op: the intended body below is disabled
+        // lock  (cltr->proc_list_lock __cfaabi_dbg_ctx2);
+        // remove(cltr->procs, *proc );
+        // unlock(cltr->proc_list_lock);
+}
+//-----------------------------------------------------------------------------
 // Debug
 __cfaabi_dbg_debug_do(
-        struct {
-                thread_desc * tail;
-        } __cfaabi_dbg_thread_list = { NULL };
-        void __cfaabi_dbg_thread_register( thread_desc * thrd ) {
-                if( !__cfaabi_dbg_thread_list.tail ) {
-                        __cfaabi_dbg_thread_list.tail = thrd;
-                        return;
+                }
-                __cfaabi_dbg_thread_list.tail->dbg_next = thrd;
-                thrd->dbg_prev = __cfaabi_dbg_thread_list.tail;
-                __cfaabi_dbg_thread_list.tail = thrd;
+        }
-        void __cfaabi_dbg_thread_unregister( thread_desc * thrd ) {
-                thread_desc * prev = thrd->dbg_prev;
-                thread_desc * next = thrd->dbg_next;
-                if( next ) { next->dbg_prev = prev; }
-                else       {
-                        assert( __cfaabi_dbg_thread_list.tail == thrd );
-                        __cfaabi_dbg_thread_list.tail = prev;
+                }
-                if( prev ) { prev->dbg_next = next; }
-                thrd->dbg_prev = NULL;
-                thrd->dbg_next = NULL;
+        }
         void __cfaabi_dbg_record(__spinlock_t & this, const char * prev_name) {
                 this.prev_name = prev_name;
                 this.prev_thrd = TL_GET( this_thread );
+                this.prev_thrd = kernelTLS.this_thread;
+        }
+)

src/libcfa/concurrency/kernel_private.h

-              r7d0a3ba
+              r358cba0
 #define KERNEL_STORAGE(T,X) static char storage_##X[sizeof(T)]
+void doregister( struct thread_desc & thrd );
+void unregister( struct thread_desc & thrd );
+void doregister( struct cluster     & cltr );
+void unregister( struct cluster     & cltr );
+void doregister( struct cluster * cltr, struct processor * proc );
+void unregister( struct cluster * cltr, struct processor * proc );
 // Local Variables: //
 // mode: c //

src/libcfa/concurrency/monitor.c

-              r7d0a3ba
+              r358cba0
                 // Lock the monitor spinlock
                 lock( this->lock __cfaabi_dbg_ctx2 );
+                thread_desc * thrd = TL_GET( this_thread );
+                // Interrupts are disabled inside the critical section
+                thread_desc * thrd = kernelTLS.this_thread;
                 __cfaabi_dbg_print_safe( "Kernel : %10p Entering mon %p (%p)\n", thrd, this, this->owner);
 …
                 // Lock the monitor spinlock
                 lock( this->lock __cfaabi_dbg_ctx2 );
+                thread_desc * thrd = TL_GET( this_thread );
+                // Interrupts are disabled inside the critical section
+                thread_desc * thrd = kernelTLS.this_thread;
                 __cfaabi_dbg_print_safe( "Kernel : %10p Entering dtor for mon %p (%p)\n", thrd, this, this->owner);
 …
                         // Create the node specific to this wait operation
                         wait_ctx_primed( TL_GET( this_thread ), 0 )
+                        wait_ctx_primed( thrd, 0 )
                         // Some one else has the monitor, wait for him to finish and then run
 …
                         __cfaabi_dbg_print_safe( "Kernel :  blocking \n" );
                         wait_ctx( TL_GET( this_thread ), 0 )
+                        wait_ctx( thrd, 0 )
                         this->dtor_node = &waiter;
 …
                 lock( this->lock __cfaabi_dbg_ctx2 );
                 __cfaabi_dbg_print_safe( "Kernel : %10p Leaving mon %p (%p)\n", TL_GET( this_thread ), this, this->owner);
                 verifyf( TL_GET( this_thread ) == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", TL_GET( this_thread ), this->owner, this->recursion, this );
+                __cfaabi_dbg_print_safe( "Kernel : %10p Leaving mon %p (%p)\n", kernelTLS.this_thread, this, this->owner);
+                verifyf( kernelTLS.this_thread == this->owner, "Expected owner to be %p, got %p (r: %i, m: %p)", kernelTLS.this_thread, this->owner, this->recursion, this );
                 // Leaving a recursion level, decrement the counter
 …
 // Sorts monitors before entering
 void ?{}( monitor_guard_t & this, monitor_desc * m [], __lock_size_t count, fptr_t func ) {
+        thread_desc * thrd = TL_GET( this_thread );
         // Store current array
         this.m = m;
 …
         // Save previous thread context
         this.prev = TL_GET( this_thread )->monitors;
+        this.prev = thrd->monitors;
         // Update thread context (needed for conditions)
         (TL_GET( this_thread )->monitors){m, count, func};
+        (thrd->monitors){m, count, func};
         // __cfaabi_dbg_print_safe( "MGUARD : enter %d\n", count);
 …
 // Sorts monitors before entering
 void ?{}( monitor_dtor_guard_t & this, monitor_desc * m [], fptr_t func ) {
+        // optimization
+        thread_desc * thrd = TL_GET( this_thread );
         // Store current array
         this.m = *m;
         // Save previous thread context
         this.prev = TL_GET( this_thread )->monitors;
+        this.prev = thrd->monitors;
         // Update thread context (needed for conditions)
         (TL_GET( this_thread )->monitors){m, 1, func};
+        (thrd->monitors){m, 1, func};
         __enter_monitor_dtor( this.m, func );
 …
         // Create the node specific to this wait operation
         wait_ctx_primed( TL_GET( this_thread ), 0 )
+        wait_ctx_primed( kernelTLS.this_thread, 0 )
         //save contexts
 …
                                 // Create the node specific to this wait operation
                                 wait_ctx_primed( TL_GET( this_thread ), 0 );
+                                wait_ctx_primed( kernelTLS.this_thread, 0 );
                                 // Save monitor states
 …
         // Create the node specific to this wait operation
         wait_ctx_primed( TL_GET( this_thread ), 0 );
+        wait_ctx_primed( kernelTLS.this_thread, 0 );
         monitor_save;
 …
         for( __lock_size_t i = 0; i < count; i++) {
                 verify( monitors[i]->owner == TL_GET( this_thread ) );
+                verify( monitors[i]->owner == kernelTLS.this_thread );
+        }

src/libcfa/concurrency/preemption.c

-              r7d0a3ba
+              r358cba0
         // Disable interrupts by incrementing the counter
         void disable_interrupts() {
                 with( TL_GET( preemption_state ) ) {
+                with( kernelTLS.preemption_state ) {
                         enabled = false;
                         __attribute__((unused)) unsigned short new_val = disable_count + 1;
 …
         // If counter reaches 0, execute any pending CtxSwitch
         void enable_interrupts( __cfaabi_dbg_ctx_param ) {
                 processor   * proc = TL_GET( this_processor ); // Cache the processor now since interrupts can start happening after the atomic add
                 thread_desc * thrd = TL_GET( this_thread );       // Cache the thread now since interrupts can start happening after the atomic add
                 with( TL_GET( preemption_state ) ){
+                processor   * proc = kernelTLS.this_processor; // Cache the processor now since interrupts can start happening after the atomic add
+                thread_desc * thrd = kernelTLS.this_thread;       // Cache the thread now since interrupts can start happening after the atomic add
+                with( kernelTLS.preemption_state ){
                         unsigned short prev = disable_count;
                         disable_count -= 1;
 …
         // Don't execute any pending CtxSwitch even if counter reaches 0
         void enable_interrupts_noPoll() {
                 unsigned short prev = TL_GET( preemption_state ).disable_count;
                 TL_GET( preemption_state ).disable_count -= 1;
+                unsigned short prev = kernelTLS.preemption_state.disable_count;
+                kernelTLS.preemption_state.disable_count -= 1;
                 verifyf( prev != 0u, "Incremented from %u\n", prev );                     // If this triggers someone is enabled already enabled interrupts
                 if( prev == 1 ) {
                         TL_GET( preemption_state ).enabled = true;
+                        kernelTLS.preemption_state.enabled = true;
+                }
+        }
 …
+}
+// KERNEL ONLY
 // Check if a CtxSwitch signal handler should defer
 // If true  : preemption is safe
 // If false : preemption is unsafe and marked as pending
 static inline bool preemption_ready() {
+        bool ready = TL_GET( preemption_state ).enabled && !TL_GET( preemption_state ).in_progress; // Check if preemption is safe
+        TL_GET( this_processor )->pending_preemption = !ready;                  // Adjust the pending flag accordingly
+        // Check if preemption is safe
+        bool ready = kernelTLS.preemption_state.enabled && ! kernelTLS.preemption_state.in_progress;
+        // Adjust the pending flag accordingly
+        kernelTLS.this_processor->pending_preemption = !ready;
         return ready;
+}
 …
         // Start with preemption disabled until ready
         TL_GET( preemption_state ).enabled = false;
         TL_GET( preemption_state ).disable_count = 1;
+        kernelTLS.preemption_state.enabled = false;
+        kernelTLS.preemption_state.disable_count = 1;
         // Initialize the event kernel
 …
         // before the kernel thread has even started running. When that happens an iterrupt
         // we a null 'this_processor' will be caught, just ignore it.
         if(!TL_GET( this_processor )) return;
+        if(! kernelTLS.this_processor ) return;
         choose(sfp->si_value.sival_int) {
                 case PREEMPT_NORMAL   : ;// Normal case, nothing to do here
                 case PREEMPT_TERMINATE: verify(TL_GET( this_processor )->do_terminate);
+                case PREEMPT_TERMINATE: verify( kernelTLS.this_processor->do_terminate);
                 default:
                         abort( "internal error, signal value is %d", sfp->si_value.sival_int );
 …
         if( !preemption_ready() ) { return; }
+        __cfaabi_dbg_print_buffer_decl( " KERNEL: preempting core %p (%p).\n", TL_GET( this_processor ), TL_GET( this_thread ) );
+        TL_GET( preemption_state ).in_progress = true;  // Sync flag : prevent recursive calls to the signal handler
+        signal_unblock( SIGUSR1 );                          // We are about to CtxSwitch out of the signal handler, let other handlers in
+        TL_GET( preemption_state ).in_progress = false; // Clear the in progress flag
+        __cfaabi_dbg_print_buffer_decl( " KERNEL: preempting core %p (%p).\n", kernelTLS.this_processor, kernelTLS.this_thread );
+        // Sync flag : prevent recursive calls to the signal handler
+        kernelTLS.preemption_state.in_progress = true;
+        // We are about to CtxSwitch out of the signal handler, let other handlers in
+        signal_unblock( SIGUSR1 );
+        // TODO: this should go in finish action
+        // Clear the in progress flag
+        kernelTLS.preemption_state.in_progress = false;
         // Preemption can occur here
         BlockInternal( (thread_desc*)TL_GET( this_thread ) ); // Do the actual CtxSwitch
+        BlockInternal( kernelTLS.this_thread ); // Do the actual CtxSwitch
+}
 …
         // Block sigalrms to control when they arrive
         sigset_t mask;
+        sigfillset(&mask);
+        if ( pthread_sigmask( SIG_BLOCK, &mask, NULL ) == -1 ) {
+            abort( "internal error, pthread_sigmask" );
+        }
         sigemptyset( &mask );
         sigaddset( &mask, SIGALRM );
-        if ( pthread_sigmask( SIG_BLOCK, &mask, NULL ) == -1 ) {
-            abort( "internal error, pthread_sigmask" );
+        }
         // Main loop
 …
 void __cfaabi_check_preemption() {
         bool ready = TL_GET( preemption_state ).enabled;
+        bool ready = kernelTLS.preemption_state.enabled;
         if(!ready) { abort("Preemption should be ready"); }

src/libcfa/concurrency/thread.c

-              r7d0a3ba
+              r358cba0
         curr_cluster = &cl;
         next = NULL;
+        __cfaabi_dbg_debug_do(
+                dbg_next = NULL;
+                dbg_prev = NULL;
+                __cfaabi_dbg_thread_register(&this);
+        )
+        node.next = NULL;
+        node.prev = NULL;
+        doregister(this);
         monitors{ &self_mon_p, 1, (fptr_t)0 };
 …
 void ^?{}(thread_desc& this) with( this ) {
+        unregister(this);
         ^self_cor{};
+}
 …
         disable_interrupts();
         create_stack(&thrd_c->stack, thrd_c->stack.size);
         TL_SET( this_coroutine, thrd_c );
+        kernelTLS.this_coroutine = thrd_c;
         CtxStart(&this, CtxInvokeThread);
         assert( thrd_c->last->stack.context );
 …
 extern "C" {
+        // KERNEL ONLY
         void __finish_creation(void) {
                 coroutine_desc* thrd_c = TL_GET( this_coroutine );
+                coroutine_desc* thrd_c = kernelTLS.this_coroutine;
                 ThreadCtxSwitch( thrd_c, thrd_c->last );
+        }
 …
 void yield( void ) {
+        verify( TL_GET( preemption_state ).enabled );
+        // Safety note : This could cause some false positives due to preemption
+      verify( TL_GET( preemption_state.enabled ) );
         BlockInternal( TL_GET( this_thread ) );
+        verify( TL_GET( preemption_state ).enabled );
+        // Safety note : This could cause some false positives due to preemption
+      verify( TL_GET( preemption_state.enabled ) );
+}
 …
+}
+// KERNEL ONLY
 void ThreadCtxSwitch(coroutine_desc* src, coroutine_desc* dst) {
         // set state of current coroutine to inactive
 …
         // set new coroutine that the processor is executing
         // and context switch to it
         TL_SET( this_coroutine, dst );
+        kernelTLS.this_coroutine = dst;
         assert( src->stack.context );
         CtxSwitch( src->stack.context, dst->stack.context );
         TL_SET( this_coroutine, src );
+        kernelTLS.this_coroutine = src;
         // set state of new coroutine to active

src/libcfa/interpose.c

-              r7d0a3ba
+              r358cba0
 // Created On       : Wed Mar 29 16:10:31 2017
 // Last Modified By : Peter A. Buhr
+// Last Modified On : Tue May  1 15:05:35 2018
+// Update Count     : 83
+//
+#include <stdarg.h>
+#include <stddef.h>
+extern "C" {
+#include <stdio.h>
+#include <string.h>
+#include <dlfcn.h>
+#include <unistd.h>
+// Last Modified On : Sat May  5 11:37:35 2018
+// Update Count     : 111
+//
+#include <stdarg.h>                                                                             // va_start, va_end
+#include <string.h>                                                                             // strlen
+#include <unistd.h>                                                                             // _exit, getpid
 #define __USE_GNU
 #include <signal.h>
 #undef __USE_GNU
+#include <execinfo.h>
+extern "C" {
+#include <dlfcn.h>                                                                              // dlopen, dlsym
+#include <execinfo.h>                                                                   // backtrace, messages
+}
 #include "bits/debug.h"
 #include "bits/defs.h"
 #include "bits/signal.h"
 #include "startup.h"
+#include "bits/signal.h"                                                                // sigHandler_?
+#include "startup.h"                                                                    // STARTUP_PRIORITY_CORE
 //=============================================================================================
 …
 //=============================================================================================
 typedef void (*generic_fptr_t)(void);
 generic_fptr_t interpose_symbol( const char* symbol, const char *version ) {
+typedef void (* generic_fptr_t)(void);
+generic_fptr_t interpose_symbol( const char * symbol, const char * version ) {
         const char * error;
 …
         } // if
         union { generic_fptr_t fptr; void* ptr; } originalFunc;
+        union { generic_fptr_t fptr; void * ptr; } originalFunc;
         #if defined( _GNU_SOURCE )
 …
+}
+forall(dtype T)
+static inline void ptr_from_symbol( T** symbol_ptr, const char * symbol_name, const char * version) {
+        union {
+                generic_fptr_t gp;
+                T* tp;
+        } u;
+        u.gp = interpose_symbol( symbol_name, version );
+        *symbol_ptr = u.tp;
+}
+#define INTERPOSE_LIBC( x, ver ) ptr_from_symbol( (void**)&__cabi_libc.x, #x, ver)
+//=============================================================================================
+// Terminating Signals logic
+#define INTERPOSE_LIBC( x, ver ) __cabi_libc.x = (typeof(__cabi_libc.x))interpose_symbol( #x, ver )
+//=============================================================================================
+// Interposition Startup logic
 //=============================================================================================
 …
 struct {
         void (* exit)( int ) __attribute__ (( __noreturn__ ));
         void (* abort)( void ) __attribute__ (( __noreturn__ ));
+        void (* exit)( int ) __attribute__(( __noreturn__ ));
+        void (* abort)( void ) __attribute__(( __noreturn__ ));
 } __cabi_libc;
 …
                 const char *version = NULL;
+#pragma GCC diagnostic push
+#pragma GCC diagnostic ignored "-Wdiscarded-qualifiers"
                 INTERPOSE_LIBC( abort, version );
                 INTERPOSE_LIBC( exit , version );
+                __cfaabi_sigaction( SIGSEGV, sigHandler_segv , SA_SIGINFO ); // Failure handler
+                __cfaabi_sigaction( SIGBUS , sigHandler_segv , SA_SIGINFO ); // Failure handler
+                __cfaabi_sigaction( SIGILL , sigHandler_ill  , SA_SIGINFO ); // Failure handler
+                __cfaabi_sigaction( SIGFPE , sigHandler_fpe  , SA_SIGINFO ); // Failure handler
+                __cfaabi_sigaction( SIGABRT, sigHandler_abort, SA_SIGINFO ); // Failure handler
+                __cfaabi_sigaction( SIGTERM, sigHandler_term , SA_SIGINFO ); // Failure handler
+                __cfaabi_sigaction( SIGINT , sigHandler_term , SA_SIGINFO ); // Failure handler
+#pragma GCC diagnostic pop
+                // Failure handler
+                __cfaabi_sigaction( SIGSEGV, sigHandler_segv , SA_SIGINFO );
+                __cfaabi_sigaction( SIGBUS , sigHandler_segv , SA_SIGINFO );
+                __cfaabi_sigaction( SIGILL , sigHandler_ill  , SA_SIGINFO );
+                __cfaabi_sigaction( SIGFPE , sigHandler_fpe  , SA_SIGINFO );
+                __cfaabi_sigaction( SIGABRT, sigHandler_abort, SA_SIGINFO | SA_RESETHAND);
+                __cfaabi_sigaction( SIGTERM, sigHandler_term , SA_SIGINFO );
+                __cfaabi_sigaction( SIGINT , sigHandler_term , SA_SIGINFO );
+        }
+}
 …
 // Forward declare abort after the __typeof__ call to avoid ambiguities
 void exit( int status, const char fmt[], ... ) __attribute__ (( format(printf, 2, 3), __nothrow__, __leaf__, __noreturn__ ));
 void abort( const char fmt[], ... ) __attribute__ (( format(printf, 1, 2), __nothrow__, __leaf__, __noreturn__ ));
+void exit( int status, const char fmt[], ... ) __attribute__(( format(printf, 2, 3), __nothrow__, __leaf__, __noreturn__ ));
+void abort( const char fmt[], ... ) __attribute__(( format(printf, 1, 2), __nothrow__, __leaf__, __noreturn__ ));
 extern "C" {
         void abort( void ) __attribute__ (( __nothrow__, __leaf__, __noreturn__ )) {
+        void abort( void ) __attribute__(( __nothrow__, __leaf__, __noreturn__ )) {
                 abort( NULL );
+        }
         void __cabi_abort( const char fmt[], ... ) __attribute__ (( format(printf, 1, 2), __nothrow__, __leaf__, __noreturn__ )) {
+        void __cabi_abort( const char fmt[], ... ) __attribute__(( format(printf, 1, 2), __nothrow__, __leaf__, __noreturn__ )) {
                 va_list argp;
                 va_start( argp, fmt );
 …
+        }
         void exit( int status ) __attribute__ (( __nothrow__, __leaf__, __noreturn__ )) {
+        void exit( int status ) __attribute__(( __nothrow__, __leaf__, __noreturn__ )) {
                 __cabi_libc.exit( status );
+        }
+}
 void * kernel_abort    ( void ) __attribute__ (( __nothrow__, __leaf__, __weak__ )) { return NULL; }
 void   kernel_abort_msg( void * data, char * buffer, int size ) __attribute__ (( __nothrow__, __leaf__, __weak__ )) {}
 int kernel_abort_lastframe( void ) __attribute__ (( __nothrow__, __leaf__, __weak__ )) { return 4; }
+void * kernel_abort    ( void ) __attribute__(( __nothrow__, __leaf__, __weak__ )) { return NULL; }
+void   kernel_abort_msg( void * data, char * buffer, int size ) __attribute__(( __nothrow__, __leaf__, __weak__ )) {}
+int kernel_abort_lastframe( void ) __attribute__(( __nothrow__, __leaf__, __weak__ )) { return 4; }
 enum { abort_text_size = 1024 };
 …
 static int abort_lastframe;
 void exit( int status, const char fmt[], ... ) __attribute__ (( format(printf, 2, 3), __nothrow__, __leaf__, __noreturn__ )) {
+void exit( int status, const char fmt[], ... ) __attribute__(( format(printf, 2, 3), __nothrow__, __leaf__, __noreturn__ )) {
     va_list args;
     va_start( args, fmt );
 …
+}
 void abort( const char fmt[], ... ) __attribute__ (( format(printf, 1, 2), __nothrow__, __leaf__, __noreturn__ )) {
+void abort( const char fmt[], ... ) __attribute__(( format(printf, 1, 2), __nothrow__, __leaf__, __noreturn__ )) {
         void * kernel_data = kernel_abort();                    // must be done here to lock down kernel
         int len;

src/libcfa/stdlib

-              r7d0a3ba
+              r358cba0
 // Created On       : Thu Jan 28 17:12:35 2016
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Tue Jan  2 12:21:04 2018
 // Update Count     : 292
+// Last Modified On : Sun May 13 23:22:23 2018
+// Update Count     : 299
 //
 #pragma once
+//#define _XOPEN_SOURCE 600                                                             // posix_memalign, *rand48
+#define __USE_ISOC11                                                                    // aligned_alloc
 #include <stdlib.h>                                                                             // strto*, *abs
 …
 //---------------------------------------
+// allocation, non-array types
+static inline forall( dtype T | sized(T) ) T * malloc( void ) {
+        // printf( "* malloc\n" );
+        return (T *)(void *)malloc( (size_t)sizeof(T) );        // C malloc
+} // malloc
+// static inline forall( dtype T | sized(T) ) T & malloc( void ) {
+//      int & p = *(T *)(void *)malloc( (size_t)sizeof(T) ); // C malloc
+//      printf( "& malloc %p\n", &p );
+//      return p;
+// //   return (T &)*(T *)(void *)malloc( (size_t)sizeof(T) ); // C malloc
+// } // malloc
+extern "C" { void * calloc( size_t dim, size_t size ); } // default C routine
+static inline forall( dtype T | sized(T) ) T * calloc( size_t dim ) {
+        //printf( "X2\n" );
+        return (T *)(void *)calloc( dim, sizeof(T) );           // C cmalloc
+}
+extern "C" { void * realloc( void * ptr, size_t size ); } // default C routine for void *
+static inline forall( dtype T | sized(T) ) T * realloc( T * ptr, size_t size ) {
+        //printf( "X3\n" );
+        return (T *)(void *)realloc( (void *)ptr, size );
+}
+extern "C" { void * memalign( size_t align, size_t size ); } // use default C routine for void *
+static inline forall( dtype T | sized(T) ) T * memalign( size_t align ) {
+        //printf( "X4\n" );
+        return (T *)memalign( align, sizeof(T) );
+} // memalign
+static inline forall( dtype T | sized(T) ) T * aligned_alloc( size_t align ) {
+        //printf( "X5\n" );
+        return (T *)memalign( align, sizeof(T) );
+} // aligned_alloc
+extern "C" { int posix_memalign( void ** ptr, size_t align, size_t size ); } // use default C routine for void *
+static inline forall( dtype T | sized(T) ) int posix_memalign( T ** ptr, size_t align ) {
+        //printf( "X6\n" );
+        return posix_memalign( (void **)ptr, align, sizeof(T) );
+} // posix_memalign
+extern "C" { void * memset( void * dest, int c, size_t size ); } // use default C routine for void *
+static inline forall( dtype T | sized(T) ) T * alloc( void ) {
+        //printf( "X7\n" );
+        return (T *)(void *)malloc( (size_t)sizeof(T) );        // C malloc
+} // alloc
+static inline forall( dtype T | sized(T) ) T * alloc( char fill ) {
+        //printf( "X8\n" );
+        T * ptr = (T *)(void *)malloc( (size_t)sizeof(T) );     // C malloc
+    return (T *)memset( ptr, (int)fill, sizeof(T) );    // initial with fill value
+} // alloc
+static inline forall( dtype T | sized(T) ) T * alloc( size_t dim ) {
+        //printf( "X9\n" );
+        return (T *)(void *)malloc( dim * (size_t)sizeof(T) ); // C malloc
+} // alloc
+static inline forall( dtype T | sized(T) ) T * alloc( size_t dim, char fill ) {
+        //printf( "X10\n" );
+        T * ptr = (T *)(void *)malloc( dim * (size_t)sizeof(T) ); // C malloc
+    return (T *)memset( ptr, (int)fill, dim * sizeof(T) );
+} // alloc
+static inline forall( dtype T | sized(T) ) T * alloc( T ptr[], size_t dim ) {
+        //printf( "X11\n" );
+        return (T *)(void *)realloc( (void *)ptr, dim * (size_t)sizeof(T) ); // C realloc
+} // alloc
+// C dynamic allocation
+static inline forall( dtype T | sized(T) ) {
+        T * malloc( void ) {
+                // printf( "* malloc\n" );
+                return (T *)(void *)malloc( (size_t)sizeof(T) ); // C malloc
+        } // malloc
+        // T & malloc( void ) {
+        //      int & p = *(T *)(void *)malloc( (size_t)sizeof(T) ); // C malloc
+        //      printf( "& malloc %p\n", &p );
+        //      return p;
+        //      //      return (T &)*(T *)(void *)malloc( (size_t)sizeof(T) ); // C malloc
+        // } // malloc
+        T * calloc( size_t dim ) {
+                //printf( "X2\n" );
+                return (T *)(void *)calloc( dim, sizeof(T) );   // C calloc
+        } // calloc
+        T * realloc( T * ptr, size_t size ) {
+                //printf( "X3\n" );
+                return (T *)(void *)realloc( (void *)ptr, size );
+        } // realloc
+        extern "C" { void * memalign( size_t align, size_t size ); } // use default C routine for void *
+        T * memalign( size_t align ) {
+                //printf( "X4\n" );
+                return (T *)memalign( align, sizeof(T) );
+        } // memalign
+        extern "C" { void * aligned_alloc( size_t align, size_t size ); } // use default C routine for void *
+        T * aligned_alloc( size_t align ) {
+                //printf( "X5\n" );
+                return (T *)aligned_alloc( align, sizeof(T) );
+        } // aligned_alloc
+        int posix_memalign( T ** ptr, size_t align ) {
+                //printf( "X6\n" );
+                return posix_memalign( (void **)ptr, align, sizeof(T) ); // C posix_memalign
+        } // posix_memalign
+        // Cforall dynamic allocation
+        extern "C" { void * memset( void * dest, int c, size_t size ); } // use default C routine for void *
+        T * alloc( void ) {
+                //printf( "X7\n" );
+                return (T *)(void *)malloc( (size_t)sizeof(T) ); // C malloc
+        } // alloc
+        T * alloc( char fill ) {
+                //printf( "X8\n" );
+                T * ptr = (T *)(void *)malloc( (size_t)sizeof(T) );     // C malloc
+                return (T *)memset( ptr, (int)fill, sizeof(T) );        // initial with fill value
+        } // alloc
+        T * alloc( size_t dim ) {
+                //printf( "X9\n" );
+                return (T *)(void *)malloc( dim * (size_t)sizeof(T) ); // C malloc
+        } // alloc
+        T * alloc( size_t dim, char fill ) {
+                //printf( "X10\n" );
+                T * ptr = (T *)(void *)malloc( dim * (size_t)sizeof(T) ); // C malloc
+                return (T *)memset( ptr, (int)fill, dim * sizeof(T) );    // initial with fill value
+        } // alloc
+        T * alloc( T ptr[], size_t dim ) {
+                //printf( "X11\n" );
+                return (T *)(void *)realloc( (void *)ptr, dim * (size_t)sizeof(T) ); // C realloc
+        } // alloc
+} // distribution
 forall( dtype T | sized(T) ) T * alloc( T ptr[], size_t dim, char fill );

src/libcfa/time.c

-              r7d0a3ba
+              r358cba0
 // Created On       : Tue Mar 27 13:33:14 2018
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Thu Apr 12 14:41:00 2018
 // Update Count     : 22
+// Last Modified On : Sun May  6 22:26:00 2018
+// Update Count     : 37
 //
 …
 #include "iostream"
 #include <stdio.h>                                                                              // snprintf
+#include <assert.h>
 static char * nanomsd( long int ns, char * buf ) {              // most significant digits
 …
         time_t s = tv / TIMEGRAN;
         tm tm;
+        gmtime_r( &s, &tm );
+        gmtime_r( &s, &tm );                                                            // tm_mon <= 11, tm_mday <= 31
+#if defined(__GNUC__) && __GNUC__ >= 7
+#pragma GCC diagnostic push
+#pragma GCC diagnostic ignored "-Wformat-truncation"
+#endif
         snprintf( buf, 9, "%02d/%02d/%02d", tm.tm_year % 99, tm.tm_mon + 1, tm.tm_mday );
+#if defined(__GNUC__) && __GNUC__ >= 7
+#pragma GCC diagnostic pop
+#endif
         return buf;
 } // yy_mm_dd
 …
         time_t s = tv / TIMEGRAN;
         tm tm;
+        gmtime_r( &s, &tm );
+        gmtime_r( &s, &tm );                                                            // tm_mon <= 11, tm_mday <= 31
+#if defined(__GNUC__) && __GNUC__ >= 7
+#pragma GCC diagnostic push
+#pragma GCC diagnostic ignored "-Wformat-truncation"
+#endif
         snprintf( buf, 9, "%02d/%02d/%02d", tm.tm_mon + 1, tm.tm_mday, tm.tm_year % 99 );
+#if defined(__GNUC__) && __GNUC__ >= 7
+#pragma GCC diagnostic pop
+#endif
         return buf;
 } // mm_dd_yy
 …
         time_t s = tv / TIMEGRAN;
         tm tm;
+        gmtime_r( &s, &tm );
+        gmtime_r( &s, &tm );                                                            // tm_mon <= 11, tm_mday <= 31
+#if defined(__GNUC__) && __GNUC__ >= 7
+#pragma GCC diagnostic push
+#pragma GCC diagnostic ignored "-Wformat-truncation"
+#endif
         snprintf( buf, 9, "%02d/%02d/%02d", tm.tm_mday, tm.tm_mon + 1, tm.tm_year % 99 );
+#if defined(__GNUC__) && __GNUC__ >= 7
+#pragma GCC diagnostic pop
+#endif
         return buf;
 } // dd_mm_yy

src/main.cc

-              r7d0a3ba
+              r358cba0
 // Created On       : Fri May 15 23:12:02 2015
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Wed May  2 14:59:02 2018
 // Update Count     : 490
+// Last Modified On : Mon May  7 14:35:57 2018
+// Update Count     : 492
 //
 …
 #define PASS(name, pass)                   \
         if ( errorp ) { cerr << #name << endl; } \
         HeapStats::newPass(#name);               \
+        if ( errorp ) { cerr << name << endl; } \
+        HeapStats::newPass(name);               \
         pass;
 …
                 } // if
                 return 1;
+        } // try
+        } catch(...) {
+                std::exception_ptr eptr = std::current_exception();
+                try {
+                        if (eptr) {
+                                std::rethrow_exception(eptr);
+                        }
+                        else {
+                                std::cerr << "Exception Uncaught and Unkown" << std::endl;
+                        }
+                } catch(const std::exception& e) {
+                        std::cerr << "Unaught Exception \"" << e.what() << "\"\n";
+                }
+                return 1;
+        }// try
         deleteAll( translationUnit );
         HeapStats::printStats();
+        if(!libcfap && !treep) HeapStats::printStats();
         return 0;
 } // main
 …
         opterr = 0;                                                                                     // (global) prevent getopt from printing error messages
         bool Werror = false;
+        bool Wsuppress = false, Werror = false;
         int c;
         while ( (c = getopt_long( argc, argv, "abBcCdefgGlLmnNpqrstTvwW:yzZD:F:", long_opts, &long_index )) != -1 ) {
 …
                         break;
                   case 'w':
                         SemanticWarning_SuppressAll();
+                        Wsuppress = true;
                         break;
                   case 'W':
 …
                                 assertf( false, "Unknown option: %s\n", argv[optind - 1] );
                         } // if
+                        #if __GNUC__ < 7
+                        #else
+                        #if defined(__GNUC__) && __GNUC__ >= 7
                                 __attribute__((fallthrough));
                         #endif
 …
         if ( Werror ) {
                 SemanticWarning_WarningAsError();
+        } // if
+        if ( Wsuppress ) {
+                SemanticWarning_SuppressAll();
         } // if
         // for ( const auto w : WarningFormats ) {

src/tests/coroutine/fmtLines.c

-              r7d0a3ba
+              r358cba0
 // file "LICENCE" distributed with Cforall.
 //
 // fmtLines.cc --
+// fmtLines.cc -- format characters into blocks of 4 and groups of 5 blocks per line
 //
 // Author           : Peter A. Buhr
 // Created On       : Sun Sep 17 21:56:15 2017
 // Last Modified By : Peter A. Buhr
 // Last Modified On : Tue Dec  5 21:56:35 2017
 // Update Count     : 38
+// Last Modified On : Tue May 15 12:25:33 2018
+// Update Count     : 42
 //
 …
         int g, b;                                                                                       // global because used in destructor
 };
-void ?{}( Format & fmt ) {
-        resume( fmt );                                                                          // prime (start) coroutine
+}
-void ^?{}( Format & fmt ) with( fmt ) {
-        if ( g != 0 || b != 0 ) sout | endl;
+}
 void main( Format & fmt ) with( fmt ) {
 …
 } // main
+void prt( Format & fmt, char ch ) {
+        fmt.ch = ch;
+void ?{}( Format & fmt ) {
+        resume( fmt );                                                                          // prime (start) coroutine
+}
+void ^?{}( Format & fmt ) with( fmt ) {
+        if ( g != 0 || b != 0 ) sout | endl;
+}
+void format( Format & fmt ) {
         resume( fmt );
 } // prt
 int main() {
+        Format fmt;                                                                                     // format characters into blocks of 4 and groups of 5 blocks per line
+        char ch;
+        Format fmt;
         Eof: for ( ;; ) {                                                                       // read until end of file
                 sin | ch;                                                                               // read one character
           if ( eof( sin ) ) break Eof;                                          // eof ?
                 prt( fmt, ch );                                                                 // push character for formatting
+        eof: for ( ;; ) {                                                                       // read until end of file
+                sin | fmt.ch;                                                                   // read one character
+          if ( eof( sin ) ) break eof;                                          // eof ?
+                format( fmt );                                                                  // push character for formatting
         } // for
 } // main

Context Navigation

Changes in / [7d0a3ba:358cba0]

Legend:

Jenkinsfile

doc/bibliography/pl.bib

doc/papers/AMA/AMA-stix/Documents/README.txt

doc/papers/AMA/AMA-stix/ama/WileyNJD-AMA.bst

doc/papers/AMA/AMA-stix/ama/WileyNJD-v2.cls

doc/papers/general/.gitignore

doc/papers/general/Makefile

doc/papers/general/Paper.tex

doc/papers/general/evaluation/timing.gp

src/CodeGen/CodeGenerator.cc

src/CodeGen/FixNames.cc

src/Common/Heap.cc

src/Common/Heap.h

src/Common/PassVisitor.proto.h

src/Common/utility.h

src/Parser/parser.yy

src/benchmark/Makefile.am

src/benchmark/Makefile.in

src/driver/cc1.cc

src/driver/cfa.cc

src/libcfa/bits/containers.h

src/libcfa/concurrency/coroutine

src/libcfa/concurrency/coroutine.c

src/libcfa/concurrency/invoke.c

src/libcfa/concurrency/invoke.h

src/libcfa/concurrency/kernel

src/libcfa/concurrency/kernel.c

src/libcfa/concurrency/kernel_private.h

src/libcfa/concurrency/monitor.c

src/libcfa/concurrency/preemption.c

src/libcfa/concurrency/thread.c

src/libcfa/interpose.c

src/libcfa/stdlib

src/libcfa/time.c

src/main.cc

src/tests/coroutine/fmtLines.c

Download in other formats: