Context Navigation

← Previous Changeset
Next Changeset →

Changeset 7069652

Timestamp:

Apr 19, 2017, 8:12:56 AM (9 years ago)

Author:

Rob Schluntz <rschlunt@…>

Branches:

ADT, aaron-thesis, arm-eh, ast-experimental, cleanup-dtors, deferred_resn, demangler, enum, forall-pointer-decay, jacob/cs343-translation, jenkins-sandbox, master, new-ast, new-ast-unique-expr, new-env, no_list, persistent-indexer, pthread-emulation, qualifiedEnum, resolv-new, stuck-waitfor-destruct, with_gc

Children:

Parents:

e39241b (diff), de4ce0e (diff)
Note: this is a merge changeset, the changes displayed below correspond to the merge itself.
Use the (diff) links above to see all the changes relative to each parent.

Message:

Merge branch 'master' of plg.uwaterloo.ca:/u/cforall/software/cfa/cfa-cc

Location:

Files:

: 1 added
: 6 edited

bibliography/cfa.bib (modified) (2 diffs)
generic_types/evaluation/cfa-bench.c (modified) (1 diff)
generic_types/evaluation/cpp-pair.hpp (added)
generic_types/evaluation/timing.dat (modified) (1 diff)
generic_types/evaluation/timing.gp (modified) (1 diff)
generic_types/evaluation/timing.xlsx (modified) ( previous)
generic_types/generic_types.tex (modified) (31 diffs)

Legend:

: Unmodified
: Added
: Removed

doc/bibliography/cfa.bib

-              re39241b
+              r7069652
     contributer = {pabuhr@plg},
     author      = {James Gosling and Bill Joy and Guy Steele and Gilad Bracha and Alex Buckley},
     title       = {{Java} Language Specification},
+    title       = {{Java} Language Spec.},
     organization= {Oracle},
     publisher   = {Oracle},
 …
+}
+@article{Smith98,
+  keywords = {Polymorphic C},
+  contributor = {a3moss@uwaterloo.ca},
+  title={A sound polymorphic type system for a dialect of C},
+  author={Smith, Geoffrey and Volpano, Dennis},
+  journal={Science of computer programming},
+  volume={32},
+  number={1-3},
+  pages={49--72},
+  year={1998},
+  publisher={Elsevier}
+}
 @book{Campbell74,
     keywords    = {path expressions},

doc/generic_types/evaluation/cfa-bench.c

re39241b	r7069652
1		~~#include <stdlib>~~
2	1	#include <stdio.h>
3	2	#include "bench.h"

doc/generic_types/evaluation/timing.dat

-              re39241b
+              r7069652
 "400 million repetitions"       "C"     "\\CFA{}"       "\\CC{}"        "\\CC{obj}"
 "push\nint"     2958    2480    1519    3284
 "copy\nint"     2961    2014    1534    3126
 "clear\nint"    1350    817     722     1459
 "pop\nint"      1386    1174    717     5404
 "print\nint"    5702    6615    3077    3191
 "push\npair"    4160    2648    940     6566
 "copy\npair"    6195    2099    977     7234
 "clear\npair"   2834    863     723     3315
 "pop\npair"     2956    5591    775     26256
 "print\npair"   7498    10804   8750    16638
+"push\nint"     3002    2459    1520    3305
+"copy\nint"     2985    2057    1521    3152
+"clear\nint"    1374    827     718     1469
+"pop\nint"      1416    1221    717     5467
+"print\nint"    5656    6758    3120    3121
+"push\npair"    4214    2752    946     6826
+"copy\npair"    6127    2105    993     7330
+"clear\npair"   2881    885     711     3564
+"pop\npair"     3046    5434    783     26538
+"print\npair"   7514    10714   8717    16525

doc/generic_types/evaluation/timing.gp

re39241b	r7069652
1	1	# set terminal pdfcairo linewidth 3 size 6,3
2	2	# set output "timing.pdf"
3		set terminal pslatex size 6.25,2.25 color solid
	3	set terminal pslatex size 6.25,2.125 color solid
4	4	set output "timing.tex"
5	5

doc/generic_types/generic_types.tex

-              re39241b
+              r7069652
 \makeatletter
+% Default underscore is too low and wide. Cannot use lstlisting "literate" as replacing underscore
+% removes it as a variable-name character so keywords in variables are highlighted
+\DeclareTextCommandDefault{\textunderscore}{\leavevmode\makebox[1.2ex][c]{\rule{1ex}{0.1ex}}}
 % parindent is relative, i.e., toggled on/off in environments like itemize, so store the value for
 % use rather than use \parindent directly.
 …
 \setlength{\parindentlnth}{\parindent}
 \newlength{\gcolumnposn}                                % temporary hack because lstlisting does handle tabs correctly
+\newlength{\gcolumnposn}                                % temporary hack because lstlisting does not handle tabs correctly
 \newlength{\columnposn}
 \setlength{\gcolumnposn}{2.75in}
 …
 \newcommand{\CRT}{\global\columnposn=\gcolumnposn}
-\newcommand{\TODO}[1]{\textbf{TODO}: {\itshape #1}} % TODO included
-%\newcommand{\TODO}[1]{} % TODO elided
 % Latin abbreviation
 \newcommand{\abbrevFont}{\textit}       % set empty for no italics
 …
                 {\abbrevFont{et al}.\xspace}%
 }%
-% \newcommand{\eg}{\textit{e}.\textit{g}.,\xspace}
-% \newcommand{\ie}{\textit{i}.\textit{e}.,\xspace}
-% \newcommand{\etc}{\textit{etc}.,\xspace}
 \makeatother
 …
 \newcommand{\CCtwenty}{\rm C\kern-.1em\hbox{+\kern-.25em+}20\xspace} % C++20 symbolic name
 \newcommand{\CCV}{\rm C\kern-.1em\hbox{+\kern-.25em+}obj\xspace} % C++ virtual symbolic name
 \newcommand{\CS}{C\raisebox{-0.7ex}{\Large$^\sharp$}\xspace}
+\newcommand{\Csharp}{C\raisebox{-0.7ex}{\Large$^\sharp$}\xspace} % C# symbolic name
 \newcommand{\Textbf}[1]{{\color{red}\textbf{#1}}}
+\newcommand{\TODO}[1]{\textbf{TODO}: {\itshape #1}} % TODO included
+%\newcommand{\TODO}[1]{} % TODO elided
 % CFA programming language, based on ANSI C (with some gcc additions)
 …
 belowskip=3pt,
 % replace/adjust listing characters that look bad in sanserif
 literate={-}{\raisebox{-0.15ex}{\texttt{-}}}1 {^}{\raisebox{0.6ex}{$\scriptscriptstyle\land\,$}}1
         {~}{\raisebox{0.3ex}{$\scriptstyle\sim\,$}}1%{_}{\makebox[1.2ex][c]{\rule{1ex}{0.1ex}}}1 % {`}{\ttfamily\upshape\hspace*{-0.1ex}`}1
         {<-}{$\leftarrow$}2 {=>}{$\Rightarrow$}2,
+literate={-}{\makebox[1.4ex][c]{\raisebox{0.5ex}{\rule{1.2ex}{0.1ex}}}}1 {^}{\raisebox{0.6ex}{$\scriptscriptstyle\land\,$}}1
+        {~}{\raisebox{0.3ex}{$\scriptstyle\sim\,$}}1 % {`}{\ttfamily\upshape\hspace*{-0.1ex}`}1
+        {<-}{$\leftarrow$}2 {=>}{$\Rightarrow$}2 {->}{\makebox[1.4ex][c]{\raisebox{0.5ex}{\rule{1.2ex}{0.1ex}}}\kern-0.3ex\textgreater}2,
 moredelim=**[is][\color{red}]{`}{`},
 }% lstset
 …
 The C programming language is a foundational technology for modern computing with millions of lines of code implementing everything from commercial operating-systems to hobby projects.
 This installation base and the programmers producing it represent a massive software-engineering investment spanning decades and likely to continue for decades more.
 The \citet{TIOBE} ranks the top 5 most popular programming languages as: Java 16\%, \Textbf{C 7\%}, \Textbf{\CC 5\%}, \CS 4\%, Python 4\% = 36\%, where the next 50 languages are less than 3\% each with a long tail.
+The \citet{TIOBE} ranks the top 5 most popular programming languages as: Java 16\%, \Textbf{C 7\%}, \Textbf{\CC 5\%}, \Csharp 4\%, Python 4\% = 36\%, where the next 50 languages are less than 3\% each with a long tail.
 The top 3 rankings over the past 30 years are:
 \lstDeleteShortInline@%
 \begin{center}
 \setlength{\tabcolsep}{10pt}
+\begin{tabular}{@{}r|c|c|c|c|c|c|c@{}}
+                & 2017  & 2012  & 2007  & 2002  & 1997  & 1992  & 1987          \\
+\hline
+\begin{tabular}{@{}rccccccc@{}}
+                & 2017  & 2012  & 2007  & 2002  & 1997  & 1992  & 1987          \\ \hline
 Java    & 1             & 1             & 1             & 1             & 12    & -             & -                     \\
-\hline
 \Textbf{C}      & \Textbf{2}& \Textbf{2}& \Textbf{2}& \Textbf{2}& \Textbf{1}& \Textbf{1}& \Textbf{1}    \\
-\hline
 \CC             & 3             & 3             & 3             & 3             & 2             & 2             & 4                     \\
 \end{tabular}
 …
 \CC is used similarly, but has the disadvantages of multiple legacy design-choices that cannot be updated and active divergence of the language model from C, requiring significant effort and training to incrementally add \CC to a C-based project.
 \CFA is currently implemented as a source-to-source translator from \CFA to the GCC-dialect of C~\citep{GCCExtensions}, allowing it to leverage the portability and code optimizations provided by GCC, meeting goals (1)-(3).
+\CFA is currently implemented as a source-to-source translator from \CFA to the GCC-dialect of C~\citep{GCCExtensions}, allowing it to leverage the portability and code optimizations provided by GCC, meeting goals (1)--(3).
 Ultimately, a compiler is necessary for advanced features and optimal performance.
 …
 Since bare polymorphic-types provide a restricted set of available operations, \CFA provides a \emph{type assertion}~\cite[pp.~37-44]{Alphard} mechanism to provide further type information, where type assertions may be variable or function declarations that depend on a polymorphic type-variable.
 For example, the function @twice@ can be defined using the \CFA syntax for operator overloading:
-\newpage
 \begin{lstlisting}
 forall( otype T `| { T ?+?(T, T); }` ) T twice( T x ) { return x + x; } $\C{// ? denotes operands}$
 …
 int comp( const void * t1, const void * t2 ) { return *(double *)t1 < *(double *)t2 ? -1 :
                                 *(double *)t2 < *(double *)t1 ? 1 : 0; }
+double vals[10] = { /* 10 floating-point values */ };
+double key = 5.0;
+double key = 5.0, vals[10] = { /* 10 floating-point values */ };
 double * val = (double *)bsearch( &key, vals, 10, sizeof(vals[0]), comp );      $\C{// search sorted array}$
 \end{lstlisting}
 …
 Finally, \CFA allows variable overloading:
+\lstDeleteShortInline@%
+\par\smallskip
+\begin{tabular}{@{}l@{\hspace{1.5\parindent}}||@{\hspace{1.5\parindent}}l@{}}
+\begin{lstlisting}
+short int MAX = ...;
+int MAX = ...;
+double MAX = ...;
+\end{lstlisting}
+&
+\begin{lstlisting}
+short int s = MAX;  // select correct MAX
+int i = MAX;
+double d = MAX;
+\end{lstlisting}
+\end{tabular}
+\smallskip\par\noindent
+\lstMakeShortInline@%
+\begin{lstlisting}
+short int MAX = ...;   int MAX = ...;  double MAX = ...;
+short int s = MAX;    int i = MAX;    double d = MAX;   $\C{// select correct MAX}$
+\end{lstlisting}
 Here, the single name @MAX@ replaces all the C type-specific names: @SHRT_MAX@, @INT_MAX@, @DBL_MAX@.
 As well, restricted constant overloading is allowed for the values @0@ and @1@, which have special status in C, \eg the value @0@ is both an integer and a pointer literal, so its meaning depends on context.
 …
+}
 \end{lstlisting}
-%       int c = cmp( a->first, b->first );
-%       if ( c == 0 ) c = cmp( a->second, b->second );
-%       return c;
 Since @pair(T *, T * )@ is a concrete type, there are no implicit parameters passed to @lexcmp@, so the generated code is identical to a function written in standard C using @void *@, yet the \CFA version is type-checked to ensure the fields of both pairs and the arguments to the comparison function match in type.
 …
 Tuple flattening recursively expands a tuple into the list of its basic components.
 Tuple structuring packages a list of expressions into a value of tuple type, \eg:
 \lstDeleteShortInline@%
 \par\smallskip
 \begin{tabular}{@{}l@{\hspace{1.5\parindent}}||@{\hspace{1.5\parindent}}l@{}}
+%\lstDeleteShortInline@%
+%\par\smallskip
+%\begin{tabular}{@{}l@{\hspace{1.5\parindent}}||@{\hspace{1.5\parindent}}l@{}}
 \begin{lstlisting}
 int f( int, int );
 …
 int h( int, [int, int] );
 [int, int] x;
-\end{lstlisting}
+&
-\begin{lstlisting}
 int y;
 f( x );                 $\C[1in]{// flatten}$
+f( x );                 $\C{// flatten}$
 g( y, 10 );             $\C{// structure}$
+h( x, y );              $\C{// flatten and structure}\CRT{}$
+\end{lstlisting}
+\end{tabular}
+\smallskip\par\noindent
+\lstMakeShortInline@%
+h( x, y );              $\C{// flatten and structure}$
+\end{lstlisting}
+%\end{lstlisting}
+%&
+%\begin{lstlisting}
+%\end{tabular}
+%\smallskip\par\noindent
+%\lstMakeShortInline@%
 In the call to @f@, @x@ is implicitly flattened so the components of @x@ are passed as the two arguments.
 In the call to @g@, the values @y@ and @10@ are structured into a single argument of type @[int, int]@ to match the parameter type of @g@.
 …
 An assignment where the left side is a tuple type is called \emph{tuple assignment}.
 There are two kinds of tuple assignment depending on whether the right side of the assignment operator has a tuple type or a non-tuple type, called \emph{multiple} and \emph{mass assignment}, respectively.
 \lstDeleteShortInline@%
 \par\smallskip
 \begin{tabular}{@{}l@{\hspace{1.5\parindent}}||@{\hspace{1.5\parindent}}l@{}}
+%\lstDeleteShortInline@%
+%\par\smallskip
+%\begin{tabular}{@{}l@{\hspace{1.5\parindent}}||@{\hspace{1.5\parindent}}l@{}}
 \begin{lstlisting}
 int x = 10;
 double y = 3.5;
 [int, double] z;
+\end{lstlisting}
+&
+\begin{lstlisting}
+z = [x, y];             $\C[1in]{// multiple assignment}$
+[x, y] = z;             $\C{// multiple assignment}$
+z = 10;                 $\C{// mass assignment}$
+[y, x] = 3.14;  $\C{// mass assignment}\CRT{}$
+\end{lstlisting}
+\end{tabular}
+\smallskip\par\noindent
+\lstMakeShortInline@%
+z = [x, y];                                                                     $\C{// multiple assignment}$
+[x, y] = z;                                                                     $\C{// multiple assignment}$
+z = 10;                                                                         $\C{// mass assignment}$
+[y, x] = 3.14;                                                          $\C{// mass assignment}$
+\end{lstlisting}
+%\end{lstlisting}
+%&
+%\begin{lstlisting}
+%\end{tabular}
+%\smallskip\par\noindent
+%\lstMakeShortInline@%
 Both kinds of tuple assignment have parallel semantics, so that each value on the left and right side is evaluated before any assignments occur.
 As a result, it is possible to swap the values in two variables without explicitly creating any temporary variables or calling a function, \eg, @[x, y] = [y, x]@.
 …
 Here, the mass assignment sets all members of @s@ to zero.
 Since tuple-index expressions are a form of member-access expression, it is possible to use tuple-index expressions in conjunction with member tuple expressions to manually restructure a tuple (\eg rearrange, drop, and duplicate components).
 \lstDeleteShortInline@%
 \par\smallskip
 \begin{tabular}{@{}l@{\hspace{1.5\parindent}}||@{\hspace{1.5\parindent}}l@{}}
+%\lstDeleteShortInline@%
+%\par\smallskip
+%\begin{tabular}{@{}l@{\hspace{1.5\parindent}}||@{\hspace{1.5\parindent}}l@{}}
 \begin{lstlisting}
 [int, int, long, double] x;
 void f( double, long );
+\end{lstlisting}
+&
+\begin{lstlisting}
+x.[0, 1] = x.[1, 0];    $\C[1in]{// rearrange: [x.0, x.1] = [x.1, x.0]}$
+f( x.[0, 3] );            $\C{// drop: f(x.0, x.3)}\CRT{}$
+[int, int, int] y = x.[2, 0, 2]; // duplicate: [y.0, y.1, y.2] = [x.2, x.0, x.2]
+\end{lstlisting}
+\end{tabular}
+\smallskip\par\noindent
+\lstMakeShortInline@%
+x.[0, 1] = x.[1, 0];                                            $\C{// rearrange: [x.0, x.1] = [x.1, x.0]}$
+f( x.[0, 3] );                                                          $\C{// drop: f(x.0, x.3)}$
+[int, int, int] y = x.[2, 0, 2];                        $\C{// duplicate: [y.0, y.1, y.2] = [x.2, x.0, x.2]}$
+\end{lstlisting}
+%\end{lstlisting}
+%&
+%\begin{lstlisting}
+%\end{tabular}
+%\smallskip\par\noindent
+%\lstMakeShortInline@%
 It is also possible for a member access to contain other member accesses, \eg:
 \begin{lstlisting}
 …
 This example showcases a variadic-template-like decomposition of the provided argument list.
 The individual @print@ functions allow printing a single element of a type.
 The polymorphic @print@ allows printing any list of types, as long as each individual type has a @print@ function.
 The individual print functions can be used to build up more complicated @print@ functions, such as for @S@, which is something that cannot be done with @printf@ in C.
+The polymorphic @print@ allows printing any list of types, as long as each individual type has a @print@ function.
+The individual print functions can be used to build up more complicated @print@ functions, such as @S@, which cannot be done with @printf@ in C.
 Finally, it is possible to use @ttype@ polymorphism to provide arbitrary argument forwarding functions.
 …
 is transformed into:
 \begin{lstlisting}
-// generated before the first 2-tuple
 forall(dtype T0, dtype T1 | sized(T0) | sized(T1)) struct _tuple2 {
         T0 field_0;
+        T0 field_0;                                                             $\C{// generated before the first 2-tuple}$
         T1 field_1;
 };
 _tuple2(int, int) f() {
         _tuple2(double, double) x;
-        // generated before the first 3-tuple
         forall(dtype T0, dtype T1, dtype T2 | sized(T0) | sized(T1) | sized(T2)) struct _tuple3 {
                 T0 field_0;
+                T0 field_0;                                                     $\C{// generated before the first 3-tuple}$
                 T1 field_1;
                 T2 field_2;
 …
+}
 \end{lstlisting}
+Tuple expressions are then simply converted directly into compound literals:
+\begin{lstlisting}
+[5, 'x', 1.24];
+\end{lstlisting}
+becomes:
+\begin{lstlisting}
+(_tuple3(int, char, double)){ 5, 'x', 1.24 };
+\end{lstlisting}
+Tuple expressions are then simply converted directly into compound literals, \eg @[5, 'x', 1.24]@ becomes @(_tuple3(int, char, double)){ 5, 'x', 1.24 }@.
 \begin{comment}
 …
 Though \CFA provides significant added functionality over C, these features have a low runtime penalty.
 In fact, \CFA's features for generic programming can enable faster runtime execution than idiomatic @void *@-based C code.
 This claim is demonstrated through a set of generic-code-based micro-benchmarks in C, \CFA, and \CC (see source-code interfaces in Appendix~\ref{sec:BenchmarkInterfaces}).
 Since all these languages share a subset comprising standard C, maximal-performance benchmarks would show little runtime variance, other than in length and clarity of source code.
 A more illustrative benchmark is to show the costs of idiomatic use of each language's features covering common usage.
+This claim is demonstrated through a set of generic-code-based micro-benchmarks in C, \CFA, and \CC (see stack implementations in Appendix~\ref{sec:BenchmarkStackImplementation}).
+Since all these languages share a subset essentially comprising standard C, maximal-performance benchmarks would show little runtime variance, other than in length and clarity of source code.
+A more illustrative benchmark measures the costs of idiomatic usage of each language's features.
 Figure~\ref{fig:BenchmarkTest} shows the \CFA benchmark tests for a generic stack based on a singly linked-list, a generic pair-data-structure, and a variadic @print@ routine similar to that in Section~\ref{sec:variadic-tuples}.
 The benchmark test is similar for C and \CC.
+The experiment uses element types @int@ and @pair(_Bool, char)@, and pushes $N=40M$ elements on a generic stack, copies the stack, clears one of the stacks, finds the maximum value in the other stack, and prints $N$ constant values.
+The experiment uses element types @int@ and @pair(_Bool, char)@, and pushes $N=40M$ elements on a generic stack, copies the stack, clears one of the stacks, finds the maximum value in the other stack, and prints $N/2$ (to reduce graph height) constants.
+\begin{figure}
+\begin{lstlisting}[xleftmargin=3\parindentlnth,aboveskip=0pt,belowskip=0pt]
+int main( int argc, char * argv[] ) {
+        FILE * out = fopen( "cfa-out.txt", "w" );
+        int maxi = 0, vali = 42;
+        stack(int) si, ti;
+        REPEAT_TIMED( "push_int", N, push( &si, vali ); )
+        TIMED( "copy_int", ti = si; )
+        TIMED( "clear_int", clear( &si ); )
+        REPEAT_TIMED( "pop_int", N,
+                int xi = pop( &ti ); if ( xi > maxi ) { maxi = xi; } )
+        REPEAT_TIMED( "print_int", N/2, print( out, vali, ":", vali, "\n" ); )
+        pair(_Bool, char) maxp = { (_Bool)0, '\0' }, valp = { (_Bool)1, 'a' };
+        stack(pair(_Bool, char)) sp, tp;
+        REPEAT_TIMED( "push_pair", N, push( &sp, valp ); )
+        TIMED( "copy_pair", tp = sp; )
+        TIMED( "clear_pair", clear( &sp ); )
+        REPEAT_TIMED( "pop_pair", N,
+                pair(_Bool, char) xp = pop( &tp ); if ( xp > maxp ) { maxp = xp; } )
+        REPEAT_TIMED( "print_pair", N/2, print( out, valp, ":", valp, "\n" ); )
+        fclose(out);
+}
+\end{lstlisting}
+\caption{\CFA Benchmark Test}
+\label{fig:BenchmarkTest}
+\end{figure}
 The structure of each benchmark implemented is: C with @void *@-based polymorphism, \CFA with the presented features, \CC with templates, and \CC using only class inheritance for polymorphism, called \CCV.
 …
 hence runtime checks are necessary to safely down-cast objects.
 The most notable difference among the implementations is in memory layout of generic types: \CFA and \CC inline the stack and pair elements into corresponding list and pair nodes, while C and \CCV lack such a capability and instead must store generic objects via pointers to separately-allocated objects.
 For the print benchmark, idiomatic printing is used: the C and \CFA variants used @stdio.h@, while the \CC and \CCV variants used @iostream@; preliminary tests show this distinction has little runtime impact.
+For the print benchmark, idiomatic printing is used: the C and \CFA variants used @stdio.h@, while the \CC and \CCV variants used @iostream@; preliminary tests show this distinction has negligible runtime impact.
 Note, the C benchmark uses unchecked casts as there is no runtime mechanism to perform such checks, while \CFA and \CC provide type-safety statically.
-\begin{figure}
-\begin{lstlisting}[xleftmargin=3\parindentlnth,aboveskip=0pt,belowskip=0pt]
-int main( int argc, char *argv[] ) {
-        FILE * out = fopen( "cfa-out.txt", "w" );
-        int maxi = 0, vali = 42;
-        stack(int) si, ti;
-        REPEAT_TIMED( "push_int", N, push( &si, vali ); )
-        TIMED( "copy_int", ti = si; )
-        TIMED( "clear_int", clear( &si ); )
-        REPEAT_TIMED( "pop_int", N,
-                int xi = pop( &ti );
-                if ( xi > maxi ) { maxi = xi; } )
-        REPEAT_TIMED( "print_int", N/2, print( out, vali, ":", vali, "\n" ); )
-        pair(_Bool, char) maxp = { (_Bool)0, '\0' }, valp = { (_Bool)1, 'a' };
-        stack(pair(_Bool, char)) sp, tp;
-        REPEAT_TIMED( "push_pair", N, push( &sp, valp ); )
-        TIMED( "copy_pair", tp = sp; )
-        TIMED( "clear_pair", clear( &sp ); )
-        REPEAT_TIMED( "pop_pair", N,
-                pair(_Bool, char) xp = pop( &tp );
-                if ( xp > maxp ) { maxp = xp; } )
-        REPEAT_TIMED( "print_pair", N/2, print( out, valp, ":", valp, "\n" ); )
-        fclose(out);
+}
-\end{lstlisting}
-\caption{\CFA Benchmark Test}
-\label{fig:BenchmarkTest}
-\end{figure}
 Figure~\ref{fig:eval} and Table~\ref{tab:eval} show the results of running the benchmark in Figure~\ref{fig:BenchmarkTest} and its C, \CC, and \CCV equivalents.
 …
                                                                         & \CT{C}        & \CT{\CFA}     & \CT{\CC}      & \CT{\CCV}             \\ \hline
 maximum memory usage (MB)                       & 10001         & 2502          & 2503          & 11253                 \\
 source code size (lines)                        & 247           & 223           & 165           & 339                   \\
+source code size (lines)                        & 247           & 222           & 165           & 339                   \\
 redundant type annotations (lines)      & 39            & 2                     & 2                     & 15                    \\
 binary size (KB)                                        & 14            & 229           & 18            & 38                    \\
 …
 The C and \CCV variants are generally the slowest with the largest memory footprint, because of their less-efficient memory layout and the pointer-indirection necessary to implement generic types;
 this inefficiency is exacerbated by the second level of generic types in the pair-based benchmarks.
 By contrast, the \CFA and \CC variants run in roughly equivalent time for both the integer and pair of @_Bool@ and @char@ because the storage layout is equivalent.
+By contrast, the \CFA and \CC variants run in roughly equivalent time for both the integer and pair of @_Bool@ and @char@ because the storage layout is equivalent, with the inlined libraries (\ie no separate compilation) and greater maturity of the \CC compiler contributing to its lead.
 \CCV is slower than C largely due to the cost of runtime type-checking of down-casts (implemented with @dynamic_cast@);
 There are two outliers in the graph for \CFA: all prints and pop of @pair@.
 Both of these cases result from the complexity of the C-generated polymorphic code, so that the GCC compiler is unable to optimize some dead code and condense nested calls.
 A compiler for \CFA could easily perform these optimizations.
+A compiler designed for \CFA could easily perform these optimizations.
 Finally, the binary size for \CFA is larger because of static linking with the \CFA libraries.
 \CC performs best because it uses header-only inlined libraries (\ie no separate compilation).
 \CFA and \CC have the advantage of a pre-written generic @pair@ and @stack@ type to reduce line count, while C and \CCV require it to be written by the programmer, as C does not have a generic collections-library and \CCV does not use the \CC standard template library by construction.
+For \CCV, the definition of @object@ and wrapper classes for @bool@, @char@, @int@, and @const char *@ are included in the line count, which inflates its line count, as an actual object-oriented language would include these in the standard library;
+\CFA is also competitive in terms of source code size, measured as a proxy for programmer effort. The line counts in Table~\ref{tab:eval} include implementations of @pair@ and @stack@ types for all four languages for purposes of direct comparison, though it should be noted that \CFA and \CC have pre-written data structures in their standard libraries that programmers would generally use instead. Use of these standard library types has minimal impact on the performance benchmarks, but shrinks the \CFA and \CC benchmarks to 73 and 54 lines, respectively.
+On the other hand, C does not have a generic collections-library in its standard distribution, resulting in frequent reimplementation of such collection types by C programmers.
+\CCV does not use the \CC standard template library by construction, and in fact includes the definition of @object@ and wrapper classes for @bool@, @char@, @int@, and @const char *@ in its line count, which inflates this count somewhat, as an actual object-oriented language would include these in the standard library;
 with their omission the \CCV line count is similar to C.
 We justify the given line count by noting that many object-oriented languages do not allow implementing new interfaces on library types without subclassing or wrapper types, which may be similarly verbose.
 …
 To quantify this, the ``redundant type annotations'' line in Table~\ref{tab:eval} counts the number of lines on which the type of a known variable is re-specified, either as a format specifier, explicit downcast, type-specific function, or by name in a @sizeof@, struct literal, or @new@ expression.
 The \CC benchmark uses two redundant type annotations to create new stack nodes, while the C and \CCV benchmarks have several such annotations spread throughout their code.
 The three instances in which the \CFA benchmark still uses redundant type specifiers are to cast the result of a polymorphic @malloc@ call (the @sizeof@ argument is inferred by the compiler).
 These uses are similar to the @new@ expressions in \CC, though ongoing work on the \CFA compiler's type resolver should shortly render even these type casts superfluous.
+The two instances in which the \CFA benchmark still uses redundant type specifiers are to cast the result of a polymorphic @malloc@ call (the @sizeof@ argument is inferred by the compiler).
+These uses are similar to the @new@ expressions in \CC, though the \CFA compiler's type resolver should shortly render even these type casts superfluous.
 …
 In contrast, \CFA has a single facility for polymorphic code supporting type-safe separate-compilation of polymorphic functions and generic (opaque) types, which uniformly leverage the C procedural paradigm.
 The key mechanism to support separate compilation is \CFA's \emph{explicit} use of assumed properties for a type.
 Until \CC~\citep{C++Concepts} are standardized (anticipated for \CCtwenty), \CC provides no way to specify the requirements of a generic function in code beyond compilation errors during template expansion;
+Until \CC~\citet{C++Concepts} are standardized (anticipated for \CCtwenty), \CC provides no way to specify the requirements of a generic function in code beyond compilation errors during template expansion;
 furthermore, \CC concepts are restricted to template polymorphism.
 …
 In \CFA terms, all Cyclone polymorphism must be dtype-static.
 While the Cyclone design provides the efficiency benefits discussed in Section~\ref{sec:generic-apps} for dtype-static polymorphism, it is more restrictive than \CFA's general model.
+\citet{Smith98} present Polymorphic C, an ML dialect with polymorphic functions and C-like syntax and pointer types; it lacks many of C's features, however, most notably structure types, and so is not a practical C replacement.
 \citet{obj-c-book} is an industrially successful extension to C.
 However, Objective-C is a radical departure from C, using an object-oriented model with message-passing.
 Objective-C did not support type-checked generics until recently~\citet{xcode7}, historically using less-efficient and more error-prone runtime checking of object types.
+Objective-C did not support type-checked generics until recently \citet{xcode7}, historically using less-efficient runtime checking of object types.
 The~\citet{GObject} framework also adds object-oriented programming with runtime type-checking and reference-counting garbage-collection to C;
 these features are more intrusive additions than those provided by \CFA, in addition to the runtime overhead of reference-counting.
+\citet{Vala} compiles to GObject-based C, and so adds the burden of learning a separate language syntax to the aforementioned demerits of GObject as a modernization path for the existing C code-bases.
+Java~\citep{Java8} included generic types in Java~5;
+Java's generic types are type-checked at compilation and type-erased at runtime, similar to \CFA's.
+\citet{Vala} compiles to GObject-based C, adding the burden of learning a separate language syntax to the aforementioned demerits of GObject as a modernization path for existing C code-bases.
+Java~\citep{Java8} included generic types in Java~5, which are type-checked at compilation and type-erased at runtime, similar to \CFA's.
 However, in Java, each object carries its own table of method pointers, while \CFA passes the method pointers separately to maintain a C-compatible layout.
 Java is also a garbage-collected, object-oriented language, with the associated resource usage and C-interoperability burdens.
 …
 There is ongoing work on a wide range of \CFA feature extensions, including reference types, exceptions, concurrent primitives and modules.
 (While all examples in the paper compile and run, a public beta-release of \CFA will take another 8--12 months to finalize these addition extensions.)
+(While all examples in the paper compile and run, a public beta-release of \CFA will take another 8--12 months to finalize these additional extensions.)
 In addition, there are interesting future directions for the polymorphism design.
 Notably, \CC template functions trade compile time and code bloat for optimal runtime of individual instantiations of polymorphic functions.
 \CFA polymorphic functions, by contrast, uses a dynamic virtual dispatch.
 The runtime overhead of this approach is low, but not as low as inlining, and it may be beneficial to provide a mechanism for performance-sensitive code.
+\CFA polymorphic functions use dynamic virtual-dispatch;
+the runtime overhead of this approach is low, but not as low as inlining, and it may be beneficial to provide a mechanism for performance-sensitive code.
 Two promising approaches are an @inline@ annotation at polymorphic function call sites to create a template-specialization of the function (provided the code is visible), or an @inline@ annotation on polymorphic function-definitions to instantiate a specialized version for some set of types.
 These approaches are not mutually exclusive and allow performance optimizations to be applied only when necessary, without suffering global code-bloat.
 …
 \begin{acks}
 The authors would like to recognize the design assistance of Glen Ditchfield, Richard Bilson, and Thierry Delisle on the features described in this paper. They also thank Magnus Madsen and three anonymous reviewers for valuable editorial feedback.
 This work is supported in part by a corporate partnership with \grantsponsor{Huawei}{Huawei Ltd.}{http://www.huawei.com}\ and the first author's \grantsponsor{NSERC-PGS}{NSERC PGS D}{http://www.nserc-crsng.gc.ca/Students-Etudiants/PG-CS/BellandPostgrad-BelletSuperieures_eng.asp} scholarship.
+The authors would like to recognize the design assistance of Glen Ditchfield, Richard Bilson, and Thierry Delisle on the features described in this paper, and thank Magnus Madsen and the three anonymous reviewers for valuable feedback.
+This work is supported in part by a corporate partnership with \grantsponsor{Huawei}{Huawei Ltd.}{http://www.huawei.com}, and Aaron Moss and Peter Buhr are funded by the \grantsponsor{NSERC}{Natural Sciences and Engineering Research Council of Canada}{http://www.nserc-crsng.gc.ca}.
+% the first author's \grantsponsor{NSERC-PGS}{NSERC PGS D}{http://www.nserc-crsng.gc.ca/Students-Etudiants/PG-CS/BellandPostgrad-BelletSuperieures_eng.asp} scholarship.
 \end{acks}
 …
 \appendix
 \section{Benchmark Interfaces}
 \label{sec:BenchmarkInterfaces}
+\section{Benchmark Stack Implementation}
+\label{sec:BenchmarkStackImplementation}
 \lstset{basicstyle=\linespread{0.9}\sf\small}
+Throughout, @/***/@ designates a counted redundant type annotation.
+\medskip\noindent
 \CFA
 \begin{lstlisting}[xleftmargin=2\parindentlnth,aboveskip=0pt,belowskip=0pt]
+forall(otype T) struct stack_node;
+forall(otype T) struct stack { stack_node(T) * head; };
+forall(otype T) void ?{}(stack(T) * s);
+forall(otype T) void ?{}(stack(T) * s, stack(T) t);
+forall(otype T) stack(T) ?=?(stack(T) * s, stack(T) t);
+forall(otype T) void ^?{}(stack(T) * s);
+forall(otype T) _Bool empty(const stack(T) * s);
+forall(otype T) void push(stack(T) * s, T value);
+forall(otype T) T pop(stack(T) * s);
+forall(otype T) void clear(stack(T) * s);
+void print( FILE * out, const char * x );
+void print( FILE * out, _Bool x );
+void print( FILE * out, char x );
+void print( FILE * out, int x );
+forall(otype T, ttype Params | { void print( FILE *, T ); void print( FILE *, Params ); })
+        void print( FILE * out, T arg, Params rest );
+forall(otype R, otype S | { void print( FILE *, R ); void print( FILE *, S ); })
+        void print( FILE * out, pair(R, S) x );
+forall(otype T) struct stack_node {
+        T value;
+        stack_node(T) * next;
+};
+forall(otype T) void ?{}(stack(T) * s) { (&s->head){ 0 }; }
+forall(otype T) void ?{}(stack(T) * s, stack(T) t) {
+        stack_node(T) ** crnt = &s->head;
+        for ( stack_node(T) * next = t.head; next; next = next->next ) {
+                *crnt = ((stack_node(T) *)malloc()){ next->value }; /***/
+                stack_node(T) * acrnt = *crnt;
+                crnt = &acrnt->next;
+        }
+        *crnt = 0;
+}
+forall(otype T) stack(T) ?=?(stack(T) * s, stack(T) t) {
+        if ( s->head == t.head ) return *s;
+        clear(s);
+        s{ t };
+        return *s;
+}
+forall(otype T) void ^?{}(stack(T) * s) { clear(s); }
+forall(otype T) _Bool empty(const stack(T) * s) { return s->head == 0; }
+forall(otype T) void push(stack(T) * s, T value) {
+        s->head = ((stack_node(T) *)malloc()){ value, s->head }; /***/
+}
+forall(otype T) T pop(stack(T) * s) {
+        stack_node(T) * n = s->head;
+        s->head = n->next;
+        T x = n->value;
+        ^n{};
+        free(n);
+        return x;
+}
+forall(otype T) void clear(stack(T) * s) {
+        for ( stack_node(T) * next = s->head; next; ) {
+                stack_node(T) * crnt = next;
+                next = crnt->next;
+                delete(crnt);
+        }
+        s->head = 0;
+}
 \end{lstlisting}
 …
 \CC
 \begin{lstlisting}[xleftmargin=2\parindentlnth,aboveskip=0pt,belowskip=0pt]
+std::pair
+std::forward_list wrapped in std::stack interface
+template<typename T> void print(ostream& out, const T& x) { out << x; }
+template<> void print<bool>(ostream& out, const bool& x) { out << (x ? "true" : "false"); }
+template<> void print<char>(ostream& out, const char& x ) { out << "'" << x << "'"; }
+template<typename R, typename S> ostream& operator<< (ostream& out, const pair<R, S>& x) {
+        out << "["; print(out, x.first); out << ", "; print(out, x.second); return out << "]"; }
+template<typename T, typename... Args> void print(ostream& out, const T& arg, const Args&... rest) {
+        out << arg;     print(out, rest...); }
+template<typename T> class stack {
+        struct node {
+                T value;
+                node * next;
+                node( const T & v, node * n = nullptr ) : value(v), next(n) {}
+        };
+        node * head;
+        void copy(const stack<T>& o) {
+                node ** crnt = &head;
+                for ( node * next = o.head; next; next = next->next ) {
+                        *crnt = new node{ next->value }; /***/
+                        crnt = &(*crnt)->next;
+                }
+                *crnt = nullptr;
+        }
+  public:
+        stack() : head(nullptr) {}
+        stack(const stack<T>& o) { copy(o); }
+        stack(stack<T> && o) : head(o.head) { o.head = nullptr; }
+        ~stack() { clear(); }
+        stack & operator= (const stack<T>& o) {
+                if ( this == &o ) return *this;
+                clear();
+                copy(o);
+                return *this;
+        }
+        stack & operator= (stack<T> && o) {
+                if ( this == &o ) return *this;
+                head = o.head;
+                o.head = nullptr;
+                return *this;
+        }
+        bool empty() const { return head == nullptr; }
+        void push(const T & value) { head = new node{ value, head };  /***/ }
+        T pop() {
+                node * n = head;
+                head = n->next;
+                T x = std::move(n->value);
+                delete n;
+                return x;
+        }
+        void clear() {
+                for ( node * next = head; next; ) {
+                        node * crnt = next;
+                        next = crnt->next;
+                        delete crnt;
+                }
+                head = nullptr;
+        }
+};
 \end{lstlisting}
 …
+C
 \begin{lstlisting}[xleftmargin=2\parindentlnth,aboveskip=0pt,belowskip=0pt]
+struct pair { void * first, * second; };
+struct pair * new_pair( void * first, void * second );
+struct pair * copy_pair( const struct pair * src,
+        void * (*copy_first)( const void * ), void * (*copy_second)( const void * ) );
+void free_pair( struct pair * p, void (*free_first)( void * ), void (*free_second)( void * ) );
+int cmp_pair( const struct pair * a, const struct pair * b,
+        int (*cmp_first)( const void *, const void * ), int (*cmp_second)( const void *, const void * ) );
+struct stack_node;
+struct stack { struct stack_node * head; };
+struct stack new_stack();
+void copy_stack( struct stack * dst, const struct stack * src, void * (*copy)( const void * ) );
+void clear_stack( struct stack * s, void (*free_el)( void * ) );
+_Bool stack_empty( const struct stack * s );
+void push_stack( struct stack * s, void * value );
+void * pop_stack( struct stack * s );
+void print_string( FILE * out, const char * x );
+void print_bool( FILE * out, _Bool x );
+void print_char( FILE * out, char x );
+void print_int( FILE * out, int x );
+void print( FILE * out, const char * fmt, ... );
+struct stack_node {
+        void * value;
+        struct stack_node * next;
+};
+struct stack new_stack() { return (struct stack){ NULL }; /***/ }
+void copy_stack(struct stack * s, const struct stack * t, void * (*copy)(const void *)) {
+        struct stack_node ** crnt = &s->head;
+        for ( struct stack_node * next = t->head; next; next = next->next ) {
+                *crnt = malloc(sizeof(struct stack_node)); /***/
+                **crnt = (struct stack_node){ copy(next->value) }; /***/
+                crnt = &(*crnt)->next;
+        }
+        *crnt = 0;
+}
+_Bool stack_empty(const struct stack * s) { return s->head == NULL; }
+void push_stack(struct stack * s, void * value) {
+        struct stack_node * n = malloc(sizeof(struct stack_node)); /***/
+        *n = (struct stack_node){ value, s->head }; /***/
+        s->head = n;
+}
+void * pop_stack(struct stack * s) {
+        struct stack_node * n = s->head;
+        s->head = n->next;
+        void * x = n->value;
+        free(n);
+        return x;
+}
+void clear_stack(struct stack * s, void (*free_el)(void *)) {
+        for ( struct stack_node * next = s->head; next; ) {
+                struct stack_node * crnt = next;
+                next = crnt->next;
+                free_el(crnt->value);
+                free(crnt);
+        }
+        s->head = NULL;
+}
+\end{lstlisting}
+\medskip\noindent
+\CCV
+\begin{lstlisting}[xleftmargin=2\parindentlnth,aboveskip=0pt,belowskip=0pt]
+stack::node::node( const object & v, node * n ) : value( v.new_copy() ), next( n ) {}
+void stack::copy(const stack & o) {
+        node ** crnt = &head;
+        for ( node * next = o.head; next; next = next->next ) {
+                *crnt = new node{ *next->value };
+                crnt = &(*crnt)->next;
+        }
+        *crnt = nullptr;
+}
+stack::stack() : head(nullptr) {}
+stack::stack(const stack & o) { copy(o); }
+stack::stack(stack && o) : head(o.head) { o.head = nullptr; }
+stack::~stack() { clear(); }
+stack & stack::operator= (const stack & o) {
+        if ( this == &o ) return *this;
+        clear();
+        copy(o);
+        return *this;
+}
+stack & stack::operator= (stack && o) {
+        if ( this == &o ) return *this;
+        head = o.head;
+        o.head = nullptr;
+        return *this;
+}
+bool stack::empty() const { return head == nullptr; }
+void stack::push(const object & value) { head = new node{ value, head }; /***/ }
+ptr<object> stack::pop() {
+        node * n = head;
+        head = n->next;
+        ptr<object> x = std::move(n->value);
+        delete n;
+        return x;
+}
+void stack::clear() {
+        for ( node * next = head; next; ) {
+                node * crnt = next;
+                next = crnt->next;
+                delete crnt;
+        }
+        head = nullptr;
+}
 \end{lstlisting}
 \begin{comment}
-Throughout, @/***/@ designates a counted redundant type annotation.
 \subsubsection{bench.h}

Note: See TracChangeset for help on using the changeset viewer.

Download in other formats: