source: doc/theses/jiada_liang_MMath/trait.tex@ 38e17b0

Last change on this file since 38e17b0 was 0bda8d7, checked in by JiadaL <j82liang@…>, 13 months ago

Small updates

  • Property mode set to 100644
File size: 15.6 KB
RevLine 
[38e20a80]1\chapter{Enumeration Traits}
2\label{c:trait}
[956299b]3
[8cb2ff6]4\CC introduced the @std::is_enum@ trait in \CC{11} and concept feature in \CC{20}.
[aa14aafe]5This combination makes it possible to write a polymorphic function over an enumerated type.
[8cb2ff6]6\begin{c++}
[21f4dff]7#include <type_traits>
[8cb2ff6]8template<typename T> @concept Enumerable@ = std::is_enum<T>::value;
[aa14aafe]9template<@Enumerable@ E> E f( E e ) { $\C{// constrained type}$
10 E w = e; $\C{// allocation and copy}$
[8cb2ff6]11 cout << e << ' ' << w << endl; $\C{// value}$
12 return w; $\C{// copy}$
13}
14int main() {
15 enum E { A = 42, B, C } e = C;
16 e = f( e );
17}
1844 44
19\end{c++}
[0bda8d7]20The @std::is_enum@ and other \CC @traits@ are compile-time interfaces to query type information.
21While named the same as @trait@ in other programming languages, it is orthogonal to the \CFA trait, with the latter being defined as a collection of assertions to be satisfied by a polymorphic type.
[21f4dff]22
[8cb2ff6]23The following sections cover the underlying implementation features I created to generalize and restrict enumerations in the \CFA type-system using the @trait@ mechanism.
[21f4dff]24
[d1276f8]25
[aa14aafe]26\section{Traits \texorpdfstring{\lstinline{CfaEnum}}{CfaEnum} and \texorpdfstring{\lstinline{TypedEnum}}{TypedEnum}}
[8cb2ff6]27
28Traits @CfaEnum@ and @TypedEnum@ define the enumeration attributes: @label@, @posn@, @value@, and @Countof@.
29These traits support polymorphic functions for \CFA enumeration, \eg:
[21f4dff]30\begin{cfa}
[8cb2ff6]31forall( E ) | @CfaEnum( E )@ )
32void f( E e ) {
33 // access enumeration properties for e
34}
[21f4dff]35\end{cfa}
[aa14aafe]36\newpage
[0bda8d7]37Trait @CfaEnum@ defines attribute functions @label@ and @posn@ for all \CFA enumerations, and internally \CFA enumerations fulfill this assertion.
[d1276f8]38\begin{cfa}
39forall( E ) trait CfaEnum {
40 const char * @label@( E e );
41 unsigned int @posn@( E e );
42};
43\end{cfa}
[8cb2ff6]44This trait covers opaque enumerations that do not have an explicit @value@.
[d1276f8]45
[8cb2ff6]46The trait @TypedEnum@ extends @CfaEnum@ with the @value@ assertion for typed enumerations.
[d1276f8]47\begin{cfa}
48forall( E, V | CfaEnum( E ) ) trait TypedEnum {
49 V @value@( E e );
50};
51\end{cfa}
[8cb2ff6]52Here, the associate type-parameter @V@ is the base type of the typed enumeration, and hence, the return type of @value@.
53These two traits provide a way to define functions over all \CFA enumerations.
[d1276f8]54
[8cb2ff6]55For example, \VRef[Figure]{f:GeneralizedEnumerationFormatter} shows a generalized enumeration formatter for any enumeration type.
56The formatter prints an enumerator name and its value in the form @"label( value )"@.
[0bda8d7]57The trait for @format_enum@ requires a function named @str@ to print the value (payload) of the enumerator.
58Hence, enumeration defines how its value appears, and @format_enum@ displays this value within the label name.
[38e20a80]59
[8cb2ff6]60\begin{figure}
61\begin{cfa}
62forall( @E, V | TypedEnum( E, V )@ | { string str( V ); } ) $\C{// format any enumeration}$
63string format_enum( E e ) {
64 return label( e ) + '(' + str( value( e ) ) + ')'; $\C{// "label( value )"}$
[d1276f8]65}
[8cb2ff6]66enum(size_t) RGB { Red = 0xFF0000, Green = 0x00FF00, Blue = 0x0000FF };
67// string library has conversion function str from size_t to string
68
69struct color_code { int R, G, B; };
[38e20a80]70enum(color_code) Rainbow {
[8cb2ff6]71 Red = {255, 0, 0}, Orange = {255, 127, 0}, Yellow = {255, 255, 0}, Green = {0, 255, 0}, // ...
[38e20a80]72};
[8cb2ff6]73string str( color_code cc ) with( cc ) { $\C{// format payload, "ddd,ddd,ddd"}$
74 return str( R ) + ',' + str( G ) + ',' + str( B ); $\C{// "R,G,B"}$
75}
76int main() {
77 sout | format_enum( RGB.Green ); $\C{// "Green(65280)"}$
78 sout | format_enum( Rainbow.Green ); $\C{// "Green(0,255,0)"}$
79}
[d1276f8]80\end{cfa}
[8cb2ff6]81\caption{Generalized Enumeration Formatter}
82\label{f:GeneralizedEnumerationFormatter}
83\end{figure}
[d1276f8]84
[8cb2ff6]85Other types may work with traits @CfaEnum@ and @TypedEnum@, by supplying appropriate @label@, @posn@, and @value@ functions.
[4c63025]86For example, \VRef[Figure]{f:ExtendCEnumeration} extends a (possibly predefined) C enumeration to work with all the \CFA extensions.
[38e20a80]87
[8cb2ff6]88\begin{figure}
[d1276f8]89\begin{cfa}
[8cb2ff6]90enum Fruit { Apple, Banana, Cherry }; $\C{// C enum}$
91const char * @label@( Fruit f ) {
92 static const char * labels[] = { "Apple", "Banana", "Cherry" };
93 return labels[f];
[d1276f8]94}
[8cb2ff6]95int @posn@( Fruit f ) { return f; }
96int @value@( Fruit f ) {
97 static const char values[] = { 'a', 'b', 'c' };
98 return values[f];
[38e20a80]99}
[8cb2ff6]100sout | format_enum( Cherry ); $\C{// "Cherry(c)"}$
[d1276f8]101\end{cfa}
[4c63025]102\caption{Extend C Enumeration to \CFA Enumeration}
103\label{f:ExtendCEnumeration}
[8cb2ff6]104\end{figure}
[d1276f8]105
[6740533e]106
[8cb2ff6]107\section{Discussion: Genericity}
108
[aa14aafe]109At the start of this chapter, the \CC concept is introduced to constrained template types, \eg:
[8cb2ff6]110\begin{c++}
111concept Enumerable = std::is_enum<T>::value;
112\end{c++}
113Here, @concept@ is referring directly to types with kind @enum@;
114other @concept@s can refer to all types with kind @int@ with @long@ or @long long@ qualifiers, \etc.
[0bda8d7]115Hence, the @concept@ is the first level of restriction, allowing only the specified kinds of types and rejecting others.
[8cb2ff6]116The template expansion is the second level of restriction verifying if the type passing the @concept@ test provides the necessary functionality.
117Hence, a @concept@ is querying precise aspects of the programming language set of types.
118
119Alternatively, languages using traits, like \CFA, Scala, Go, and Rust, are defining a restriction based on a set of operations, variables, or structure fields that must exist to match with usages in a function or aggregate type.
[0bda8d7]120Hence, the \CFA enumeration traits are never connected with the specific @enum@ kind.
[aa14aafe]121Instead, anything that can look like the @enum@ kind is considered an enumeration (static structural typing).
[dcfcf368]122However, Scala, Go, and Rust traits are nominative: a type explicitly declares a named trait to be of its type, while in \CFA, any type implementing all requirements declared in a trait implicitly satisfy its restrictions.
[8cb2ff6]123
124One of the key differences between concepts and traits, which is leveraged heavily by \CFA, is the ability to apply new \CFA features to C legacy code.
125For example, \VRef[Figure]{f:GeneralizedEnumerationFormatter} shows that pre-existing C enumerations can be upgraded to work and play with new \CFA enumeration facilities.
126Another example is adding constructors and destructors to pre-existing C types by simply declaring them for the old C type.
[aa14aafe]127\CC fails at certain levels of legacy extension because many of the new \CC features must appear \emph{within} an aggregate definition due to the object-oriented nature of the type system, where it is impossible to change legacy library types.
[6740533e]128
129
130\section{Bounded and Serial}
[8cb2ff6]131
132A bounded trait defines a lower and upper bound for a type.
[d1276f8]133\begin{cfa}
134forall( E ) trait Bounded {
[38e20a80]135 E lowerBound();
[aa14aafe]136 E upperBound();
[d1276f8]137};
138\end{cfa}
[8cb2ff6]139Both functions are necessary for the implementation of \CFA enumeration, with @lowerBound@ returning the first enumerator and @upperBound@ returning the last enumerator.
[d1276f8]140\begin{cfa}
[8cb2ff6]141enum(int) Week { Mon, Tue, Wed, Thu, Fri, Sat, Sun };
142enum(int) Fruit { Apple, Banana, Cherry };
143Week first_day = lowerBound(); $\C{// Mon}$
144Fruit last_fruit = upperBound(); $\C{// Cherry}$
[d1276f8]145\end{cfa}
[0bda8d7]146The @lowerBound@ and @upperBound@ are functions overloaded on return type only, meaning their type resolution depends solely on the call-site context, such as the parameter type for a function argument or the left-hand side of an assignment expression.
[8cb2ff6]147Calling either function without a context results in a type ambiguity, unless the type environment has only one type overloading the functions.
[d1276f8]148\begin{cfa}
[8cb2ff6]149sout | @lowerBound()@; $\C[2.5in]{// ambiguous as Week and Fruit implement Bounded}$
150void foo( Fruit );
151foo( lowerBound() ); $\C{// parameter provides type Fruit}$
152Week day = upperBound(); $\C{// day provides type Week}\CRT$
[d1276f8]153\end{cfa}
154
[8cb2ff6]155Trait @Serial@ is a subset of @Bounded@, with functions mapping enumerators to integers, and implementing a sequential order between enumerators.
[d1276f8]156\begin{cfa}
157forall( E | Bounded( E ) ) trait Serial {
[8cb2ff6]158 int fromInstance( E e );
[38e20a80]159 E fromInt( unsigned int i );
[d1276f8]160 E pred( E e );
[8cb2ff6]161 E succ( E e );
162 unsigned Countof( E );
[d1276f8]163};
164\end{cfa}
[8cb2ff6]165Function @fromInstance@ projects a @Bounded@ member to a number and @fromInt@ is the inverse.
[92a0ee8]166Function @pred@ and @succ@ are advancement functions:
167@pred@ takes an enumerator and returns the previous enumerator, if there is one, in sequential order, and @succ@ returns the next enumerator.
[38e20a80]168\begin{cfa}
[8cb2ff6]169sout | fromInstance( Wed ) | fromInt( 2 ) | succ( Wed ) | pred( Wed );
1702 Wed Thu Tue
[38e20a80]171\end{cfa}
[8cb2ff6]172Bound checking is provided for @fromInt@, @pred@, and @succ@, and the program is terminated if the lower or upper bound is exceeded, \eg:
173\begin{cfa}
174fromInt( 100 );
175Cforall Runtime error: call to fromInt has index 100 outside of enumeration range 0-6.
176\end{cfa}
177Function @fromInstance@ or a position cast using @(int)@ is always safe, \ie within the enumeration range.
178
[0bda8d7]179Function @Countof@ is the generic counterpart to the built-in pseudo-function @countof@.
[8cb2ff6]180@countof@ only works on enumeration types and instances, so it is locked into the language type system;
181as such, @countof( enum-type)@ becomes a compile-time constant.
[0bda8d7]182@Countof@ works on any type that matches the @Serial@ trait.
[8cb2ff6]183Hence, @Countof@ does not use its argument;
184only the parameter type is needed to compute the range size.
185\begin{cfa}
186int Countof( E ) {
187 E upper = upperBound();
188 E lower = lowerBound();
[aa14aafe]189 return fromInstance( upper ) - fromInstance( lower ) + 1;
[8cb2ff6]190}
191\end{cfa}
192
193@countof@ also works for any type @E@ that defines @Countof@ and @lowerBound@, becoming a call to @Countof( E )@.
194The resolution step on expression @countof( E )@ are:
[38e20a80]195\begin{enumerate}
[8cb2ff6]196\item Look for an enumeration named @E@, such as @enum E {... }@.
197If such an enumeration @E@ exists, replace @countof( E )@ with the number of enumerators.
198\item Look for a non-enumeration type named @E@ that defines @Countof@ and @lowerBound@, including @E@ being a polymorphic type, such as @forall( E )@.
[0bda8d7]199If type @E@ exists, replace it with @Countof(lowerBound())@, where @lowerBound@ is defined for type @E@.
[8cb2ff6]200\item Look for an enumerator @A@ defined in enumeration @E@.
201If such an enumerator @A@ exists, replace @countof( A )@ with the number of enumerators in @E@.
[0bda8d7]202\item Look for a name @A@ in the lexical context with the type @E@.
203If the name @A@ exists, replace @countof( A )@ with a function call @Countof( E )@.
[8cb2ff6]204\item If 1-4 fail, report a type error on expression @countof( E )@.
[38e20a80]205\end{enumerate}
206
[8cb2ff6]207
208\section{Enumerating}
209
210The fundamental aspect of an enumeration type is the ability to enumerate over its enumerators.
[0bda8d7]211\CFA supports \newterm{for} loops, \newterm{while} loop, and \newterm{range} loop. This section covers @for@ loops and @range@ loops for enumeration, but the concept transitions to @while@ loop.
[8cb2ff6]212
[96de72b]213
214\subsection{For Loop}
[38e20a80]215
[8cb2ff6]216A for-loop consists of loop control and body.
[aa14aafe]217The loop control is often a 3-tuple: initializers, looping condition, and advancement.
[0bda8d7]218It is a common practice to declare one or more loop-index variables in initializers, whether the variables satisfy the loop condition, and update the variables in advancement.
[8cb2ff6]219Such a variable is called an \newterm{index} and is available for reading and writing within the loop body.
220(Some languages make the index read-only in the loop body.)
221This style of iteration can be written for an enumeration using functions from the @Bounded@ and @Serial@ traits:
[96de72b]222\begin{cfa}
[8cb2ff6]223enum() E { A, B, C, D };
224for ( unsigned int i = 0; i < countof(E); i += 1 ) $\C{// (1)}$
225 sout | label( fromInt( i ) ) | nonl;
226sout | nl;
227for ( E e = lowerBound(); ; e = succ(e) ) { $\C{// (2)}$
228 sout | label(e) | nonl;
229 if (e == upperBound()) break;
[38e20a80]230}
[8cb2ff6]231sout | nl;
232A B C D
233A B C D
[38e20a80]234\end{cfa}
[d1276f8]235
[8cb2ff6]236A caveat in writing loop control using @pred@ and @succ@ is unintentionally exceeding the range.
[96de72b]237\begin{cfa}
[8cb2ff6]238for ( E e = upperBound(); e >= lowerBound(); e = pred( e ) ) {}
239for ( E e = lowerBound(); e <= upperBound(); e = succ( e ) ) {}
[96de72b]240\end{cfa}
[0bda8d7]241Both of these loops look correct but fail because there is an additional bound check within the advancement \emph{before} the conditional test to stop the loop, resulting in a failure at the endpoints of the iteration.
[aa14aafe]242These loops must be restructured by moving the loop test to the end of the loop (@do-while@), as in loop (2) above, which is safe because an enumeration always has at least one enumerator.
[96de72b]243
244
245\subsection{Range Loop}
[8cb2ff6]246
247Instead of writing the traditional 3-tuple loop control, \CFA supports a \newterm{range loop}.
248\begin{cfa}
249for ( @E e; A ~= D@ ) { sout | label( e ) | nonl; } sout | nl;
250for ( @e; A ~= D@ ) { sout | label( e ) | nonl; } sout | nl;
251for ( @E e; A -~= D@ ) { sout | label( e ) | nonl; } sout | nl;
252for ( @e; A -~= D ~ 2@ ) { sout | label( e ) | nonl; } sout | nl;
[96de72b]253\end{cfa}
[8cb2ff6]254Every range loop above has an index declaration and a @range@ bounded by \newterm{left bound} @A@ and \newterm{right bound} @D@.
255If the index declaration-type is omitted, the index type is the type of the lower bound (@typeof( A )@).
256If a range is joined by @~=@ (range up equal) operator, the index variable is initialized by the left bound and advanced by 1 until it is greater than the right bound.
257If a range is joined by @-~=@ (range down equal) operator, the index variable is initialized by the right bound and advanced by -1 until it is less than the left bound.
258(Note, functions @pred@ and @succ@ are not used for advancement, so the advancement problem does not occur.)
259A range can be suffixed by a positive \newterm{step}, \eg @~ 2@, so advancement is incremented/decremented by step.
260
261Finally, a shorthand for enumerating over the entire set of enumerators (the most common case) is using the enumeration type for the range.
262\begin{cfa}
263for ( e; @E@ ) sout | label( e ) | nonl; sout | nl; $\C{// A B C D}$
264for ( e; @-~= E@ ) sout | label( e ) | nonl; sout | nl; $\C{// D C B A}$
[96de72b]265\end{cfa}
[8cb2ff6]266For a \CFA enumeration, the loop enumerates over all enumerators of the enumeration.
267For a type matching the @Serial@ trait: the index variable is initialized to @lowerBound@ and loop control checks the index's value for greater than the @upperBound@.
268If the range type is not a \CFA enumeration or does not match trait @Serial@, it is compile-time error.
269
[96de72b]270
271\section{Overload Operators}
[8cb2ff6]272
273\CFA overloads the comparison operators for \CFA enumeration satisfying traits @Serial@ and @CfaEnum@.
[0bda8d7]274These definitions require the operand types to be the same, and the appropriate comparison is made using the the positions of the operands.
[d1276f8]275\begin{cfa}
[8cb2ff6]276forall( E | CfaEnum( E ) | Serial( E ) ) @{@ $\C{// distribution block}$
[d1276f8]277 // comparison
278 int ?==?( E l, E r ); $\C{// true if l and r are same enumerators}$
279 int ?!=?( E l, E r ); $\C{// true if l and r are different enumerators}$
280 int ?<?( E l, E r ); $\C{// true if l is an enumerator before r}$
281 int ?<=?( E l, E r ); $\C{// true if l before or the same as r}$
282 int ?>?( E l, E r ); $\C{// true if l is an enumerator after r}$
[96de72b]283 int ?>=?( E l, E r ); $\C{// true if l after or the same as r}$
[8cb2ff6]284@}@
[d1276f8]285\end{cfa}
[0bda8d7]286(Note, all the function prototypes are wrapped in a distribution block, where all qualifiers preceding the block are distributed to each declaration with the block, which eliminates tedious repeated qualification.
[8cb2ff6]287Distribution blocks can be nested.)
[d1276f8]288
[8cb2ff6]289\CFA implements a few arithmetic operators for @CfaEnum@.
[aa14aafe]290% Unlike advancement functions in @Serial@, these operators perform direct arithmetic, so there is no implicit bound checks.
[0bda8d7]291Bound checks are added to these operations to ensure the outputs fulfill the @Bounded@ invariant.
[96de72b]292\begin{cfa}
[8cb2ff6]293forall( E | CfaEnum( E ) | Serial( E ) ) { $\C{// distribution block}$
[96de72b]294 // comparison
295 E ++?( E & l );
296 E --?( E & l );
297 E ?+=? ( E & l, one_t );
298 E ?-=? ( E & l, one_t );
299 E ?+=? ( E & l, int i );
300 E ?-=? ( E & l, int i );
301 E ?++( E & l );
302 E ?--( E & l );
303}
304\end{cfa}
[d1276f8]305
[8cb2ff6]306Lastly, \CFA does not define @zero_t@ for \CFA enumeration.
307Users can define the boolean @false@ for \CFA enumerations on their own, \eg:
[d1276f8]308\begin{cfa}
[8cb2ff6]309forall( E | CfaEnum( E ) )
310int ?!=?( E lhs, zero_t ) {
311 return posn( lhs ) != 0;
[d1276f8]312}
313\end{cfa}
[0bda8d7]314which effectively turns the first enumeration into a logical @false@ and @true@ for the others.
Note: See TracBrowser for help on using the repository browser.