source: doc/theses/jiada_liang_MMath/CFAenum.tex @ 02101a4

Last change on this file since 02101a4 was 29c8675, checked in by JiadaL <j82liang@…>, 2 months ago

update thesis

  • Property mode set to 100644
File size: 29.5 KB
Line 
1\chapter{\texorpdfstring{\CFA}{Cforall} Enumeration}
2
3\CFA extends C-Style enumeration by adding a number of new features that bring enumerations in line with other modern programming languages.
4Any enumeration extensions must be intuitive to C programmers in syntax and semantics.
5The following sections detail my new contributions to enumerations in \CFA.
6
7
8\section{Syntax}
9
10\CFA extends the C enumeration declaration \see{\VRef{s:CEnumeration}} by parameterizing with a type (like a generic type) and adding Plan-9 inheritance \see{\VRef{s:CFAInheritance}} using an @inline@ to another enumeration type.
11\begin{cfa}[identifierstyle=\linespread{0.9}\it]
12$\it enum$-specifier:
13        enum @(type-specifier$\(_{opt}\)$)@ identifier$\(_{opt}\)$ { cfa-enumerator-list }
14        enum @(type-specifier$\(_{opt}\)$)@ identifier$\(_{opt}\)$ { cfa-enumerator-list , }
15        enum @(type-specifier$\(_{opt}\)$)@ identifier
16cfa-enumerator-list:
17        cfa-enumerator
18        cfa-enumerator-list, cfa-enumerator
19cfa-enumerator:
20        enumeration-constant
21        @inline $\color{red}enum$-type-name@
22        enumeration-constant = constant-expression
23\end{cfa}
24
25
26\section{Operations}
27
28\CFA enumerations have access to the three enumeration properties \see{\VRef{s:Terminology}}: label, order (position), and value via three overloaded functions @label@, @posn@, and @value@ \see{\VRef{c:trait} for details}.
29\CFA auto-generates these functions for every \CFA enumeration.
30\begin{cfa}
31enum(int) E { A = 3 } e = A;
32sout | A | @label@( A ) | @posn@( A ) | @value@( A );
33sout | e | @label@( e ) | @posn@( e ) | @value@( e );
34A A 0 3
35A A 0 3
36\end{cfa}
37For output, the default is to print the label.
38An alternate way to get an enumerator's position is to cast it to @int@.
39\begin{cfa}
40sout | A | label( A ) | @(int)A@ | value( A );
41sout | A | label( A ) | @(int)A@ | value( A );
42A A @0@ 3
43A A @0@ 3
44\end{cfa}
45Finally, \CFA introduces an additional enumeration pseudo-function @countof@ (like @sizeof@, @typeof@) that returns the number of enumerators in an enumeration.
46\begin{cfa}
47enum(int) E { A, B, C, D } e;
48countof( E )// 4, type argument
49countof( e )// 4, variable argument
50\end{cfa}
51This built-in function replaces the C idiom for automatically computing the number of enumerators \see{\VRef{s:Usage}}.
52\begin{cfa}
53enum E { A, B, C, D, @N@ };  // N == 4
54\end{cfa}
55
56\section{Opaque Enumeration}
57\label{s:OpaqueEnum}
58
59When an enumeration type is empty, it is an \newterm{opaque} enumeration.
60\begin{cfa}
61enum@()@ Mode { O_RDONLY, O_WRONLY, O_CREAT, O_TRUNC, O_APPEND };
62\end{cfa}
63Here, the compiler chooses the internal representation, which is hidden, so the enumerators cannot be initialized.
64Compared to the C enum, opaque enums are more restrictive regarding typing and cannot be implicitly converted to integers.
65\begin{cfa}
66Mode mode = O_RDONLY;
67int www @=@ mode;                                               $\C{// disallowed}$
68\end{cfa}
69Opaque enumerations have only two attribute properties, @label@ and @posn@.
70\begin{cfa}
71char * s = label( O_TRUNC );                    $\C{// "O\_TRUNC"}$
72int open = posn( O_WRONLY );                    $\C{// 1}$
73\end{cfa}
74Equality and relational operations are available.
75\begin{cfa}
76if ( mode @==@ O_CREAT ) ...
77bool b = mode @<@ O_APPEND;
78\end{cfa}
79
80
81\section{Typed Enumeration}
82\label{s:EnumeratorTyping}
83
84When an enumeration type is specified, all enumerators have that type and can be initialized with constants of that type or compile-time convertible to that type.
85Figure~\ref{f:EumeratorTyping} shows a series of examples illustrating that all \CFA types can be used with an enumeration, and each type's values are used to set the enumerator constants.
86Note the use of the synonyms @Liz@ and @Beth@ in the last declaration.
87Because enumerators are constants, the enumeration type is implicitly @const@, so all the enumerator types in Figure~\ref{f:EumeratorTyping} are logically rewritten with @const@.
88
89\begin{figure}
90\begin{cfa}
91// integral
92        enum( @char@ ) Currency { Dollar = '$\textdollar$', Cent = '$\textcent$', Yen = '$\textyen$', Pound = '$\textsterling$', Euro = 'E' };
93        enum( @signed char@ ) srgb { Red = -1, Green = 0, Blue = 1 };
94        enum( @long long int@ ) BigNum { X = 123_456_789_012_345,  Y = 345_012_789_456_123 };
95// non-integral
96        enum( @double@ ) Math { PI_2 = 1.570796, PI = 3.141597, E = 2.718282 };
97        enum( @_Complex@ ) Plane { X = 1.5+3.4i, Y = 7+3i, Z = 0+0.5i };
98// pointer
99        enum( @char *@ ) Name { Fred = "FRED", Mary = "MARY", Jane = "JANE" };
100        int i, j, k;
101        enum( @int *@ ) ptr { I = &i,  J = &j,  K = &k };
102        enum( @int &@ ) ref { I = i,   J = j,   K = k };
103// tuple
104        enum( @[int, int]@ ) { T = [ 1, 2 ] }; $\C{// new \CFA type}$
105// function
106        void f() {...}   void g() {...}
107        enum( @void (*)()@ ) funs { F = f,  G = g };
108// aggregate
109        struct Person { char * name; int age, height; };
110        enum( @Person@ ) friends { @Liz@ = { "ELIZABETH", 22, 170 }, @Beth@ = Liz,
111                                                                        Jon = { "JONATHAN", 35, 190 } };
112\end{cfa}
113% synonym feature unimplemented
114\caption{Enumerator Typing}
115\label{f:EumeratorTyping}
116\end{figure}
117
118An advantage of the typed enumerations is eliminating the \emph{harmonizing} problem between an enumeration and companion data \see{\VRef{s:Usage}}:
119\begin{cfa}
120enum( char * ) integral_types {
121        chr = "char", schar = "signed char", uschar = "unsigned char",
122        sshort = "signed short int", ushort = "unsigned short int",
123        sint = "signed int", usint = "unsigned int",
124        ...
125};
126\end{cfa}
127Note that the enumeration type can be a structure (see @Person@ in Figure~\ref{f:EumeratorTyping}), so it is possible to have the equivalent of multiple arrays of companion data using an array of structures.
128
129While the enumeration type can be any C aggregate, the aggregate's \CFA constructors are \emph{not} used to evaluate an enumerator's value.
130\CFA enumeration constants are compile-time values (static);
131calling constructors happens at runtime (dynamic).
132
133\section{Implementation}
134\CFA-cc is a transpiler that translates \CFA code into C, which can later be compiled by a C compiler.
135
136During the transpilation, \CFA-cc breaks a \CFA enumeration definition into a definition of a C enumeration with the same name and auxiliary arrays: a label array and a value array for a typed enumeration.
137For example:
138\begin{cfa}
139// CFA (source):
140enum(T) E { E1=t1, E2=t2, E3=t3 };
141\end{cfa}
142is compiled into:
143\begin{cfa}
144// C (transpiled by cfa-cc):
145enum E { E1, E2, E3 };
146const char * E_labels[3] = { "E1", "E2", "E3" };
147const T E_values [3] = { t1, t2, t3 };
148\end{cfa}
149The generated C enumeration will have enumerator values equal to their positions thanks to C's auto-initialization scheme. Notice that value and label arrays are dynamically allocated data structures that take up
150memory. If an enumeration is globally defined, the arrays are allocated in the @.data@ section and will be initialized before the program execution.
151Otherwise, if an enumeration has its definition in a local scope, these arrays will be allocated on the stack and be initialized when the program counter
152reaches the code location of the enumeration definition.
153
154% This bring a considerable overhead to the program, in terms of both execution time and storage.
155% An opaque enumeration has no overhead
156% for values, and it has been suggested as a future work to leave as an option to not generate the label array.
157
158Along with the enumeration definition, \CFA-cc adds definitions of attribute functions: @posn@, @label@ and @value@:
159\begin{cfa}
160inline int posn( E e ) { return (int) e; }
161inline const * label( E e ) { return E_labels[ (int) e ]; }
162inline const * E_value( E e ) { return E_values[ (int) e ]; }
163\end{cfa}
164These functions are not implemented in \CFA code: they are Abstract Syntax Tree (AST) nodes appended to the AST.
165Notably, the AST subnode for the ``cast to @int@'' expression inside the functions is annotated as a reinterpreted cast.
166In other words, the effect of a cast is only to change the type of an expression, and it stops further reduction on the expression \see{\VRef{s:ValueConversion}}.
167
168Consequently, \CFA enumeration comes with space and runtime overhead, both for enumeration definitions and function calls to attribute functions. \CFA made efforts to reduce the runtime
169overhead on function calls by aggressively reducing @label()@ and @value()@ function calls on an enumeration constant to a constant expression. The reinterpreted casts are extraneous
170after type checking and removed in later steps. A @label()@ or @value()@ call on an enumeration variable is a lookup of an element of an array of constant values, and it is up to the
171C compiler to optimize its runtime. While OpaqueEnum is effectively an ``opt-out'' of the value overhead, it has been suggested that an option to ``opt-out'' from labels be added as well.
172A @label()@ function definition is still necessary to accomplish enumeration traits. But it will return an empty string for an enumeration label when ``opt-out'' or the enumerator name
173when it is called on an enumeration constant. It will allow a user not to pay the overhead for labels when the enumerator names of a particular enumerated type are not helpful.
174
175\section{Value Conversion}
176\label{s:ValueConversion}
177C has an implicit type conversion from an enumerator to its base type @int@.
178Correspondingly, \CFA has an implicit conversion from a typed enumerator to its base type, allowing typed enumeration to be seamlessly used as the value of its base type.
179For example, using type @Currency@ in \VRef[Figure]{f:EumeratorTyping}:
180\begin{cfa}
181char currency = Dollar;         $\C{// implicit conversion to base type}$
182void foo( char );
183foo( Dollar );                          $\C{// implicit conversion to base type}$
184\end{cfa}
185The implicit conversion induces a \newterm{value cost}, which is a new category (8 tuple) in \CFA's conversion cost model \see{\VRef{s:ConversionCost}} to disambiguate function overloading over a \CFA enumeration and its base type.
186\begin{cfa}
187void baz( char ch );            $\C{// (1)}$
188void baz( Currency cu );        $\C{// (2)}$
189baz( Dollar );
190\end{cfa}
191While both @baz@ functions are applicable to the enumerator @Dollar@, @candidate (1)@ comes with a @value@ cost for the conversion to the enumeration's base type, while @candidate (2)@ has @zero@ cost.
192Hence, \CFA chooses the exact match.
193Value cost is defined to be a less significant factor than @unsafe@ but more significant than the other conversion costs: @(unsafe,@ {\color{red}@value@}@, poly, safe, sign, vars, specialization,@ @reference)@.
194\begin{cfa}
195void bar( @int@ );
196Math x = PI;                            $\C{// (1)}$
197double x = 5.5;                         $\C{// (2)}$
198bar( x );                                       $\C{// costs (1, 0, 0, 0, 0, 0, 0, 0) or (0, 1, 0, 0, 0, 0, 0, 0)}$
199\end{cfa}
200Here, the candidate (1) has a @value@ conversion cost to convert to the base type, while the candidate (2) has an @unsafe@ conversion from @double@ to @int@,
201which is a more expensive conversion.
202Hence, @bar( x )@ resolves @x@ as type @Math@.
203
204% \begin{cfa}
205% forall(T | @CfaEnum(T)@) void bar(T);
206%
207% bar(a);                                       $\C{// (3), with cost (0, 0, 1, 0, 0, 0, 0, 0)}$
208% \end{cfa}
209% % @Value@ is designed to be less significant than @poly@ to allow function being generic over \CFA enumeration (see ~\ref{c:trait}).
210% Being generic over @CfaEnum@ traits (a pre-defined interface for \CFA enums) is a practice in \CFA to implement functions over \CFA enumerations, as will see in chapter~\ref{c:trait}.
211% @Value@ is a being a more significant cost than @poly@ implies if a overloaeded function defined for @CfaEnum@ (and other generic type), \CFA always try to resolve it as a @CfaEnum@, rather to insert a @value@ conversion.
212
213
214\section{Auto Initialization}
215\CFA extends C's auto-initialization scheme to \CFA enumeration. For an enumeration type with base type T, the initialization scheme is the following:
216\begin{enumerate}
217\item The first enumerator is initialized with @T@'s @zero_t@.
218\item Every other enumerator is initialized with its previous enumerator's value ``+1'', where ``+1'' is defined in terms of overloaded operator @?+?(T, one_t)@.
219\end{enumerate}
220
221\begin{cfa}
222struct S { int i; };
223S ?+?( S & s, one_t ) { return s.i++; }
224void ?{}( S & s, zero_t ) { s.i = 0; }
225enum(S) E { A, B, C, D };
226\end{cfa}
227
228The restriction on C's enumeration initializers being constant expressions is relaxed for \CFA enumerations.
229Therefore, an enumerator initializer allows function calls like @?+?( S & s, one_t )@ and @?{}( S & s, zero_t )@.
230It is because the values of \CFA enumerators are not stored in the compiled enumeration body but in the @value@ array, which
231allows dynamic initialization.
232
233\section{Subset}
234
235An enumeration's type can be another enumeration.
236\begin{cfa}
237enum( char ) Letter { A = 'A', ..., Z = 'Z' };
238enum( @Letter@ ) Greek { Alph = @A@, Beta = @B@, Gamma = @G@, ..., Zeta = @Z@ }; // alphabet intersection
239\end{cfa}
240Enumeration @Greek@ may have more or fewer enumerators than @Letter@, but its enumerator values \emph{must} be from @Letter@.
241Therefore, the set of @Greek@ enumerator values is a subset of the @Letter@ enumerator values.
242@Greek@ is type compatible with enumeration @Letter@ because value conversions are inserted whenever @Greek@ is used in place of @Letter@.
243\begin{cfa}
244Letter l = A;                                           $\C{// allowed}$
245Greek g = Alph;                                         $\C{// allowed}$
246l = Alph;                                                       $\C{// allowed, conversion to base type}$
247g = A;                                                          $\C{// {\color{red}disallowed}}$
248void foo( Letter );
249foo( Beta );                                            $\C{// allowed, conversion to base type}$
250void bar( Greek );
251bar( A );                                                       $\C{// {\color{red}disallowed}}$
252\end{cfa}
253Hence, @Letter@ enumerators are not type-compatible with the @Greek@ enumeration, but the reverse is true.
254
255
256\section{Inheritance}
257\label{s:CFAInheritance}
258
259\CFA Plan-9 inheritance may be used with \CFA enumerations, where Plan-9 inheritance is containment inheritance with implicit unscoping (like a nested unnamed @struct@/@union@ in C).
260Containment is nominative: an enumeration inherits all enumerators from another enumeration by declaring an @inline statement@ in its enumerator lists.
261\begin{cfa}
262enum( char * ) Names { /* $\see{\VRef[Figure]{f:EumeratorTyping}}$ */  };
263enum( char * ) Names2 { @inline Names@, Jack = "JACK", Jill = "JILL" };
264enum( char * ) Names3 { @inline Names2@, Sue = "SUE", Tom = "TOM" };
265\end{cfa}
266In the preceding example, @Names2@ is defined with five enumerators, three of which are from @Names@ through containment, and two are self-declared.
267@Names3@ inherits all five members from @Names2@ and declares two additional enumerators.
268Hence, enumeration inheritance forms a subset relationship.
269Specifically, the inheritance relationship for the example above is:
270\begin{cfa}
271Names $\(\subset\)$ Names2 $\(\subset\)$ Names3 $\C{// enum type of Names}$
272\end{cfa}
273
274Inheritance can be nested, and a \CFA enumeration can inline enumerators from more than one \CFA enumeration, forming a tree-like hierarchy.
275However, the uniqueness of the enumeration name applies to enumerators, including those from supertypes, meaning an enumeration cannot name an enumerator with the same label as its subtype's members or inherit
276from multiple enumerations that have overlapping enumerator labels. Consequently, a new type cannot inherit from an enumeration and its supertype or two enumerations with a
277common supertype (the diamond problem) since such would unavoidably introduce duplicate enumerator labels.
278
279The base type must be consistent between subtype and supertype.
280When an enumeration inherits enumerators from another enumeration, it copies the enumerators' @value@ and @label@, even if the @value@ is auto-initialized.
281However, the position of the underlying representation is the order of the enumerator in the new enumeration.
282\begin{cfa}
283enum() E1 { B };                                                                        $\C{// B}$                                             
284enum() E2 { C, D };                                             $\C{// C D}$
285enum() E3 { inline E1, inline E2, E };  $\C{// {\color{red}[\(_{E1}\)} B {\color{red}]} {\color{red}[\(_{E2}\)} C D {\color{red}]} E}$
286enum() E4 { A, inline E3, F};                   $\C{// A {\color{blue}[\(_{E3}\)} {\color{red}[\(_{E1}\)} B {\color{red}]} {\color{red}[\(_{E2}\)} C D {\color{red}]} E {\color{blue}]} F}$
287\end{cfa}
288In the example, @B@ is at position 0 in @E1@ and @E3@, but position 1 in @E4@ as @A@ takes position 0 in @E4@.
289@C@ is at position 0 in @E2@, 1 in @E3@, and 2 in @E4@.
290@D@ is at position 1 in @E2@, 2 in @E3@, and 3 in @E4@.
291
292A subtype enumeration can be cast, or implicitly converted into its supertype, with a @safe@ cost, called \newterm{enumeration conversion}.
293\begin{cfa}
294enum E2 e2 = C;
295posn( e2 );                     $\C[1.75in]{// 0}$
296enum E3 e3 = e2;        $\C{// Assignment with enumeration conversion E2 to E3}$
297posn( e2 );                     $\C{// 1 cost}$
298void foo( E3 e );
299foo( e2 );                      $\C{// Type compatible with enumeration conversion E2 to E3}$
300posn( (E3)e2 );         $\C{// Explicit cast with enumeration conversion E2 to E3}$
301E3 e31 = B;                     $\C{// No conversion: E3.B}$
302posn( e31 );            $\C{// 0 cost}\CRT$
303\end{cfa}
304The last expression is unambiguous.
305While both @E1.B@ and @E3.B@ are valid candidates, @E1.B@ has an associated safe cost and @E3.B@ needs no conversion (@zero@ cost).
306\CFA selects the lowest cost candidate @E3.B@.
307
308For the given function prototypes, the following calls are valid.
309\begin{cquote}
310\begin{tabular}{ll}
311\begin{cfa}
312void f( Names );
313void g( Names2 );
314void h( Names3 );
315void j( const char * );
316\end{cfa}
317&
318\begin{cfa}
319f( Fred );
320g( Fred );   g( Jill );
321h( Fred );   h( Jill );   h( Sue );
322j( Fred );    j( Jill );    j( Sue );    j( "WILL" );
323\end{cfa}
324\end{tabular}
325\end{cquote}
326Note, the validity of calls is the same for call-by-reference as for call-by-value, and @const@ restrictions are the same as for other types.
327
328
329\subsection{Offset Calculation}
330
331As discussed in \VRef{s:OpaqueEnum}, \CFA chooses position as a representation of a \CFA enumeration variable.
332When a cast or implicit conversion moves an enumeration from subtype to supertype, the position can be unchanged or increase.
333\CFA determines the position offset with an \newterm{offset calculation} function.
334
335\begin{figure}
336\begin{cfa}
337struct Enumerator;
338struct CFAEnum { vector<variant<CFAEnum, Enumerator>> members; string name; };
339inline static bool operator==(CFAEnum& lhs, CFAEnum& rhs) { return lhs.name == rhs.name; }
340pair<bool, int> calculateEnumOffset(CFAEnum src, CFAEnum dst) {
341        int offset = 0;
342        if ( src == dst ) return make_pair(true, 0);
343        for ( auto v : dst.members ) {
344                if ( holds_alternative<Enumerator>(v) ) {
345                        offset++;
346                } else {
347                        auto m = get<CFAEnum>(v);
348                        if ( m == src ) @return@ make_pair( true, offset );
349                        auto dist = calculateEnumOffset( src, m );
350                        if ( dist.first ) {
351                                @return@ make_pair( true, offset + dist.second );
352                        } else {
353                                offset += dist.second;
354                        }
355                }
356        }
357        @return@ make_pair( false, offset );
358}
359\end{cfa}
360\caption{Compute Offset from Subtype Enumeration to a Supertype}
361\label{s:OffsetSubtypeSuperType}
362\end{figure}
363
364Figure~\ref{s:OffsetSubtypeSuperType} shows an outline of the offset calculation in \CC.
365Structure @CFAEnum@ represents the \CFA enumeration with a vector of variants of @CFAEnum@ or @Enumerator@.
366The algorithm takes two @CFAEnum@ parameters, @src@ and @dst@, with @src@ being the type of expression the conversion applies to, and @dst@ being the type the expression is cast to.
367The algorithm iterates over the members in @dst@ to find @src@.
368If a member is an enumerator of @dst@, the positions of all subsequent members are incremented by one.
369If the current member is @src@, the function returns true indicating \emph{found} and the accumulated offset.
370Otherwise, the algorithm recurses into the current @CFAEnum@ @m@ to check if @src@ is convertible to @m@.
371If @src@ is convertible to the current member @m@, this means @src@ is a subtype-of-subtype of @dst@.
372The offset between @src@ and @dst@ is the sum of the offset of @m@ in @dst@ and the offset of @src@ in @m@.
373If @src@ is not a subtype of @m@, the loop continues but with the offset shifted by the size of @m@.
374If the loop ends, then @src@ is not convertible to @dst@, and false is returned.
375
376
377\section{Control Structures}
378
379Enumerators can be used in multiple contexts.
380In most programming languages, an enumerator is implicitly converted to its value (like a typed macro substitution).
381However, enumerator synonyms and typed enumerations make this implicit conversion to value incorrect in some contexts.
382In these contexts, a programmer's intuition assumes an implicit conversion to position.
383
384For example, an intuitive use of enumerations is with the \CFA @switch@/@choose@ statement, where @choose@ performs an implicit @break@ rather than a fall-through at the end of a @case@ clause.
385(For this discussion, ignore the fact that @case@ requires a compile-time constant.)
386\begin{cfa}[belowskip=0pt]
387enum Count { First, Second, Third, Fourth };
388Count e;
389\end{cfa}
390\begin{cquote}
391\setlength{\tabcolsep}{15pt}
392\noindent
393\begin{tabular}{@{}ll@{}}
394\begin{cfa}[aboveskip=0pt]
395
396choose( e ) {
397        case @First@: ...;
398        case @Second@: ...;
399        case @Third@: ...;
400        case @Fourth@: ...;
401}
402\end{cfa}
403&
404\begin{cfa}[aboveskip=0pt]
405// rewrite
406choose( @value@( e ) ) {
407        case @value@( First ): ...;
408        case @value@( Second ): ...;
409        case @value@( Third ): ...;
410        case @value@( Fourth ): ...;
411}
412\end{cfa}
413\end{tabular}
414\end{cquote}
415Here, the intuitive code on the left is implicitly transformed into the standard implementation on the right, using the value of the enumeration variable and enumerators.
416However, this implementation is fragile, \eg if the enumeration is changed to:
417\begin{cfa}
418enum Count { First, Second, Third @= First@, Fourth };
419\end{cfa}
420making @Third == First@ and @Fourth == Second@, causing a compilation error because of duplicate @case@ clauses.
421To better match with programmer intuition, \CFA toggles between value and position semantics depending on the language context.
422For conditional clauses and switch statements, \CFA uses the robust position implementation.
423\begin{cfa}
424if ( @posn@( e ) < posn( Third ) ) ...
425choose( @posn@( e ) ) {
426        case @posn@( First ): ...;
427        case @posn@( Second ): ...;
428        case @posn@( Third ): ...;
429        case @posn@( Fourth ): ...;
430}
431\end{cfa}
432
433\CFA provides a special form of for-control for enumerating through an enumeration, where the range is a type.
434\begin{cfa}
435for ( cx; @Count@ ) { sout | cx | nonl; } sout | nl;
436for ( cx; ~= Count ) { sout | cx | nonl; } sout | nl;
437for ( cx; -~= Count ) { sout | cx | nonl; } sout | nl;
438First Second Third Fourth
439First Second Third Fourth
440Fourth Third Second First
441\end{cfa}
442The enumeration type is syntax sugar for looping over all enumerators and assigning each enumerator to the loop index, whose type is inferred from the range type.
443The prefix @+~=@ or @-~=@ iterate forward or backwards through the inclusive enumeration range, where no prefix defaults to @+~=@.
444
445C has an idiom for @if@ and loop predicates of comparing the predicate result ``not equal to 0''.
446\begin{cfa}
447if ( x + y /* != 0 */  ) ...
448while ( p /* != 0 */  ) ...
449\end{cfa}
450This idiom extends to enumerations because there is a boolean conversion in terms of the enumeration value, if and only if such a conversion is available.
451For example, such a conversion exists for all numerical types (integral and floating-point).
452It is possible to explicitly extend this idiom to any typed enumeration by overloading the @!=@ operator.
453\begin{cfa}
454bool ?!=?( Name n, zero_t ) { return n != Fred; }
455Name n = Mary;
456if ( n ) ... // result is true
457\end{cfa}
458Specialized meanings are also possible.
459\begin{cfa}
460enum(int) ErrorCode { Normal = 0, Slow = 1, Overheat = 1000, OutOfResource = 1001 };
461bool ?!=?( ErrorCode ec, zero_t ) { return ec >= Overheat; }
462ErrorCode code = ...;
463if ( code ) { problem(); }
464\end{cfa}
465
466
467\section{Dimension}
468
469\VRef{s:EnumeratorTyping} introduces the harmonizing problem between an enumeration and secondary information.
470When possible, using a typed enumeration for the secondary information is the best approach.
471However, there are times when combining these two types is not possible.
472For example, the secondary information might precede the enumeration and/or its type is needed directly to declare parameters of functions.
473In these cases, having secondary arrays of the enumeration size is necessary.
474
475To support some level of harmonizing in these cases, an array dimension can be defined using an enumerator type, and the enumerators used as subscripts.
476\begin{cfa}
477enum E1 { A, B, C, N }; // possibly predefined
478enum(int) E2 { A, B, C };
479float H1[N] = { [A] :$\footnotemark$ 3.4, [B] : 7.1, [C] : 0.01 }; // C
480float H2[@E2@] = { [A] : 3.4, [B] : 7.1, [C] : 0.01 }; // CFA
481\end{cfa}
482\footnotetext{C uses symbol \lstinline{'='} for designator initialization, but \CFA changes it to \lstinline{':'} because of problems with tuple syntax.}
483This approach is also necessary for a predefined typed enumeration (unchangeable), when additional secondary-information needs to be added.
484The array subscript operator, namely @?[?]@, is overloaded so that when a \CFA enumerator is used as an array index, it implicitly converts to its position over value to sustain data harmonization.
485This behaviour can be reverted by explicit overloading:
486\begin{cfa}
487float ?[?]( float * arr, E2 index ) { return arr[ value( index ) ]; }
488\end{cfa}
489While enumerator labels @A@, @B@ and @C@ are being defined twice in different enumerations, they are unambiguous within the context.
490Designators in @H1@ are unambiguous because @E2@ has a @value@ cost to @int@, which is more expensive than @safe@ cost from C-Enum @E1@ to @int@.
491Designators in @H2@ are resolved as @E2@ because when a \CFA enumeration type is being used as an array dimension, \CFA adds the enumeration type to the initializer's resolution context.
492
493
494\section{I/O}
495
496As seen in multiple examples, \CFA enumerations can be printed and the default property printed is the enumerator's label, which is similar in other programming languages.
497However, very few programming languages provide a mechanism to read in enumerator values.
498Even the @boolean@ type in many languages does not have a mechanism for input using the enumerators @true@ or @false@.
499\VRef[Figure]{f:EnumerationI/O} shows \CFA enumeration input based on the enumerator labels.
500When the enumerator labels are packed together in the input stream, the input algorithm scans for the longest matching string.
501For basic types in \CFA, the rule is that the same constants used to initialize a variable in a program are available to initialize a variable using input, where string constants can be quoted or unquoted.
502
503\begin{figure}
504\begin{cquote}
505\setlength{\tabcolsep}{15pt}
506\begin{tabular}{@{}ll@{}}
507\begin{cfa}
508int main() {
509        enum(int ) E { BBB = 3, AAA, AA, AB, B };
510        E e;
511
512        try {
513                for () {
514                        try {
515                                @sin | e@;
516                        } catch( missing_data * ) {
517                                sout | "missing data";
518                                continue; // try again
519                        }
520                        sout | e | "= " | value( e );
521                }
522        } catch( end_of_file ) {}
523}
524\end{cfa}
525&
526\begin{cfa}
527$\rm input$
528BBBABAAAAB
529BBB AAA AA AB B
530
531$\rm output$
532BBB = 3
533AB = 6
534AAA = 4
535AB = 6
536BBB = 3
537AAA = 4
538AA = 5
539AB = 6
540B = 7
541
542\end{cfa}
543\end{tabular}
544\end{cquote}
545\caption{Enumeration I/O}
546\label{f:EnumerationI/O}
547\end{figure}
548
549
550\section{Planet Example}
551
552\VRef[Figure]{f:PlanetExample} shows an archetypal enumeration example illustrating most of the \CFA enumeration features.
553@Planet@ is an enumeration of type @MR@.
554Each planet enumerator is initialized to a specific mass/radius, @MR@, value.
555The unnamed enumeration provides the gravitational-constant enumerator @G@.
556Function @surfaceGravity@ uses the @with@ clause to remove @p@ qualification from fields @mass@ and @radius@.
557The program main uses the pseudo function @countof@ to obtain the number of enumerators in @Planet@, and safely converts the random value into a @Planet@ enumerator using @fromInt@.
558The resulting random orbital-body is used in a @choose@ statement.
559The enumerators in the @case@ clause use the enumerator position for testing.
560The prints use @label@ to print an enumerator's name.
561Finally, a loop enumerates through the planets computing the weight on each planet for a given Earth mass.
562The print statement does an equality comparison with an enumeration variable and enumerator (@p == MOON@).
563
564\begin{figure}
565\small
566\begin{cfa}
567struct MR { double mass, radius; };                     $\C[3.5in]{// planet definition}$
568enum( @MR@ ) Planet {                                           $\C{// typed enumeration}$
569        //                      mass (kg)   radius (km)
570        MERCURY = { 0.330_E24, 2.4397_E6 },
571        VENUS      = { 4.869_E24, 6.0518_E6 },
572        EARTH       = { 5.976_E24, 6.3781_E6 },
573        MOON        = { 7.346_E22, 1.7380_E6 }, $\C{// not a planet}$
574        MARS         = { 0.642_E24, 3.3972_E6 },
575        JUPITER    = { 1898._E24, 71.492_E6 },
576        SATURN     = { 568.8_E24, 60.268_E6 },
577        URANUS    = { 86.86_E24, 25.559_E6 },
578        NEPTUNE  = { 102.4_E24, 24.746_E6 },
579        PLUTO       = { 1.303_E22, 1.1880_E6 }, $\C{// not a planet}$
580};
581enum( double ) { G = 6.6743_E-11 };                     $\C{// universal gravitational constant (m3 kg-1 s-2)}$
582static double surfaceGravity( Planet p ) @with( p )@ {
583        return G * mass / ( radius @\@ 2 );             $\C{// no qualification, exponentiation}$
584}
585static double surfaceWeight( Planet p, double otherMass ) {
586        return otherMass * surfaceGravity( p );
587}
588int main( int argc, char * argv[] ) {
589        if ( argc != 2 ) @exit@ | "Usage: " | argv[0] | "earth-weight";  // terminate program
590        double earthWeight = convert( argv[1] );
591        double earthMass = earthWeight / surfaceGravity( EARTH );
592        Planet rp = @fromInt@( prng( @countof@( Planet ) ) ); $\C{// select random orbiting body}$
593        @choose( rp )@ {                                                $\C{// implicit breaks}$
594          case MERCURY, VENUS, EARTH, MARS:
595                sout | @rp@ | "is a rocky planet";
596          case JUPITER, SATURN, URANUS, NEPTUNE:
597                sout | rp | "is a gas-giant planet";
598          default:
599                sout | rp | "is not a planet";
600        }
601        for ( @p; Planet@ ) {                                   $\C{// enumerate}\CRT$
602                sout | "Your weight on" | ( @p == MOON@ ? "the" : " " ) | p
603                           | "is" | wd( 1,1,  surfaceWeight( p, earthMass ) ) | "kg";
604        }
605}
606$\$$ planet 100
607JUPITER is a gas-giant planet
608Your weight on MERCURY is 37.7 kg
609Your weight on VENUS is 90.5 kg
610Your weight on EARTH is 100.0 kg
611Your weight on the MOON is 16.6 kg
612Your weight on MARS is 37.9 kg
613Your weight on JUPITER is 252.8 kg
614Your weight on SATURN is 106.6 kg
615Your weight on URANUS is 90.5 kg
616Your weight on NEPTUNE is 113.8 kg
617Your weight on PLUTO is 6.3 kg
618\end{cfa}
619\caption{Planet Example}
620\label{f:PlanetExample}
621\end{figure}
Note: See TracBrowser for help on using the repository browser.