Context Navigation

← Previous Change
Next Change →

array.hfa

Timestamp:

Jul 29, 2024, 1:32:51 PM (4 months ago)

Author:

JiadaL <j82liang@…>

Branches:

master

Children:

f3d2a4f

Parents:

38e20a80 (diff), 1661ad7 (diff)
Note: this is a merge changeset, the changes displayed below correspond to the merge itself.
Use the (diff) links above to see all the changes relative to each parent.

Message:

Merge branch 'master' of plg.uwaterloo.ca:software/cfa/cfa-cc

File:

: 1 edited

libcfa/src/collections/array.hfa (modified) (9 diffs)

Legend:

: Unmodified
: Added
: Removed

libcfa/src/collections/array.hfa

-                      r38e20a80
+                      rce02877
 #pragma once
 #include <assert.h>
+//#include <assert.h>
 …
 #define ztag(n) ttag(n)
+#ifdef __CFA_DEBUG__
+// Debug builds: abort with a diagnostic when subscript `sub` lies outside [lb, ub).
+// The expansion is wrapped in do { } while (0) so that it is a single statement, like the
+// non-debug form, and cannot capture an `else` that follows the call site.
+// `sub` is evaluated more than once and is printed with %ld; `ub` is printed with %zu.
+#define subcheck( arr, sub, lb, ub ) \
+        do { \
+                if ( (sub) < (lb) || (sub) >= (ub) ) \
+                        abort( "subscript %ld exceeds dimension range [%d,%zu) for array %p.\n", \
+                                   (sub), (lb), (ub), (arr) ); \
+        } while (0)
+#else
+// Non-debug builds: the check expands to an empty statement.
+#define subcheck( arr, sub, lb, ub ) do {} while (0)
+#endif
 //
 …
 //
 forall( [N], S & | sized(S), Timmed &, Tbase & ) {
+    //
+    // Single-dim array struct (with explicit packing and atom)
+    //
+    struct arpk {
+        S strides[N];
+    };
+    // About the choice of integral types offered as subscript overloads:
+    // Intent is to cover these use cases:
+    //    a[0]                                                // i : zero_t
+    //    a[1]                                                // i : one_t
+    //    a[2]                                                // i : int
+    //    float foo( ptrdiff_t i ) { return a[i]; }           // i : ptrdiff_t
+    //    float foo( size_t i ) { return a[i]; }              // i : size_t
+    //    forall( [N] ) ... for( i; N ) { total += a[i]; }    // i : typeof( sizeof(42) )
+    //    for( i; 5 ) { total += a[i]; }                      // i : int
+    //
+    // It gets complicated by:
+    // -  CFA does overloading on concrete types, like int and unsigned int, not on typedefed
+    //    types like size_t.  So trying to overload on ptrdiff_t vs int works in 64-bit mode
+    //    but not in 32-bit mode.
+    // -  Given bug of Trac #247, CFA gives sizeof expressions type unsigned long int, when it
+    //    should give them type size_t.
+    //
+    //                          gcc -m32         cfa -m32 given bug         gcc -m64 (and cfa)
+    // ptrdiff_t                int              int                        long int
+    // size_t                   unsigned int     unsigned int               unsigned long int
+    // typeof( sizeof(42) )     unsigned int     unsigned long int          unsigned long int
+    // int                      int              int                        int
+    //
+    // So the solution must support types {zero_t, one_t, int, unsigned int, long int, unsigned long int}
+    //
+    // The solution cannot rely on implicit conversions (e.g. just have one overload for ptrdiff_t)
+    // because assertion satisfaction requires types to match exactly.  Both higher-dimensional
+    // subscripting and operations on slices use asserted subscript operators.  The test case
+    // array-container/array-sbscr-cases covers the combinations.  Mike believes that commenting out
+    // any of the current overloads leads to one of those cases failing, either on 64- or 32-bit.
+    // Mike is open to being shown a smaller set of overloads that still passes the test.
+    static inline Timmed & ?[?]( arpk(N, S, Timmed, Tbase) & a, zero_t ) {
+        assert( 0 < N );
+        return (Timmed &) a.strides[0];
+    }
+    static inline Timmed & ?[?]( arpk(N, S, Timmed, Tbase) & a, one_t ) {
+        assert( 1 < N );
+        return (Timmed &) a.strides[1];
+    }
+    static inline Timmed & ?[?]( arpk(N, S, Timmed, Tbase) & a, int i ) {
+        assert( i < N );
+        return (Timmed &) a.strides[i];
+    }
+    static inline const Timmed & ?[?]( const arpk(N, S, Timmed, Tbase) & a, int i ) {
+        assert( i < N );
+        return (Timmed &) a.strides[i];
+    }
+    static inline Timmed & ?[?]( arpk(N, S, Timmed, Tbase) & a, unsigned int i ) {
+        assert( i < N );
+        return (Timmed &) a.strides[i];
+    }
+    static inline const Timmed & ?[?]( const arpk(N, S, Timmed, Tbase) & a, unsigned int i ) {
+        assert( i < N );
+        return (Timmed &) a.strides[i];
+    }
+    static inline Timmed & ?[?]( arpk(N, S, Timmed, Tbase) & a, long int i ) {
+        assert( i < N );
+        return (Timmed &) a.strides[i];
+    }
+    static inline const Timmed & ?[?]( const arpk(N, S, Timmed, Tbase) & a, long int i ) {
+        assert( i < N );
+        return (Timmed &) a.strides[i];
+    }
+    static inline Timmed & ?[?]( arpk(N, S, Timmed, Tbase) & a, unsigned long int i ) {
+        assert( i < N );
+        return (Timmed &) a.strides[i];
+    }
+    static inline const Timmed & ?[?]( const arpk(N, S, Timmed, Tbase) & a, unsigned long int i ) {
+        assert( i < N );
+        return (Timmed &) a.strides[i];
+    }
+    static inline size_t ?`len( arpk(N, S, Timmed, Tbase) & a ) {
+        return N;
+    }
+    static inline void __taglen( tag(arpk(N, S, Timmed, Tbase)), tag(N) ) {}
+        //
+        // Single-dim array struct (with explicit packing and atom)
+        //
+        struct arpk {
+                S strides[N];
+        };
+        // About the choice of integral types offered as subscript overloads:
+        // Intent is to cover these use cases:
+        //    a[0]                                                // i : zero_t
+        //    a[1]                                                // i : one_t
+        //    a[2]                                                // i : int
+        //    float foo( ptrdiff_t i ) { return a[i]; }           // i : ptrdiff_t
+        //    float foo( size_t i ) { return a[i]; }              // i : size_t
+        //    forall( [N] ) ... for( i; N ) { total += a[i]; }    // i : typeof( sizeof(42) )
+        //    for( i; 5 ) { total += a[i]; }                      // i : int
+        //
+        // It gets complicated by:
+        // -  CFA does overloading on concrete types, like int and unsigned int, not on typedefed
+        //    types like size_t.  So trying to overload on ptrdiff_t vs int works in 64-bit mode
+        //    but not in 32-bit mode.
+        // -  Given bug of Trac #247, CFA gives sizeof expressions type unsigned long int, when it
+        //    should give them type size_t.
+        //
+        //                          gcc -m32         cfa -m32 given bug         gcc -m64 (and cfa)
+        // ptrdiff_t                int              int                        long int
+        // size_t                   unsigned int     unsigned int               unsigned long int
+        // typeof( sizeof(42) )     unsigned int     unsigned long int          unsigned long int
+        // int                      int              int                        int
+        //
+        // So the solution must support types {zero_t, one_t, int, unsigned int, long int, unsigned long int}
+        //
+        // The solution cannot rely on implicit conversions (e.g. just have one overload for ptrdiff_t)
+        // because assertion satisfaction requires types to match exactly.  Both higher-dimensional
+        // subscripting and operations on slices use asserted subscript operators.  The test case
+        // array-container/array-sbscr-cases covers the combinations.  Mike believes that commenting out
+        // any of the current overloads leads to one of those cases failing, either on 64- or 32-bit.
+        // Mike is open to being shown a smaller set of overloads that still passes the test.
+        static inline Timmed & ?[?]( arpk( N, S, Timmed, Tbase ) & a, zero_t ) {
+                //assert( 0 < N );
+                subcheck( a, 0L, 0, N );
+                return (Timmed &)a.strides[0];
+        }
+        static inline Timmed & ?[?]( arpk( N, S, Timmed, Tbase ) & a, one_t ) {
+                //assert( 1 < N );
+                subcheck( a, 1L, 0, N );
+                return (Timmed &)a.strides[1];
+        }
+        static inline Timmed & ?[?]( arpk( N, S, Timmed, Tbase ) & a, int i ) {
+                //assert( i < N );
+                subcheck( a, (long int)i, 0, N );
+                return (Timmed &)a.strides[i];
+        }
+        static inline const Timmed & ?[?]( const arpk( N, S, Timmed, Tbase ) & a, int i ) {
+                //assert( i < N );
+                subcheck( a, (long int)i, 0, N );
+                return (Timmed &)a.strides[i];
+        }
+        static inline Timmed & ?[?]( arpk( N, S, Timmed, Tbase ) & a, unsigned int i ) {
+                //assert( i < N );
+                subcheck( a, (long int)i, 0, N );
+                return (Timmed &)a.strides[i];
+        }
+        // Read-only subscript taking an unsigned int index.  When __CFA_DEBUG__ is defined,
+        // subcheck aborts if the index is outside [0, N); the i-th stride is then returned
+        // viewed as a Timmed.
+        static inline const Timmed & ?[?]( const arpk( N, S, Timmed, Tbase ) & a, unsigned int i ) {
+                //assert( i < N );
+                // Widen to long int, as the non-const unsigned int overload does, so the
+                // argument agrees with the %ld conversion in subcheck's abort message.
+                subcheck( a, (long int)i, 0, N );
+                return (Timmed &)a.strides[i];
+        }
+        static inline Timmed & ?[?]( arpk( N, S, Timmed, Tbase ) & a, long int i ) {
+                //assert( i < N );
+                subcheck( a, i, 0, N );
+                return (Timmed &)a.strides[i];
+        }
+        static inline const Timmed & ?[?]( const arpk( N, S, Timmed, Tbase ) & a, long int i ) {
+                //assert( i < N );
+                subcheck( a, i, 0, N );
+                return (Timmed &)a.strides[i];
+        }
+        static inline Timmed & ?[?]( arpk( N, S, Timmed, Tbase ) & a, unsigned long int i ) {
+                //assert( i < N );
+                subcheck( a, i, 0, N );
+                return (Timmed &)a.strides[i];
+        }
+        static inline const Timmed & ?[?]( const arpk( N, S, Timmed, Tbase ) & a, unsigned long int i ) {
+                //assert( i < N );
+                subcheck( a, i, 0, N );
+                return (Timmed &)a.strides[i];
+        }
+        static inline size_t ?`len( arpk( N, S, Timmed, Tbase ) & a ) {
+                return N;
+        }
+        static inline void __taglen( tag(arpk( N, S, Timmed, Tbase )), tag(N) ) {}
+}
 // RAII pattern has workarounds for
 //  - Trac 226:  Simplest handling would be, require immediate element to be otype, let autogen
 //    raii happen.  Performance on even a couple dimensions is unacceptable because of exponential
 //    thunk creation: ?{}() needs all four otype funcs from next level, so does ^?{}(), so do the
 //    other two.  This solution offers ?{}() that needs only ?{}(), and similar for ^?{}.
+//      raii happen.  Performance on even a couple dimensions is unacceptable because of exponential
+//      thunk creation: ?{}() needs all four otype funcs from next level, so does ^?{}(), so do the
+//      other two.  This solution offers ?{}() that needs only ?{}(), and similar for ^?{}.
 forall( [N], S & | sized(S), Timmed &, Tbase & | { void ?{}( Timmed & ); } )
 static inline void ?{}( arpk(N, S, Timmed, Tbase) & this ) {
     void ?{}( S (&)[N] ) {}
     ?{}(this.strides);
     for (i; N) ?{}( (Timmed &) this.strides[i] );
+static inline void ?{}( arpk( N, S, Timmed, Tbase ) & this ) {
+        void ?{}( S (&)[N] ) {}
+        ?{}(this.strides);
+        for (i; N) ?{}( (Timmed &)this.strides[i] );
+}
 forall( [N], S & | sized(S), Timmed &, Tbase & | { void ^?{}( Timmed & ); } )
 static inline void ^?{}( arpk(N, S, Timmed, Tbase) & this ) {
     void ^?{}( S (&)[N] ) {}
     ^?{}(this.strides);
     for (i; N ) {
         ^?{}( (Timmed &) this.strides[N-i-1] );
+    }
+static inline void ^?{}( arpk( N, S, Timmed, Tbase ) & this ) {
+        void ^?{}( S (&)[N] ) {}
+        ^?{}(this.strides);
+        for (i; N ) {
+                ^?{}( (Timmed &)this.strides[N-i-1] );
+        }
+}
 …
 forall( [N], ZTags ... , Trslt &, Tatom & | { Trslt mkar_( tag(Tatom), ZTags ); } )
 static inline arpk(N, Trslt, Trslt, Tatom) mkar_( tag(Tatom), tag(N), ZTags ) {}
+static inline arpk( N, Trslt, Trslt, Tatom) mkar_( tag(Tatom), tag(N), ZTags ) {}
 // based on https://stackoverflow.com/questions/1872220/is-it-possible-to-iterate-over-arguments-in-variadic-macros
     // Make a FOREACH macro
     #define FE_0(WHAT)
     #define FE_1(WHAT, X) WHAT(X)
     #define FE_2(WHAT, X, ...) WHAT(X)FE_1(WHAT, __VA_ARGS__)
     #define FE_3(WHAT, X, ...) WHAT(X)FE_2(WHAT, __VA_ARGS__)
     #define FE_4(WHAT, X, ...) WHAT(X)FE_3(WHAT, __VA_ARGS__)
     #define FE_5(WHAT, X, ...) WHAT(X)FE_4(WHAT, __VA_ARGS__)
     //... repeat as needed
     #define GET_MACRO(_0,_1,_2,_3,_4,_5,NAME,...) NAME
     #define FOR_EACH(action,...) \
     GET_MACRO(_0,__VA_ARGS__,FE_5,FE_4,FE_3,FE_2,FE_1,FE_0)(action,__VA_ARGS__)
+        // Make a FOREACH macro
+        #define FE_0(WHAT)
+        #define FE_1(WHAT, X) WHAT(X)
+        #define FE_2(WHAT, X, ...) WHAT(X)FE_1(WHAT, __VA_ARGS__)
+        #define FE_3(WHAT, X, ...) WHAT(X)FE_2(WHAT, __VA_ARGS__)
+        #define FE_4(WHAT, X, ...) WHAT(X)FE_3(WHAT, __VA_ARGS__)
+        #define FE_5(WHAT, X, ...) WHAT(X)FE_4(WHAT, __VA_ARGS__)
+        //... repeat as needed
+        #define GET_MACRO(_0,_1,_2,_3,_4,_5,NAME,...) NAME
+        #define FOR_EACH(action,...) \
+        GET_MACRO(_0,__VA_ARGS__,FE_5,FE_4,FE_3,FE_2,FE_1,FE_0)(action,__VA_ARGS__)
 #define COMMA_ttag(X) , ttag(X)
 …
 forall( TA &, TB &, TC &, IxAB, IxBC ... | { TB & ?[?]( TA &, IxAB ); TC & ?[?]( TB &, IxBC ); } )
 static inline TC & ?[?]( TA & this, IxAB ab, IxBC bc ) {
     return this[ab][bc];
+        return this[ab][bc];
+}
 …
 forall( TA &, TB &, TC &, IxAB_0, IxBC | { TB & ?[?]( TA &, IxAB_0 ); TC & ?[?]( TB &, IxBC ); } )
 static inline TC & ?[?]( TA & this, IxAB_0 ab, IxBC bc ) {
     return this[ab][bc];
+        return this[ab][bc];
+}
 forall( TA &, TB &, TC &, IxAB_0, IxAB_1, IxBC | { TB & ?[?]( TA &, IxAB_0, IxAB_1 ); TC & ?[?]( TB &, IxBC ); } )
 static inline TC & ?[?]( TA & this, IxAB_0 ab0, IxAB_1 ab1, IxBC bc ) {
     return this[[ab0,ab1]][bc];
+        return this[[ab0,ab1]][bc];
+}
 forall( TA &, TB &, TC &, IxAB_0, IxAB_1, IxAB_2, IxBC | { TB & ?[?]( TA &, IxAB_0, IxAB_1, IxAB_2 ); TC & ?[?]( TB &, IxBC ); } )
 static inline TC & ?[?]( TA & this, IxAB_0 ab0, IxAB_1 ab1, IxAB_2 ab2, IxBC bc ) {
     return this[[ab0,ab1,ab2]][bc];
+        return this[[ab0,ab1,ab2]][bc];
+}
 …
 // Base
 forall( [Nq], Sq & | sized(Sq), Tbase & )
 static inline tag(arpk(Nq, Sq, Tbase, Tbase)) enq_( tag(Tbase), tag(Nq), tag(Sq), tag(Tbase) ) {
     tag(arpk(Nq, Sq, Tbase, Tbase)) ret;
     return ret;
+static inline tag(arpk( Nq, Sq, Tbase, Tbase )) enq_( tag(Tbase ), tag(Nq), tag(Sq), tag(Tbase ) ) {
+        tag(arpk( Nq, Sq, Tbase, Tbase )) ret;
+        return ret;
+}
 // Rec
 forall( [Nq], Sq & | sized(Sq), [N], S & | sized(S), recq &, recr &, Tbase & | { tag(recr) enq_( tag(Tbase), tag(Nq), tag(Sq), tag(recq) ); } )
 static inline tag(arpk(N, S, recr, Tbase)) enq_( tag(Tbase), tag(Nq), tag(Sq), tag(arpk(N, S, recq, Tbase)) ) {
     tag(arpk(N, S, recr, Tbase)) ret;
     return ret;
+static inline tag(arpk( N, S, recr, Tbase )) enq_( tag(Tbase ), tag(Nq), tag(Sq), tag(arpk( N, S, recq, Tbase )) ) {
+        tag(arpk( N, S, recr, Tbase )) ret;
+        return ret;
+}
 …
 extern struct all_t {} all;
 forall( [N], S & | sized(S), Te &, result &, Tbase & | { tag(result) enq_( tag(Tbase), tag(N), tag(S), tag(Te) ); } )
 static inline result & ?[?]( arpk(N, S, Te, Tbase) & this, all_t ) {
     return (result&) this;
+static inline result & ?[?]( arpk( N, S, Te, Tbase ) & this, all_t ) {
+        return (result&) this;
+}
 …
 // forall(A &, Tv &, [N])
 // trait ar {
 //     Tv& ?[?]( A&, zero_t );
 //     Tv& ?[?]( A&, one_t  );
 //     Tv& ?[?]( A&, int    );
 //                   ...
 //     size_t ?`len( A& );
 //     void __taglen( tag(C), tag(N) );
+//       Tv& ?[?]( A&, zero_t );
+//       Tv& ?[?]( A&, one_t  );
+//       Tv& ?[?]( A&, int      );
+//                                 ...
+//       size_t ?`len( A& );
+//       void __taglen( tag(C), tag(N) );
 // };
 // working around N's not being accepted as arguments to traits
 #define ar(A, Tv, N) {                 \
     Tv& ?[?]( A&, zero_t );            \
     Tv& ?[?]( A&, one_t );             \
     Tv& ?[?]( A&, int );               \
     Tv& ?[?]( A&, unsigned int );      \
     Tv& ?[?]( A&, long int );          \
     Tv& ?[?]( A&, unsigned long int ); \
     size_t ?`len( A& );                \
     void __taglen( tag(A), tag(N) );   \
+}
+#define ar( A, Tv, N ) {                                \
+        Tv& ?[?]( A&, zero_t );                         \
+        Tv& ?[?]( A&, one_t );                          \
+        Tv& ?[?]( A&, int );                            \
+        Tv& ?[?]( A&, unsigned int );           \
+        Tv& ?[?]( A&, long int );                       \
+        Tv& ?[?]( A&, unsigned long int );      \
+        size_t ?`len( A& );                                     \
+        void __taglen( tag(A), tag(N) );        \
+}

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changeset ce02877 for libcfa/src/collections/array.hfa

Legend:

libcfa/src/collections/array.hfa

Download in other formats: