Context Navigation

← Previous Changeset
Next Changeset →

Changeset 1eea589f

Timestamp:

Jul 27, 2025, 2:48:31 PM (3 months ago)

Author:

Peter A. Buhr <pabuhr@…>

Branches:

Children:

Parents:

da10157 (diff), 7806f91 (diff)
Note: this is a merge changeset, the changes displayed below correspond to the merge itself.
Use the (diff) links above to see all the changes relative to each parent.

Message:

Merge branch 'master' of plg.uwaterloo.ca:software/cfa/cfa-cc

Files:

: 69 added
: 2 deleted
: 13 edited

Legend:

: Unmodified
: Added
: Removed

doc/theses/mike_brooks_MMath/benchmarks/list/Makefile

-              rda10157
+              r1eea589f
 # make results-latest.csv OP_MOVEMENTS=stack OP_POLARITIES=insfirst OP_ACCESSORS=allhead RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=thorough
 # cp results-latest.csv results-sizing.csv
+# make results-latest.csv OP_MOVEMENTS=queue OP_POLARITIES=inslast OP_ACCESSORS=remelem RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=thorough
+# cp results-latest.csv results-sizing-b.csv
+# make results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=moderate FX_SOLUTIONS='lq-tailq lq-list cfa-cfa upp-upp'
+# cp results-latest.csv results-intrsv-cube.csv
 CFA = cfa
+CC = gcc-11
 CXX = g++-11
 UXX =  ~/u++/u++-7.0.0/bin/u++
 …
 RUN_NUM_REPS=3
 RUN_DATA_SIZE_MODE=none
 RUN_DURATION_SEC=5
+RUN_DURATION_SEC?=5
 RUN_TASKSET_CPULIST=6
 …
 PERFFLAGS_CC  = -DNDEBUG -O3
 else ifeq "$(MODE)" "correctness"
 PERFFLAGS_CFA = -O0 -g -debug
+PERFFLAGS_CFA = -O0 -g -nodebug -D__CFA_DEBUG__ # shortcut for not also building debug cfa
 PERFFLAGS_CC  = -O0 -g
 else
 …
 OP_POLARITIES=insfirst inslast
 OP_ACCESSORS=allhead inselem remelem
+FX_SOLUTIONS=lq-tailq lq-list cfa-cfa upp-upp cpp-stlref
+RUN_INTERLEAVE_PCTS=0
+FX_SOLUTIONS=lq-tailq lq-list cfa-cfa cfa-mandHead cfa-noListed cfa-noIter cfa-likeLq cfa-strip upp-upp cpp-stlref
 OPS=$(call cross3,-,$(OP_MOVEMENTS),$(OP_POLARITIES),$(OP_ACCESSORS))
 …
         $(COMPILER) $(EXTRA_COMP_FLAGS) -c $< $(OP_DEFINES) -include op-$(OP).h -include fx-$(FX).h -o $@ -MMD
+sayhi:
+        echo $(PERFPROGS)
+ifeq "$(RUN_DATA_SIZE_MODE)" "common5"
+RUN_DATA_SIZES=\
+# troubleshooting, e.g. `make echo_DEMOS` runs `echo $(DEMOS)`
+echo_% :
+        @echo '$($(@:echo_%=%))'
+# ifeq "$(RUN_DATA_SIZE_MODE)" "common5"
+# RUN_DATA_SIZES=\
+#   7-1000000 \
+#   71-100000 \
+#   809-10000 \
+#   9051-1000 \
+#   72421-100
+# else ifeq "$(RUN_DATA_SIZE_MODE)" "thorough"
+# RUN_DATA_SIZES=\
+#   1-1000000 \
+#   2-1000000 \
+#   3-1000000 \
+#   5-1000000 \
+#   7-1000000 \
+#   11-100000 \
+#   13-100000 \
+#   19-100000 \
+#   29-100000 \
+#   37-100000 \
+#   53-100000 \
+#   71-100000 \
+#   101-10000 \
+#   149-10000 \
+#   211-10000 \
+#   283-10000 \
+#   401-10000 \
+#   569-10000 \
+#   809-10000 \
+#   1151-1000 \
+#   1601-1000 \
+#   2267-1000 \
+#   3203-1000 \
+#   4547-1000 \
+#   6473-1000 \
+#   9051-1000 \
+#   12809-100 \
+#   18119-100 \
+#   25601-100 \
+#   36209-100 \
+#   51203-100 \
+#   72421-100 \
+#   102407-10 \
+#   144817-10 \
+#   204803-10 \
+#   289637-10 \
+#   409609-10 \
+#   579263-10 \
+#   819229-10 \
+#   1158613-1 \
+#   1638431-1 \
+#   2317057-1 \
+#   3276803-1 \
+#   4634111-1 \
+#   6553621-1 \
+#   9268211-1
+# else ifeq "$(RUN_DATA_SIZE_MODE)" "bignquick"
+# RUN_DATA_SIZES=\
+#   3-1000000 \
+#   29-100000 \
+#   283-10000 \
+#   3203-1000 \
+#   25601-100 \
+#   289637-10 \
+#   1000000-1 \
+#   3276803-1 \
+#   10000000-1
+# else ifeq "$(RUN_DATA_SIZE_MODE)" "bignthorough"
+# RUN_DATA_SIZES=\
+#   1-1000000 \
+#   3-1000000 \
+#   7-1000000 \
+#   13-100000 \
+#   29-100000 \
+#   53-100000 \
+#   101-10000 \
+#   211-10000 \
+#   401-10000 \
+#   809-10000 \
+#   1601-1000 \
+#   3203-1000 \
+#   6473-1000 \
+#   12809-100 \
+#   25601-100 \
+#   51203-100 \
+#   102407-10 \
+#   204803-10 \
+#   409609-10 \
+#   819229-10 \
+#   1638431-1 \
+#   3276803-1 \
+#   6553621-1 \
+#   12809000-1 \
+#   25601000-1 \
+#   51203000-1 \
+#   102407000-1 \
+#   204803000-1 \
+#   409609000-1
+# else ifeq "$(RUN_DATA_SIZE_MODE)" "moderate"
+# RUN_DATA_SIZES=\
+#   1-1000000 \
+#   3-1000000 \
+#   7-1000000 \
+#   13-100000 \
+#   29-100000 \
+#   53-100000 \
+#   101-10000 \
+#   211-10000 \
+#   401-10000 \
+#   1601-1000 \
+#   6473-1000 \
+#   25601-100
+# else ifeq "$(RUN_DATA_SIZE_MODE)" "sweetspot"
+# RUN_DATA_SIZES=\
+#   1-1000000 \
+#   2-1000000 \
+#   3-1000000 \
+#   5-1000000 \
+#   7-1000000 \
+#   11-100000 \
+#   13-100000 \
+#   19-100000 \
+#   29-100000 \
+#   37-100000 \
+#   53-100000 \
+#   71-100000 \
+#   101-10000 \
+#   149-10000
+# else ifeq "$(RUN_DATA_SIZE_MODE)" "manual"
+# ifeq "$(RUN_DATA_SIZES)" ""
+# $(error RUN_DATA_SIZE_MODE is manual but RUN_DATA_SIZES not given)
+# endif
+# else ifeq "$(RUN_DATA_SIZE_MODE)" "none"
+# # Assume user manages RUN_ARGS; empty RUN_ARGS just means run with compiled-in defaults
+# RUN_DATA_SIZES=none
+# else
+# $(error Bad RUN_DATA_SIZE_MODE ($(RUN_DATA_SIZE_MODE)); should be common5, thorough or manual)
+# endif
+ifeq "$(RUN_DATA_SIZE_MODE)" "manual"
+        ifeq "$(RUN_DATA_SIZES)" ""
+        $(error RUN_DATA_SIZE_MODE is manual but RUN_DATA_SIZES not given)
+        endif
+endif
+RUN_DATA_SIZES = \
+$(if $(filter $(RUN_DATA_SIZE_MODE),common5), \
 -1000000 \
 -100000 \
 -10000 \
 -1000 \
+-100
+else ifeq "$(RUN_DATA_SIZE_MODE)" "thorough"
+RUN_DATA_SIZES=\
+-100 \
+, $(if $(filter $(RUN_DATA_SIZE_MODE),thorough), \
+-1000000 \
+-1000000 \
+-1000000 \
+-1000000 \
 -1000000 \
 -100000 \
 …
   4634111-1 \
   6553621-1 \
+  9268211-1
+else ifeq "$(RUN_DATA_SIZE_MODE)" "manual"
+ifeq "$(RUN_DATA_SIZES)" ""
+$(error RUN_DATA_SIZE_MODE is manual but RUN_DATA_SIZES not given)
+endif
+else ifeq "$(RUN_DATA_SIZE_MODE)" "none"
+# Assume user manages RUN_ARGS; empty RUN_ARGS just means run with compiled-in defaults
+RUN_DATA_SIZES=none
+else
+$(error Bad RUN_DATA_SIZE_MODE ($(RUN_DATA_SIZE_MODE)); should be common5, thorough or manual)
+endif
+  9268211-1 \
+, $(if $(filter $(RUN_DATA_SIZE_MODE),bignquick), \
+-1000000 \
+-100000 \
+-10000 \
+-1000 \
+-100 \
+-10 \
+  1000000-1 \
+  3276803-1 \
+  10000000-1 \
+, $(if $(filter $(RUN_DATA_SIZE_MODE),bignthorough), \
+-1000000 \
+-1000000 \
+-1000000 \
+-100000 \
+-100000 \
+-100000 \
+-10000 \
+-10000 \
+-10000 \
+-10000 \
+-1000 \
+-1000 \
+-1000 \
+-100 \
+-100 \
+-100 \
+-10 \
+-10 \
+-10 \
+-10 \
+  1638431-1 \
+  3276803-1 \
+  6553621-1 \
+  12809000-1 \
+  25601000-1 \
+  51203000-1 \
+  102407000-1 \
+  204803000-1 \
+  409609000-1 \
+, $(if $(filter $(RUN_DATA_SIZE_MODE),moderate), \
+-1000000 \
+-1000000 \
+-1000000 \
+-100000 \
+-100000 \
+-100000 \
+-10000 \
+-10000 \
+-10000 \
+-1000 \
+-1000 \
+-100 \
+, $(if $(filter $(RUN_DATA_SIZE_MODE),sweetspot), \
+-1000000 \
+-1000000 \
+-1000000 \
+-1000000 \
+-1000000 \
+-100000 \
+-100000 \
+-100000 \
+-100000 \
+-100000 \
+-100000 \
+-100000 \
+-10000 \
+-10000 \
+, $(if $(filter $(RUN_DATA_SIZE_MODE),none), \
+, $(error Bad RUN_DATA_SIZE_MODE ($(RUN_DATA_SIZE_MODE)); see list of accepted values in Makefile's RUN_DATA_SIZES defimition) \
+)))))))
 RUN_REP_IDS=$(shell echo {1..$(RUN_NUM_REPS)})              # 1 2 3
+RUN_REP_EXTS=$(call cross3,,run,$(RUN_REP_IDS),.1csv)       # run1.1csv run2.1cav run3.1csv
+RUN_LAUNCHES=$(call cross,--,$(RUN_DATA_SIZES),$(RUN_REP_EXTS))
+RUN_REP_EXTS=$(call cross3,,run,$(RUN_REP_IDS),.1csv)       # run1.1csv run2.1csv run3.1csv
+RUN_LAUNCHES=$(call cross3,--,$(RUN_DATA_SIZES),$(RUN_INTERLEAVE_PCTS),$(RUN_REP_EXTS))
 …
 %.1csv : NUMNODES=$(call proj,-,$(SIZING),1)
 %.1csv : CHECKDONE=$(call proj,-,$(SIZING),2)
+%.1csv : REP_ID=$(subst run,,$(call proj,--,$(LAUNCH),2))
+%.1csv : RUN_ARGS=$(if $(filter none,$(SIZING)),,$(RUN_DURATION_SEC) $(CHECKDONE) $(NUMNODES) -1 $(REP_ID))  # use REP_ID as seed
+%.1csv : RUN_INTERLEAVE_PCT=$(call proj,--,$(LAUNCH),2)
+%.1csv : RUN_INTERLEAVE_FRAC=$(shell echo "scale=2; $(RUN_INTERLEAVE_PCT) / 100" | bc)
+%.1csv : REP_ID=$(subst run,,$(call proj,--,$(LAUNCH),3))
+%.1csv : SEED=$(REP_ID)
+%.1csv : RUN_ARGS=$(if $(filter none,$(SIZING)),,$(RUN_DURATION_SEC) $(CHECKDONE) $(NUMNODES) -1 $(SEED) $(RUN_INTERLEAVE_FRAC))  # use REP_ID as seed
 %.1csv : REP_TIME=$(shell date '+%F %H:%M:%S')
 %.1csv : perfprogs FORCE
         taskset --cpu-list $(RUN_TASKSET_CPULIST) ./perfexp--$(CORE) $(RUN_ARGS) | xargs -n 1 printf '%s,%s,%s,%s\n' "$(REP_TIME)" "$(REP_ID)" "$(RUN_ARGS)" | tee $@
+        taskset --cpu-list $(RUN_TASKSET_CPULIST) ./perfexp--$(CORE) $(RUN_ARGS) | xargs -n 1 printf '%s,%s,%s,%s\n' "$(REP_TIME)" "$(REP_ID)" "$(RUN_ARGS)" | tee -a $(RESULT)
 BATCHTIME=$(shell date '+%F--%H-%M-%S')
+results--$(BATCHTIME).csv : $(RESULT1S_SHUFD)
+        cat $^ | tee $@
+        rm $^
+results-latest.csv : results--$(BATCHTIME).csv
+RESULT=results--$(BATCHTIME).csv
+sub_make=$(MAKE) --no-print-directory $(1); cat $(1) >> $(2); rm $(1);
+export RESULT1S_SHUFD    # used by sh loop in $(RESULT) recipe
+export RUN_DURATION_SEC  # used by sub make; occurs free in %.1csv's variable bindings (not extracted from target name)
+NTESTS=$(words $(RESULT1S_SHUFD))
+RUNDUR = $(shell expr $(NTESTS) \* $(RUN_DURATION_SEC))
+ETA = $(shell date -d "+$(RUNDUR) seconds" +"%H:%M:%S")
+$(RESULT) :
+        @echo running $(NTESTS) tests, eta $(ETA)
+        for r in $$RESULT1S_SHUFD; do $(MAKE) --no-print-directory RESULT=$(RESULT) $$r; done
+results-latest.csv : $(RESULT)
         rm -f $@
         ln -s $< $@
 …
 -include *.d
+results-general.csv: FORCE
+        $(MAKE) results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=sweetspot OP_ACCESSORS=remelem RUN_INTERLEAVE_PCTS='0 50' FX_SOLUTIONS='lq-tailq lq-list cfa-cfa cfa-mandHead'
+        cat results-latest.csv >> $@
+        $(MAKE) results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=sweetspot OP_ACCESSORS='allhead inselem' RUN_INTERLEAVE_PCTS='0' FX_SOLUTIONS='lq-tailq lq-list cfa-cfa cfa-mandHead'
+        cat results-latest.csv >> $@
+        $(MAKE) results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=sweetspot OP_ACCESSORS=remelem RUN_INTERLEAVE_PCTS='0 50' FX_SOLUTIONS='cfa-noListed cfa-noIter cfa-likeLq'
+        cat results-latest.csv >> $@
+        $(MAKE) results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=sweetspot OP_ACCESSORS='allhead inselem' RUN_INTERLEAVE_PCTS='0' FX_SOLUTIONS='cfa-noListed cfa-noIter cfa-likeLq'
+        cat results-latest.csv >> $@
+        $(MAKE) results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=sweetspot OP_ACCESSORS=remelem RUN_INTERLEAVE_PCTS='0 50' FX_SOLUTIONS='cfa-strip upp-upp cpp-stlref'
+        cat results-latest.csv >> $@
+        $(MAKE) results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=sweetspot OP_ACCESSORS='allhead inselem' RUN_INTERLEAVE_PCTS='0' FX_SOLUTIONS='cfa-strip upp-upp cpp-stlref'
+        cat results-latest.csv >> $@
+results-zoomout-noshuf.csv: FORCE
+        @echo Do we need to make for tiny user iters?  If so:
+        @echo make clean
+        @echo make perfprogs CFA=$$cfa EXTRA_COMP_FLAGS=-DTINY_USER_ITEMS -j8
+        make results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=bignthorough OPS=stack-insfirst-allhead FX_SOLUTIONS='lq-tailq cfa-cfa upp-upp cpp-stlref cfa-strip' SEED=-1
+        cp results-latest.csv $@
+results-zoomout-shuf.csv: FORCE
+        @echo Do we need to make for tiny user iters?  If so:
+        @echo make clean
+        @echo make perfprogs CFA=$$cfa EXTRA_COMP_FLAGS=-DTINY_USER_ITEMS -j8
+        make results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=bignthorough OPS=stack-insfirst-allhead FX_SOLUTIONS='lq-tailq cfa-cfa upp-upp cpp-stlref cfa-strip'
+        cp results-latest.csv $@
+thesis: results-general.csv results-zoomout-noshuf.csv results-zoomout-shuf.csv
+# matches peter's "random"
+results-smoketest.csv: RUN_DATA_SIZE_MODE=bignquick
+results-smoketest.csv: RUN_NUM_REPS=1
+results-smoketest.csv: RUN_DURATION_SEC=1
+results-smoketest.csv: OP_MOVEMENTS=stack
+results-smoketest.csv: OP_POLARITIES=insfirst
+results-smoketest.csv: OP_ACCESSORS=allhead
+results-smoketest.csv: $(RESULT)
+        mv $< $@

doc/theses/mike_brooks_MMath/benchmarks/list/driver.c

-              rda10157
+              r1eea589f
 #include "observation.h"
+#ifdef TINY_USER_ITEMS
+  #define UDATA_T char
+  #define UDATA_LEN 1
+  #define UDATA_USE_POS 0
+#else
+  #define UDATA_T int
+  #define UDATA_LEN 64
+  #define UDATA_USE_POS 17
+#endif
 typedef struct B_UserItem
     BFX_EXTRUSION_DECL(B_UserItem)
+{
     BFX_INTRUSION(B_UserItem)
     int userdata[64];
+    UDATA_T userdata[ UDATA_LEN ];
+}
 B_UserItem;
 …
 #if defined(NDEBUG) || (defined(__cforall) && !defined(__CFA_DEBUG__))
     enum { DefaultNumNodes = 1000, DefaultExperimentDurSec = 1, DefaultCheckDonePeriod = 1000, DefaultExperimentDurOpCount = -1, DefaultSeed = 5 };
+    const double DefaultInterleaveFrac = 0.0;
     #define TRACE(tp)
 #else
     enum { DefaultNumNodes = 10, DefaultExperimentDurSec = 1, DefaultCheckDonePeriod = 2, DefaultExperimentDurOpCount = 20, DefaultSeed = 5 };
+    const double DefaultInterleaveFrac = 0.5;
     static const char * tp_filter
     // = "";
 …
 static BFX_LIST_HEAD_T(B_UserItem) lst;
 MAYBE_EXTERN_C (
 …
     volatile unsigned int bobs_prog_inserting     = 0;
     volatile unsigned int bobs_prog_removing      = 0;
+    volatile unsigned int bobs_prog_removing_end  = 0;
     volatile unsigned int bobs_prog_rollover_flag = 0;
+    //                    bobs_prog_rem_pos         (defined after BOP_REMPROGEND_IS_REMNO_BASED)
     void bobs_seek(unsigned int i) {
 …
     int bobs_getCurrentVal() {
         B_UserItem * curUI = BFX_DEREF_POS(B_UserItem, lst, observedItem);
         return curUI->userdata[17];
+        return curUI->userdata[ UDATA_USE_POS ];
+    }
 …
+)
+// Remove progress end (number) is based (upon) remove-number
+// True when an OP's REMELEM used remNo to choose which element to remove
+// False otherwise; notably including when REMELEM just bases upon first/last
+// Default to false.
+#ifndef BOP_REMPROGEND_IS_REMNO_BASED
+#define BOP_REMPROGEND_IS_REMNO_BASED false
+#endif
+MAYBE_EXTERN_C (
+    volatile unsigned int const * bobs_prog_rem_pos
+        = BOP_REMPROGEND_IS_REMNO_BASED ? & bobs_prog_removing_end : & bobs_prog_removing;
+)
 unsigned int uDefaultPreemption() {
         return 0;
 …
 int main(int argc, const char *argv[]) {
     const char * usage_args = "[ExperimentDurSec [CheckDonePeriod [NumNodes [ExperimentDurOpCount [Seed]]]]]";
     const int static_arg_posns = 5;
+    const char * usage_args = "[ExperimentDurSec [CheckDonePeriod [NumNodes [ExperimentDurOpCount [Seed [InterleaveFrac]]]]]]";
+    const int static_arg_posns = 6;
     unsigned int ExperimentDurSec     = DefaultExperimentDurSec;
 …
     size_t       ExperimentDurOpCount = DefaultExperimentDurOpCount;
     unsigned int Seed                 = DefaultSeed;
+    double       InterleaveFrac       = DefaultInterleaveFrac;
     switch (((argc - 1) < static_arg_posns) ? (argc - 1) : static_arg_posns) {
+      case 6: InterleaveFrac = atof(argv[6]);
       case 5: Seed = atoi(argv[5]);
       case 4: ExperimentDurOpCount = atol(argv[4]);
 …
+    }
+    // printf("ExperimentDurSec=%d, CheckDonePeriod=%d, NumNodes=%d, ExperimentDurOpCount=%zd, Seed=%d,\n",
+    //     ExperimentDurSec, CheckDonePeriod, NumNodes, ExperimentDurOpCount, Seed );
     if (ExperimentDurSec == 0 || CheckDonePeriod == 0 || NumNodes == 0 || ExperimentDurOpCount == 0 || Seed == 0 ) {
         printf("usage: %s %s\n", argv[0], usage_args);
 …
   #endif
+    // Shuffling makes listed items' physical order in memory different from their order within the list.
+    // Affects insertion: next item to insert picked through insertOrdShuf.
   #ifdef DISABLE_SHUFFLING_INDIRECTION
     #define INSERTPOS(insertNum) insertNum
 …
   #endif
+    // Interleaving affects the list position where an element-oriented operation occurs: at an end vs. in the middle.
+    // Perturbs the sequence of logical insert/remove numbers presented to the OP cartridge, e.g. from [0 1 2 3 4 5 6]
+    // to [3 0 4 1 5 2 6], which is [mid end mid end mid end solo], for a perfect-alternation interleave; except that the
+    // end/mid interleave is actually selected randomly.
+  #ifdef DISABLE_INTERLEAVING
+    #define nextInterleave 0
+    printf("interleave key %x\n", 0);
+  #else
+    const unsigned int INTRL_KEYLEN = 64;
+    unsigned char interleaveKey[INTRL_KEYLEN];
+    unsigned char nextInterleavePos = 0;
+    {
+        unsigned int numOnes = INTRL_KEYLEN * InterleaveFrac;
+        unsigned int numZeros = INTRL_KEYLEN - numOnes;
+        // generate randomly drawn 0/1
+        memset( interleaveKey         , 0, numZeros );  // zeros then ones
+        memset( interleaveKey+numZeros, 1, numOnes );
+        for (unsigned int i = 0; i < 64; i++) { // shuffle it
+            unsigned int nodesRemaining = 64 - i;
+            unsigned int swapWith = i + rand() % nodesRemaining;
+            unsigned char tempValue = interleaveKey[swapWith];
+            interleaveKey[swapWith] = interleaveKey[i];
+            interleaveKey[i] = tempValue;
+        }
+        #define nextInterleave (interleaveKey[nextInterleavePos = (nextInterleavePos + 1) % 64])
+    }
+    {
+        unsigned int z = 0, o = 0;
+        for ( int i = 0; i < INTRL_KEYLEN; i++ ) {
+            if (interleaveKey[i]) o++;
+            else z++;
+        }
+        // printf("Interleaving with %u in middle and %u at end\n", o, z);
+    }
+    // printf("interleave key begins %016llx\n", *(unsigned long long*)interleaveKey);
+    // printf("interleave key begins %016llx\n", *(unsigned long long*)(interleaveKey+8));
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+    // printf("sample interleave value %d\n", nextInterleave);
+  #endif
     ui = (B_UserItem*) malloc( (size_t)NumNodes * (size_t)sizeof(B_UserItem) );
     if (!ui) {
 …
     memset(listedItems, 0, (size_t)NumNodes * (size_t)sizeof(BFX_LISTED_ELEM_T(B_UserItem)));
     // Fill with demo data
+    // Construct and fill with demo data
     for (unsigned int i = 0; i < NumNodes; i++) {
         B_UserItem * curUI = & ui[INSERTPOS(i)];
+        curUI->userdata[17] = i;
+      #ifdef __cforall
+        (*curUI){};
+      #endif
+        curUI->userdata[ UDATA_USE_POS ] = i;
+    }
 …
     //   lst    lvalue of the list head being added to / removed from
     //   iters  array of ADD return values, in logical-insert order; on ADD, is valid at [0..insNo)
     //   insNo  counter of the ADD calls (logical insert number)
     //   remNo  counter of the REM calls (logical remove number)
+    //   insNo  interleave-perturbed counter of the ADD calls (logical insert number)
+    //   remNo  interleave-perturbed counter of the REM calls (logical remove number)
     //   item   lvalue of the item being added
     // Logical insert number 0 and remove number n-1 are given with a distinguished hook.
 …
     double elapsed_sec = 0;
     clock_t start = clock();
+    const unsigned int numMiddleNodes = (NumNodes-1) * InterleaveFrac;
+    const unsigned int numEndNodes = NumNodes - numMiddleNodes - 1;
+    // printf("Running with %u in the middle and %u at end\n", numMiddleNodes, numEndNodes);
+    const unsigned int removeBase[] = {0, numEndNodes};
+    const unsigned int removeLimit[] = {numEndNodes, numMiddleNodes};
     size_t privateOpsCompleted = 0;
 …
     while (elapsed_sec <= (double) ExperimentDurSec && privateOpsCompleted < ExperimentDurOpCount) {
         for ( int t = 0; t < CheckDonePeriod; t += 1 ) {
             TRACE('a')
+            TRACE('a')              // insert special first
             listedItems[0] =
                 BOP_INIT(lst, listedItems, 0, ui[INSERTPOS(0)]);
             TRACE('b')
+            TRACE('b')              // insert general
             for ( int privateCurInsert = 1;
                   (bobs_prog_inserting = privateCurInsert, privateCurInsert < NumNodes);
 …
                 TRACE('+')
+            }
+            TRACE('c')
+            for ( int privateCurRemove = 1;
+                  (bobs_prog_removing = privateCurRemove, privateCurRemove < NumNodes);
+                  privateCurRemove += 1
+            TRACE('c')              // remove general
+            int removeProgress[] = { 0, 0 };
+            for ( int flip = 0;
+                  (bobs_prog_removing = removeProgress[0] + removeProgress[1] + 1,
+                     bobs_prog_removing_end = removeProgress[0] + 1,
+                     flip = nextInterleave,
+                     removeProgress[0] < removeLimit[0] && removeProgress[1] < removeLimit[1] );
+                  removeProgress[flip] += 1
                 ) {
                 TRACE('-')
                 BOP_REMOVE( lst, listedItems, privateCurRemove-1 );
+                BOP_REMOVE( lst, listedItems, removeBase[flip]+removeProgress[flip] );
                 TRACE('+')
+            }
+            TRACE('D')
+            TRACE('X')              // remove imbalanced
+            // most work done under general; it stops when either flip-side's work finishes
+            // now drain any stragglers so both flip-sides' work finishes
+            for ( int flip = 0; flip < 2; flip ++ ) {
+                for ( ; (bobs_prog_removing = removeProgress[0] + removeProgress[1] + 1,
+                         bobs_prog_removing_end = removeProgress[0] + 1,
+                         removeProgress[flip] < removeLimit[flip] )
+                      ;  removeProgress[flip] += 1
+                    ) {
+                    TRACE('-')
+                    BOP_REMOVE( lst, listedItems, removeBase[flip]+removeProgress[flip] );
+                    TRACE('+')
+                }
+            }
+            TRACE('D')              // remove special last
             BOP_TEARDOWN(lst, listedItems, NumNodes-1);
             TRACE('d')
 …
             TRACE('e')
             bobs_prog_inserting = 0;
+            bobs_prog_removing = 0;
+            bobs_prog_removing = 0;
+            bobs_prog_removing_end = 0;
             bobs_ops_completed = privateOpsCompleted;
             TRACE('f')
 …
     free(ui);
     free(listedItems);
+  #ifndef DISABLE_SHUFFLING_INDIRECTION
     free(insertOrdShuf);
+  #endif
+}

doc/theses/mike_brooks_MMath/benchmarks/list/fx-cfa-cfa.h

-              rda10157
+              r1eea589f
+#include <containers/list.hfa>
+#define BFX_INTRUSION(S)                         inline dlink(S);
+#define BFX_EXTRUSION_DECL(S)
+#define BFX_EXTRUSION_FOLLOWUP(S)                P9_EMBEDDED( S, dlink(S) )
+#define BFX_LIST_HEAD_T(S)                       dlist(S)
+#define BFX_LISTED_ELEM_T(S)                     S*
+#define BFX_INSERT_FIRST(S, lst, item)           (insert_first (lst, item), (S*)&(item))
+#define BFX_INSERT_LAST(S, lst, item)            (insert_last  (lst, item), (S*)&(item))
+#define BFX_INSERT_BEFORE(S, lst, item, refIter) (insert_before(*refIter, item), (S*)&(item))
+#define BFX_INSERT_AFTER(S, lst, item, refIter)  (insert_after (*refIter, item), (S*)&(item))
+#define BFX_REMOVE_FIRST(S, lst)                 remove( first( lst ) )
+#define BFX_REMOVE_LAST(S, lst)                  remove( last( lst ) )
+#define BFX_REMOVE_HERE(S, lst, refIter)         remove(*refIter)
+#define BFX_INIT(S, lst)
+#define BFX_GET_AFTER(S, lst, iter)              (&next( *iter))
+#define BFX_GET_BEFORE(S, lst, iter)             (&prev( *iter ))
+#define BFX_IS_VALID_POS(S, lst, iter)           ((iter)!=NULL)
+#define BFX_DEREF_POS(S, lst, iter)              (iter)
+#include "libcfa-fork-list.hfa" // same folder: latest and greatest
+#include "fx-cfa-GENERAL.h"

doc/theses/mike_brooks_MMath/benchmarks/list/fx-lq-list.h

-              rda10157
+              r1eea589f
 #include <assert.h>
 #include <stddef.h>
+#include <stdbool.h>
 #define HEADNAME_(S)                             S ## Head
 …
 #define BFX_INSERT_BEFORE(S, lst, item, refIter) ({LIST_INSERT_BEFORE(refIter, &item, xx); &item;})
 #define BFX_INSERT_AFTER(S, lst, item, refIter)  ({LIST_INSERT_AFTER(refIter, &item, xx); &item;})
 #define BFX_REMOVE_FIRST(S, lst)                 LIST_REMOVE( LIST_FIRST( &lst ), xx )
+#define BFX_REMOVE_FIRST(S, lst)                 ({ S * first = LIST_FIRST( &lst ); LIST_REMOVE( first, xx ); })
 #define BFX_REMOVE_LAST(S, lst)                  assert(false&&"unimplemented REMOVE_LAST on lq-list")
 #define BFX_REMOVE_HERE(S, lst, refIter)         LIST_REMOVE( refIter, xx )

doc/theses/mike_brooks_MMath/benchmarks/list/fx-lq-tailq.h

rda10157	r1eea589f
1	1	#include <sys/queue.h>
	2	#include <stdbool.h>
2	3
3	4	#define HEADNAME_(S) S ## Head

doc/theses/mike_brooks_MMath/benchmarks/list/observation.c

-              rda10157
+              r1eea589f
     printSuccs(leash - 1);
+}
 static void explore(int here) {
+static void explore(int here, unsigned int leash) {
     bobs_seek(here);
     if (!bobs_hasCurrent()) {
 …
+    }
     bobs_movePrev();
     printPreds(2);
+    printPreds(leash);
     bobs_seek(here);
 …
     bobs_moveNext();
     printSuccs(2);
+    printSuccs(leash);
+}
 static void exploreRange(int validFrom, int validTo) {
 …
+    }
+    explore(listFirstmost);
+    printf(" v%d..%d ", listFirstmost, listLastmost);
+    explore(listFirstmost, 6);
     printf(" ...");
     if (gapsize > 5) {
         explore(midpoint);
         printf(" ...");
+    }
     explore(listLastmost);
+    // if (gapsize > 5) {
+    //     explore(midpoint);
+    //     printf(" ...");
+    // }
+    explore(listLastmost, 6);
+}
 …
         printf("%8zd + ? (rolling over)\n", bobs_ops_completed);
     } else {
         printf("%8zd + %6d/2 + %6d/2", bobs_ops_completed, bobs_prog_inserting, bobs_prog_removing);
+        printf("%8zd + %6d/2 + %6d/2, %6d@e %6d_u", bobs_ops_completed, bobs_prog_inserting, bobs_prog_removing, bobs_prog_removing_end, *bobs_prog_rem_pos);
         int validFrom, validTo;
 …
             case stack:
                 validFrom = 0;
                 validTo = MIN((signed)bobs_prog_inserting-1, (signed)NumNodes - (signed)bobs_prog_removing - 1);
+                validTo = MIN((signed)bobs_prog_inserting-1, (signed)NumNodes - (signed)*bobs_prog_rem_pos - 1);
                 break;
             case queue:
                 validFrom = (signed)bobs_prog_removing;
+                validFrom = (signed)*bobs_prog_rem_pos;
                 validTo = (signed)bobs_prog_inserting-1;
                 break;

doc/theses/mike_brooks_MMath/benchmarks/list/observation.h

-              rda10157
+              r1eea589f
     extern volatile unsigned int bobs_prog_inserting;
     extern volatile unsigned int bobs_prog_removing;
+    extern volatile unsigned int bobs_prog_removing_end;
     extern volatile unsigned int bobs_prog_rollover_flag;
+    extern volatile unsigned int const * bobs_prog_rem_pos;
     // observation.c defines

doc/theses/mike_brooks_MMath/benchmarks/list/op-queue-insfirst-remelem.h

rda10157	r1eea589f
7	7	#define BOP_INSERT(lst, iters, insNo, item) BFX_INSERT_FIRST(B_UserItem, lst, (item))
8	8	#define BOP_REMOVE(lst, iters, remNo) BFX_REMOVE_HERE(B_UserItem, lst, iters[(remNo)])
	9
	10	#define BOP_REMPROGEND_IS_REMNO_BASED true

doc/theses/mike_brooks_MMath/benchmarks/list/op-queue-inslast-remelem.h

rda10157	r1eea589f
7	7	#define BOP_INSERT(lst, iters, insNo, item) BFX_INSERT_LAST(B_UserItem, lst, (item))
8	8	#define BOP_REMOVE(lst, iters, remNo) BFX_REMOVE_HERE(B_UserItem, lst, iters[(remNo)])
	9
	10	#define BOP_REMPROGEND_IS_REMNO_BASED true

doc/theses/mike_brooks_MMath/benchmarks/list/op-stack-insfirst-remelem.h

rda10157	r1eea589f
7	7	#define BOP_INSERT(lst, iters, insNo, item) BFX_INSERT_FIRST(B_UserItem, lst, (item))
8	8	#define BOP_REMOVE(lst, iters, remNo) BFX_REMOVE_HERE(B_UserItem, lst, iters[NumNodes-(remNo)-1])
	9
	10	#define BOP_REMPROGEND_IS_REMNO_BASED true

doc/theses/mike_brooks_MMath/benchmarks/list/op-stack-inslast-remelem.h

rda10157	r1eea589f
7	7	#define BOP_INSERT(lst, iters, insNo, item) BFX_INSERT_LAST(B_UserItem, lst, (item))
8	8	#define BOP_REMOVE(lst, iters, remNo) BFX_REMOVE_HERE(B_UserItem, lst, iters[NumNodes-(remNo)-1])
	9
	10	#define BOP_REMPROGEND_IS_REMNO_BASED true

libcfa/src/collections/list.hfa

-              rda10157
+              r1eea589f
 // part), by failing fast.
+#if defined( __x86_64 )
+        // Preferred case: tag in the most-significant bit.  Dereference has been shown to segfault consistently.
+        // Maintenance should list more architectures as "ok" here, to let them use the preferred case, when valid.
+        #define ORIGIN_TAG_BITNO ( 8 * sizeof( size_t ) - 1 )
+#else
+        // Fallback case: tag in the least-significant bit.  Dereference will often give an alignment error, but may not,
+        // e.g. if accessing a char-typed member.  32-bit x86 uses the most-significant bit for real room on the heap.
+        #define ORIGIN_TAG_BITNO 0
+#ifdef __EXPERIMENTAL_DISABLE_OTAG__ // Perf experimentation alt mode
+    // With origin tagging disabled, iteration never reports "no more elements."
+    // In this mode, the list API is buggy.
+    // This mode is used to quantify the cost of the normal tagging scheme.
+    #define ORIGIN_TAG_SET(p)   (p)
+    #define ORIGIN_TAG_CLEAR(p) (p)
+    #define ORIGIN_TAG_QUERY(p) 0
+    #define ORIGIN_TAG_ASGN(p, v) (p)
+    #define ORIGIN_TAG_EITHER(p, v) (p)
+    #define ORIGIN_TAG_NEQ(v1, v2) 0
+#else // Normal
+    #if defined( __x86_64 )
+        // Preferred case: tag in the most-significant bit.  Dereference
+        // has been shown to segfault consistently.  Maintenance should
+        // list more architectures as "ok" here, to let them use the
+        // preferred case, when valid.
+        #define ORIGIN_TAG_BITNO ( 8 * sizeof( size_t ) - 1 )
+    #else
+        // Fallback case: tag in the least-significant bit.  Dereference
+        // will often give an alignment error, but may not, e.g. if
+        // accessing a char-typed member.  32-bit x86 uses the most-
+        // significant bit for real room on the heap.
+        #define ORIGIN_TAG_BITNO 0
+    #endif
+    #define ORIGIN_TAG_MASK (((size_t)1) << ORIGIN_TAG_BITNO)
+    #define ORIGIN_TAG_SET(p) ((p) |  ORIGIN_TAG_MASK)
+    #define ORIGIN_TAG_CLEAR(p) ((p) & ~ORIGIN_TAG_MASK)
+    #define ORIGIN_TAG_QUERY(p) ((p) &  ORIGIN_TAG_MASK)
+    #define ORIGIN_TAG_ASGN(p, v) ( \
+        verify( ! ORIGIN_TAG_QUERY(p) && "p had no tagbit" ), \
+        ORIGIN_TAG_EITHER((p), (v)) \
+    )
+    #define ORIGIN_TAG_EITHER(p, v) ( \
+        verify( ! ORIGIN_TAG_CLEAR(v) && "v is a pure tagbit" ), \
+        ( (p) | (v) ) \
+    )
+    #define ORIGIN_TAG_NEQ(v1, v2) ( \
+        verify( ! ORIGIN_TAG_CLEAR(v1) && "v1 is a pure tagbit" ), \
+        verify( ! ORIGIN_TAG_CLEAR(v2) && "v2 is a pure tagbit" ), \
+        ( (v1) ^ (v2) ) \
+    )
 #endif
+#define ORIGIN_TAG_MASK (((size_t)1) << ORIGIN_TAG_BITNO)
+#define ORIGIN_TAG_SET( p )   ((p) |  ORIGIN_TAG_MASK)
+#define ORIGIN_TAG_CLEAR( p ) ((p) & ~ORIGIN_TAG_MASK)
+#define ORIGIN_TAG_QUERY( p ) ((p) &  ORIGIN_TAG_MASK)
+#ifdef __EXPERIMENTAL_LOOSE_SINGLES__ // Perf experimentation alt mode
+    // In loose-singles mode, the ability to answer an "is listed" query is disabled, as is "to insert an element,
+    // it must not be listed already" checking.  The user must know separately whether an element is listed.
+    // Other than inserting it, any list-api action on an unlisted element is undefined.  Notably, list iteration
+    // starting from an unlisted element is not defined to respond "no more elements," and may instead continue
+    // iterating from a formerly occupied list position.  This mode matches LQ usage.
+    #define NOLOOSE(...)
+    #define LOOSEONLY(...) __VA_ARGS__
+#else // Normal
+    #define NOLOOSE(...) __VA_ARGS__
+    #define LOOSEONLY(...)
+#endif
 forall( tE & ) {
 …
         static inline void ?{}( dlink( tE ) & this ) {
+          NOLOOSE(
                 this.next = this.prev = 0p;
+          )
+        }
 …
 static inline forall( tE &, tLinks & | embedded( tE, tLinks, dlink( tE ) ) ) {
         bool isListed( tE & node ) {
+      NOLOOSE(
                 verify( &node != 0p );
                 dlink( tE ) & node_links = node`inner;
                 return (node_links.prev != 0p) || (node_links.next != 0p);
+          )
+          LOOSEONLY(
+        verify(false && "isListed is undefined");
+                return true;
+          )
+        }
 …
                 dlink( tE ) & linkToInsert = node`inner;
+      NOLOOSE(
                 verify( linkToInsert.next == 0p );
                 verify( linkToInsert.prev == 0p );
+          )
                 tE & list_pos_elem = *(tE *)ORIGIN_TAG_CLEAR( (size_t)&before );
 …
                 dlink( tE ) & linkToInsert = node`inner;
+      NOLOOSE(
                 verify( linkToInsert.prev == 0p );
                 verify( linkToInsert.next == 0p );
+          )
                 tE & list_pos_elem = *(tE *)ORIGIN_TAG_CLEAR( (size_t)&after );
 …
                 before_links.next = &after_raw;
                 after_links.prev = &before_raw;
+      NOLOOSE(
                 asm( "" : : : "memory" );
                 list_pos_links.prev = 0p;
                 list_pos_links.next = 0p;
                 asm( "" : : : "memory" );
+          )
                 return node;
+        }

libcfa/src/stdhdr/assert.h

-              rda10157
+              r1eea589f
         #define warnf( expr, fmt, ... ) ({ static bool check_once##__LINE__ = false; if( false == check_once##__LINE__ && false == (expr)) { check_once##__LINE__ = true; __assert_warn_f(__VSTRINGIFY__(expr), __FILE__, __LINE__, __PRETTY_FUNCTION__, fmt, ## __VA_ARGS__ ); } })
 #else
         #define verify(x)
         #define verifyf(x, ...)
         #define verifyfail(...)
         #define warnf( expr, fmt, ... )
+        #define verify(x) 0
+        #define verifyf(x, ...) 0
+        #define verifyfail(...) 0
+        #define warnf( expr, fmt, ... ) 0
 #endif

Note: See TracChangeset for help on using the changeset viewer.

Download in other formats: