[90a3a89] | 1 | # For correctness, see test-correctness.sh. |
---|
| 2 | # For performance: |
---|
[e9ed2a1] | 3 | # pushd ~/cfax |
---|
| 4 | # . ~/setcfa build-fast |
---|
| 5 | # popd |
---|
| 6 | # make perfprogs CFA=$cfa -j8 MODE=performance |
---|
| 7 | # make results-latest.csv RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=common5 |
---|
| 8 | # cp results-latest.csv results-baseline.csv |
---|
| 9 | # make results-latest.csv OP_MOVEMENTS=stack OP_POLARITIES=insfirst OP_ACCESSORS=allhead RUN_DURATION_SEC=5 RUN_NUM_REPS=5 RUN_DATA_SIZE_MODE=thorough |
---|
| 10 | # cp results-latest.csv results-sizing.csv |
---|
[0b66ef9] | 11 | |
---|
| 12 | CFA = cfa |
---|
| 13 | CXX = g++-11 |
---|
| 14 | UXX = ~/u++/u++-7.0.0/bin/u++ |
---|
| 15 | |
---|
[1dfc3d0] | 16 | MODE=performance |
---|
| 17 | EXTRA_COMP_FLAGS= |
---|
| 18 | RUN_NUM_REPS=3 |
---|
[9bb8ee42] | 19 | RUN_DATA_SIZE_MODE=none |
---|
| 20 | RUN_DURATION_SEC=5 |
---|
[e9ed2a1] | 21 | RUN_TASKSET_CPULIST=6 |
---|
[0b66ef9] | 22 | |
---|
| 23 | ifeq "$(MODE)" "performance" |
---|
[e9ed2a1] | 24 | PERFFLAGS_CFA = -DNDEBUG -O3 -nodebug |
---|
[0b66ef9] | 25 | PERFFLAGS_CC = -DNDEBUG -O3 |
---|
| 26 | else ifeq "$(MODE)" "correctness" |
---|
[e9ed2a1] | 27 | PERFFLAGS_CFA = -O0 -g -debug |
---|
| 28 | PERFFLAGS_CC = -O0 -g |
---|
[0b66ef9] | 29 | else |
---|
| 30 | $(error Bad MODE ($(MODE)); should be performance or correctness) |
---|
| 31 | endif |
---|
| 32 | |
---|
| 33 | PERFFLAGS_CXX = $(PERFFLAGS_CC) |
---|
[e9ed2a1] | 34 | PERFFLAGS_UXX = $(PERFFLAGS_CFA) |
---|
[0b66ef9] | 35 | |
---|
[2b01f8e] | 36 | CFLAGS=$(PERFFLAGS_CC) $(EXTRA_COMP_FLAGS) |
---|
| 37 | |
---|
[0b66ef9] | 38 | SHELL = /usr/bin/bash |
---|
| 39 | |
---|
| 40 | # function: project an element from a filename that contains a delimited tuple |
---|
| 41 | # (call proj,-,a-b-c.hfa,3) |
---|
| 42 | # is |
---|
| 43 | # c |
---|
| 44 | define proj |
---|
| 45 | $(word $(3),$(subst $(1), ,$(basename $(2)))) |
---|
| 46 | endef |
---|
| 47 | |
---|
| 48 | # functions: cross two lists, adding given delimiter between |
---|
| 49 | # (call cross,-,a b c,1 2) |
---|
| 50 | # is |
---|
| 51 | # a-1 a-2 b-1 b-2 c-1 c-2 |
---|
| 52 | define cross |
---|
| 53 | $(foreach lhs,$(2),$(foreach rhs,$(3),$(lhs)$(1)$(rhs))) |
---|
| 54 | endef |
---|
| 55 | define cross3 |
---|
| 56 | $(call cross,$(1),$(2),$(call cross,$(1),$(3),$(4))) |
---|
| 57 | endef |
---|
| 58 | define cross4 |
---|
| 59 | $(call cross,$(1),$(2),$(call cross3,$(1),$(3),$(4),$(5))) |
---|
| 60 | endef |
---|
| 61 | define cross5 |
---|
| 62 | $(call cross,$(1),$(2),$(call cross4,$(1),$(3),$(4),$(5),$(6))) |
---|
| 63 | endef |
---|
| 64 | |
---|
| 65 | OP_MOVEMENTS=stack queue |
---|
| 66 | OP_POLARITIES=insfirst inslast |
---|
| 67 | OP_ACCESSORS=allhead inselem remelem |
---|
| 68 | FX_SOLUTIONS=lq-tailq lq-list cfa-cfa upp-upp cpp-stlref |
---|
| 69 | |
---|
| 70 | OPS=$(call cross3,-,$(OP_MOVEMENTS),$(OP_POLARITIES),$(OP_ACCESSORS)) |
---|
| 71 | FXS=$(FX_SOLUTIONS) |
---|
| 72 | |
---|
| 73 | all : perfprogs results-latest.csv |
---|
| 74 | |
---|
| 75 | # Want to add functional dependency: |
---|
| 76 | # if current FX_SOLUTION is lq-list then |
---|
| 77 | # current OP_MOVEMENT must be stack and |
---|
| 78 | # current OP_POLARITY must be insfirst |
---|
| 79 | LQ_LIST_INCOMPAT_OP_MOVEMENTS=$(filter-out stack,$(OP_MOVEMENTS)) |
---|
| 80 | LQ_LIST_INCOMPAT_OP_POLARITIES=$(filter-out insfirst,$(OP_POLARITIES)) |
---|
| 81 | LQ_LIST_INCOMPAT_OPS=$(call cross3,-,$(LQ_LIST_INCOMPAT_OP_MOVEMENTS),$(OP_POLARITIES),$(OP_ACCESSORS)) \ |
---|
| 82 | $(call cross3,-,$(OP_MOVEMENTS),$(LQ_LIST_INCOMPAT_OP_POLARITIES),$(OP_ACCESSORS)) |
---|
| 83 | INCOMPAT=$(call cross,--,lq-list,$(LQ_LIST_INCOMPAT_OPS)) |
---|
| 84 | define filterFds |
---|
| 85 | $(filter-out $(INCOMPAT),$(1)) |
---|
| 86 | endef |
---|
| 87 | |
---|
| 88 | |
---|
| 89 | CORES_FULL=$(call cross,--,$(FXS),$(OPS)) # lq-tailq--stack-inslast-allhead |
---|
| 90 | CORES=$(call filterFds,$(CORES_FULL)) # lq-tailq--stack-inslast-allhead |
---|
| 91 | |
---|
| 92 | |
---|
| 93 | PERFPROGS=$(call cross,--,perfexp,$(CORES)) |
---|
| 94 | |
---|
| 95 | perfprogs : $(PERFPROGS) |
---|
| 96 | |
---|
| 97 | perfexp--% driver--%.o result--%.1csv : FX=$(call proj,--,$@,2) |
---|
| 98 | perfexp--% driver--%.o result--%.1csv : FX_COARSE=$(call proj,-,$(FX),1) |
---|
| 99 | perfexp--% driver--%.o result--%.1csv : OP=$(call proj,--,$@,3) |
---|
| 100 | perfexp--% driver--%.o result--%.1csv : OP_MOVEMENT=$(call proj,-,$(OP),1) |
---|
| 101 | perfexp--% driver--%.o result--%.1csv : OP_POLARITY=$(call proj,-,$(OP),2) |
---|
| 102 | perfexp--% driver--%.o result--%.1csv : OP_ACCESSOR=$(call proj,-,$(OP),3) |
---|
| 103 | perfexp--% driver--%.o result--%.1csv : OP_DEFINES=-DOP_MOVEMENT=$(OP_MOVEMENT) -DOP_POLARITY=$(OP_POLARITY) -DOP_ACCESSOR=$(OP_ACCESSOR) |
---|
| 104 | |
---|
| 105 | perfexp--cfa-% driver--cfa-%.o : COMPILER=$(CFA) $(PERFFLAGS_CFA) |
---|
| 106 | perfexp--lq-% driver--lq-%.o : COMPILER=$(CC) $(PERFFLAGS_CC) |
---|
| 107 | perfexp--cpp-% driver--cpp-%.o : COMPILER=$(CXX) $(PERFFLAGS_CXX) |
---|
| 108 | perfexp--upp-% driver--upp-%.o : COMPILER=$(UXX) $(PERFFLAGS_UXX) |
---|
| 109 | perfexp--% driver--%.o : COMPILER=NO-COMPILER-FOR-$(FX_COARSE) |
---|
| 110 | |
---|
[fdc042d] | 111 | # Without this %.d rule, ordinary make runs have noise about the recipe for driver--%.o being ill-formed when called on a *.d. |
---|
| 112 | # https://stackoverflow.com/questions/3714041/why-does-this-makefile-execute-a-target-on-make-clean |
---|
| 113 | # Whatever you -include gets called as a target first. |
---|
| 114 | # One such example is driver--upp-upp--stack-insfirst-allhead.d |
---|
| 115 | # Without this %.d rule, `make driver--upp-upp--stack-insfirst-allhead.d` leads to the rule for driver--%.o firing. |
---|
| 116 | # Though my dumb human eyes don't see the pattern as matching. |
---|
| 117 | %.d: |
---|
| 118 | @touch $@ |
---|
| 119 | |
---|
[0b66ef9] | 120 | perfexp--% : driver--%.o observation.o |
---|
[1dfc3d0] | 121 | $(COMPILER) $(EXTRA_COMP_FLAGS) $^ -o $@ |
---|
[0b66ef9] | 122 | |
---|
| 123 | driver--%.o : driver.c |
---|
[1dfc3d0] | 124 | $(COMPILER) $(EXTRA_COMP_FLAGS) -c $< $(OP_DEFINES) -include op-$(OP).h -include fx-$(FX).h -o $@ -MMD |
---|
[0b66ef9] | 125 | |
---|
[1dfc3d0] | 126 | sayhi: |
---|
| 127 | echo $(PERFPROGS) |
---|
[0b66ef9] | 128 | |
---|
| 129 | |
---|
[9bb8ee42] | 130 | ifeq "$(RUN_DATA_SIZE_MODE)" "common5" |
---|
| 131 | RUN_DATA_SIZES=\ |
---|
| 132 | 7-1000000 \ |
---|
| 133 | 71-100000 \ |
---|
| 134 | 809-10000 \ |
---|
| 135 | 9051-1000 \ |
---|
| 136 | 72421-100 |
---|
| 137 | else ifeq "$(RUN_DATA_SIZE_MODE)" "thorough" |
---|
| 138 | RUN_DATA_SIZES=\ |
---|
| 139 | 7-1000000 \ |
---|
| 140 | 11-100000 \ |
---|
| 141 | 13-100000 \ |
---|
| 142 | 19-100000 \ |
---|
| 143 | 29-100000 \ |
---|
| 144 | 37-100000 \ |
---|
| 145 | 53-100000 \ |
---|
| 146 | 71-100000 \ |
---|
| 147 | 101-10000 \ |
---|
| 148 | 149-10000 \ |
---|
| 149 | 211-10000 \ |
---|
| 150 | 283-10000 \ |
---|
| 151 | 401-10000 \ |
---|
| 152 | 569-10000 \ |
---|
| 153 | 809-10000 \ |
---|
| 154 | 1151-1000 \ |
---|
| 155 | 1601-1000 \ |
---|
| 156 | 2267-1000 \ |
---|
| 157 | 3203-1000 \ |
---|
| 158 | 4547-1000 \ |
---|
| 159 | 6473-1000 \ |
---|
| 160 | 9051-1000 \ |
---|
| 161 | 12809-100 \ |
---|
| 162 | 18119-100 \ |
---|
| 163 | 25601-100 \ |
---|
| 164 | 36209-100 \ |
---|
| 165 | 51203-100 \ |
---|
| 166 | 72421-100 \ |
---|
| 167 | 102407-10 \ |
---|
| 168 | 144817-10 \ |
---|
| 169 | 204803-10 \ |
---|
| 170 | 289637-10 \ |
---|
| 171 | 409609-10 \ |
---|
| 172 | 579263-10 \ |
---|
| 173 | 819229-10 \ |
---|
| 174 | 1158613-1 \ |
---|
| 175 | 1638431-1 \ |
---|
| 176 | 2317057-1 \ |
---|
| 177 | 3276803-1 \ |
---|
| 178 | 4634111-1 \ |
---|
| 179 | 6553621-1 \ |
---|
| 180 | 9268211-1 |
---|
| 181 | else ifeq "$(RUN_DATA_SIZE_MODE)" "manual" |
---|
| 182 | ifeq "$(RUN_DATA_SIZES)" "" |
---|
| 183 | $(error RUN_DATA_SIZE_MODE is manual but RUN_DATA_SIZES not given) |
---|
| 184 | endif |
---|
| 185 | else ifeq "$(RUN_DATA_SIZE_MODE)" "none" |
---|
| 186 | # Assume user manages RUN_ARGS; empty RUN_ARGS just means run with compiled-in defaults |
---|
| 187 | RUN_DATA_SIZES=none |
---|
| 188 | else |
---|
| 189 | $(error Bad RUN_DATA_SIZE_MODE ($(RUN_DATA_SIZE_MODE)); should be common5, thorough, manual or none) |
---|
| 190 | endif |
---|
| 191 | |
---|
[0b66ef9] | 192 | RUN_REP_IDS:=$(shell echo {1..$(RUN_NUM_REPS)}) # 1 2 3 (bash brace expansion, run once at parse time) |
---|
| 193 | RUN_REP_EXTS=$(call cross3,,run,$(RUN_REP_IDS),.1csv) # run1.1csv run2.1csv run3.1csv |
---|
| 194 | |
---|
[9bb8ee42] | 195 | RUN_LAUNCHES=$(call cross,--,$(RUN_DATA_SIZES),$(RUN_REP_EXTS)) |
---|
| 196 | |
---|
| 197 | |
---|
| 198 | |
---|
| 199 | RESULT1S=$(call cross,.,$(CORES),$(RUN_LAUNCHES)) # e.g. lq-tailq--stack-inslast-allhead.7-1000000--run2.1csv |
---|
| 200 | |
---|
[0b66ef9] | 201 | |
---|
| 202 | RESULT1S_SHUFD=$(shell shuf -e $(RESULT1S)) |
---|
| 203 | |
---|
| 204 | %.1csv : CORE=$(basename $(basename $@)) |
---|
[9bb8ee42] | 205 | %.1csv : LAUNCH=$(subst .,,$(suffix $(basename $@))) |
---|
| 206 | %.1csv : SIZING=$(call proj,--,$(LAUNCH),1) |
---|
| 207 | %.1csv : NUMNODES=$(call proj,-,$(SIZING),1) |
---|
| 208 | %.1csv : CHECKDONE=$(call proj,-,$(SIZING),2) |
---|
| 209 | %.1csv : REP_ID=$(subst run,,$(call proj,--,$(LAUNCH),2)) |
---|
[2b01f8e] | 210 | %.1csv : RUN_ARGS=$(if $(filter none,$(SIZING)),,$(RUN_DURATION_SEC) $(CHECKDONE) $(NUMNODES) -1 $(REP_ID)) # use REP_ID as seed |
---|
[0b66ef9] | 211 | %.1csv : REP_TIME=$(shell date '+%F %H:%M:%S') |
---|
| 212 | %.1csv : perfprogs FORCE |
---|
[e9ed2a1] | 213 | taskset --cpu-list $(RUN_TASKSET_CPULIST) ./perfexp--$(CORE) $(RUN_ARGS) | xargs -n 1 printf '%s,%s,%s,%s\n' "$(REP_TIME)" "$(REP_ID)" "$(RUN_ARGS)" | tee $@ |
---|
[9bb8ee42] | 214 | |
---|
[0b66ef9] | 215 | # Simply expanded so `date` runs once: the results--*.csv rule target and the results-latest.csv prerequisite must name the same file. |
---|
| 216 | BATCHTIME:=$(shell date '+%F--%H-%M-%S') |
---|
| 217 | |
---|
| 218 | results--$(BATCHTIME).csv : $(RESULT1S_SHUFD) |
---|
| 219 | cat $^ | tee $@ |
---|
| 220 | rm $^ |
---|
| 221 | |
---|
| 222 | results-latest.csv : results--$(BATCHTIME).csv |
---|
| 223 | rm -f $@ |
---|
| 224 | ln -s $< $@ |
---|
| 225 | |
---|
| 226 | |
---|
| 227 | |
---|
| 228 | clean : |
---|
| 229 | rm -f *.o *.d perfexp--* |
---|
| 230 | |
---|
| 231 | # The FORCE business means any target that mentions it is also phony |
---|
| 232 | # https://www.gnu.org/software/make/manual/html_node/Phony-Targets.html says: To always rebuild a pattern rule consider using a “force target” (see [https://www.gnu.org/software/make/manual/html_node/Force-Targets.html]). |
---|
| 233 | .PHONY: all perfprogs results-latest.csv clean sayhi |
---|
| 234 | FORCE: |
---|
| 235 | |
---|
| 236 | .PRECIOUS: result--%.1csv driver--%.o perfexp--% %.o |
---|
| 237 | |
---|
| 238 | -include *.d |
---|