Context Navigation

source: doc/theses/colby_parsons_MMAth/benchmarks/channels/run @ e2f827f

ADTast-experimental

Last change on this file since e2f827f was 2f6a9391, checked in by caparsons <caparson@…>, 15 months ago
added first channel bench and copied over scripts that will need to be edited for channel usage. intermediate commit so that benchmarks can be pulled and run on another server
Property mode set to `100755`
File size: 6.3 KB

Line
1	#!/bin/bash -
2
3	false=0; true=1
4
5	# Usage: arch [ hostname ] returns hostname, cores, startcore
6	#
7	# Define machine architecture based on starting socket, CPUs (cores) per socket, number of
8	# sockets, has hyperthreading.
9
10	start=0
11
12	arch() {
13	hostname=${1:-`hostname`} # return value
14	hashyper=${true} # assume machine has hyperthreads
15	if [ "${hostname}" = "plg2" ] ; then
16	startsocket=${start}
17	cps=16 # coresPerSocket
18	sockets=2
19	hashyper=${false} # has no hyperthreads
20	elif [ "${hostname}" = "nasus" ] ; then
21	startsocket=${start}
22	cps=64 # coresPerSocket
23	sockets=2
24	elif [ "${hostname}" = "pyke" ] ; then
25	startsocket=${start}
26	cps=24 # coresPerSocket
27	sockets=2
28	elif [ "${hostname}" = "jax" ] ; then
29	startsocket=${start}
30	cps=24 # coresPerSocket
31	sockets=4
32	else
33	echo "unsupported host" ${hostname}
34	exit 1
35	fi
36	cores=$(( ${cps} * ${sockets} ))
37	startcore=$(( ${startsocket} * ${cps} ))
38	}
39
40	# Usage: affinity (global cps, sockets, startsocket, hashyper, cores, startcore, wrap)
41	# returns taskset argument
42	#
43	# This routine assumes hyperthreading has only 2 hyperthreads per core.
44	#
45	# If hyperthread scanning is used: processor units are assigned across the low-number hyperthreads
46	# of the socket's cores. When the low-number hyperthreads are filled, the high-number hyperhtreads
47	# are assigned across the socket's cores. Then the next socket is assigned.
48	#
49	# If hyperthread wrapping is used: processor units are assigned in low/high-number pairs of
50	# hyperthreads across the socket's cores. Then the next socket is assigned.
51
52	wrap=${false} # set to control hyperthread assignment across socket cores
53
54	affinity() {
55	if [ ${wrap} -eq ${true} -a ${hashyper} -eq ${false} ] ; then
56	echo "architecture does not support hyperthreading for wrapping"
57	exit 1
58	fi
59	taskset="" # return value
60	set -- $(( ${1} - 1 )) # decrement $1
61	if [ ${1} -eq 0 ] ; then taskset="${startcore}-${startcore}"; return; fi
62	if [ ${1} -ge $(( ${cps} * ( ${sockets} - ${startsocket} ) * ( ${hashyper} + 1 ) )) ] ; then # error
63	echo "not enough cores $(( ${cores} * ${sockets} )) for $(( ${1} + 1 )) starting at ${startcore}"
64	exit 1
65	fi
66	if [ ${hashyper} -eq ${false} ] ; then taskset="${startcore}-$(( ${1} + ${startcore} ))"; return; fi # no hyperthreads
67	start2=$(( ${startcore} + ${cores} ))
68	if [ ${wrap} -eq ${true} ] ; then # hyperthread wrapping
69	end1=$(( ${1} / 2 + ${startcore} ))
70	end2=$(( ${end1} + ${cores} ))
71	if [ $(( ${1} % 2 )) -eq 0 ] ; then
72	end2=$(( ${end2} - 1 ))
73	fi
74	taskset="${startcore}-${end1},${start2}-${end2}"
75	else # hyperthread scanning
76	if [ ${1} -lt ${cps} ] ; then taskset="${startcore}-$(( ${1} + ${startcore} ))"; return; fi
77	filled=$(( ${1} / ( ${cps} * 2 ) * ${cps} ))
78	modulus=$(( ${1} % ( ${cps} * 2 ) )) # leftover cores added to saturated sockets
79	if [ ${modulus} -gt ${cps} ] ; then
80	taskset="${startcore}-$(( ${startcore} + ${filled} + ${cps} - 1 )),${start2}-$(( ${start2} + ${filled} + ${modulus} % ${cps} ))"
81	else
82	taskset="${startcore}-$(( ${startcore} + ${filled} + ${modulus} )),${start2}-$(( ${start2} + ${filled} - 1 ))"
83	fi
84	fi
85	}
86
87	numtimes=11
88
89	# locks=('-DLOCKS=L1' '-DLOCKS=L2' '-DLOCKS=L3' '-DLOCKS=L4' '-DLOCKS=L5' '-DLOCKS=L6' '-DLOCKS=L7' '-DLOCKS=L8')
90	# locks='1 2 3 4 5 6 7 8'
91	lock_flags=('-DLOCKS=L2' '-DLOCKS=L4' '-DLOCKS=L8')
92	locks=('2' '4' '8')
93
94	num_threads='2 4 8 16 24 32'
95	# num_threads='2 4 8'
96
97	# toggle benchmarks
98	order=${true}
99	rand=${true}
100	baseline=${true}
101
102	runCFA=${true}
103	runCPP=${true}
104	# runCFA=${false}
105	# runCPP=${false}
106
107	cfa=~/cfa-cc/driver/cfa
108	cpp=g++
109
110	# Helpers to minimize code duplication
111
112	# repeats a command ${numtimes}
113	preprint=''
114	repeat_command() {
115	t=1
116	while [ ${t} -le ${numtimes} ] ; do
117	echo -n -e ${preprint}
118	"${@}"
119	t=`expr ${t} + 1`
120	done
121	}
122
123	# prints the leading info for a given run of a variant
124	print_header() {
125	echo ${1}':'
126	echo -e "cores\tthroughput (entries)"
127	}
128
129	# runs the current benchmark with provided args
130	# only works for standard-run benchmarks (not Akka)
131	# must split into pre and post args to be able to supply val of p
132	pre_args=''
133	post_args=''
134	single_run() {
135	affinity ${1}
136	preprint="${1}\t"
137	repeat_command taskset -c ${taskset} ./a.${hostname} ${pre_args} ${1} ${post_args}
138	}
139
140	# runs the current bench for all processor vals
141	# works for standard benchs that dont need to set a config file (not Akka or CAF)
142	run_bench() {
143	for p in ${num_threads} ; do
144	single_run ${p}
145	done
146	}
147
148	arch # get hostname
149
150	# set up leading info for python script
151	echo $numtimes
152	echo $num_threads
153
154	for i in ${!locks[@]}; do
155	echo -n ${locks[$i]}' '
156	done
157	echo ""
158
159	if [ ${runCFA} -eq ${true} ] && [ ${order} -eq ${true} ]; then
160	echo -n 'CFA-order '
161	fi
162	if [ ${runCPP} -eq ${true} ] && [ ${order} -eq ${true} ]; then
163	echo -n 'CPP-order '
164	fi
165	if [ ${runCFA} -eq ${true} ] && [ ${baseline} -eq ${true} ]; then
166	echo -n 'CFA-baseline '
167	fi
168	if [ ${runCPP} -eq ${true} ] && [ ${baseline} -eq ${true} ]; then
169	echo -n 'CPP-baseline '
170	fi
171	if [ ${runCFA} -eq ${true} ] && [ ${rand} -eq ${true} ]; then
172	echo -n 'CFA-rand '
173	fi
174	if [ ${runCPP} -eq ${true} ] && [ ${rand} -eq ${true} ]; then
175	echo -n 'CPP-rand '
176	fi
177	echo ""
178
179	# done printing header info for output
180
181	# cfa flags
182	cfa_flags='-quiet -O3 -nodebug -DNDEBUG'
183
184	# cpp flagse
185	cpp_flags='-O3 -std=c++17 -lpthread -pthread -DNDEBUG'
186
187	# run the benchmarks
188
189	run_order() {
190	post_args=${1}
191
192	if [ ${runCFA} -eq ${true} ] ; then
193	cd cfa # CFA RUN
194	print_header 'CFA-'${3}
195	${cfa} ${cfa_flags} ${2} ${3}.cfa -o a.${hostname} > /dev/null 2>&1
196	run_bench
197	rm a.${hostname}
198	cd - > /dev/null
199	fi # done CFA
200
201	if [ ${runCPP} -eq ${true} ] ; then
202	cd cpp # CPP RUN
203	print_header 'CPP-'${3}
204	${cpp} ${cpp_flags} ${2} ${3}.cc -o a.${hostname} > /dev/null 2>&1
205	run_bench
206	rm a.${hostname}
207	cd - > /dev/null
208	fi # done CPP
209	}
210
211	# /usr/bin/time -f "%Uu %Ss %Er %Mkb"
212
213	for i in ${!locks[@]}; do
214	echo "locks: "${locks[$i]}
215	if [ ${order} -eq ${true} ] ; then
216	run_order ${locks[$i]} ${lock_flags[$i]} 'order'
217	fi
218	if [ ${baseline} -eq ${true} ] ; then
219	run_order ${locks[$i]} ${lock_flags[$i]} 'baseline'
220	fi
221	if [ ${rand} -eq ${true} ] ; then
222	run_order ${locks[$i]} '-DLOCKS=L8' 'rand'
223	fi
224	done
225
226

Note: See TracBrowser for help on using the repository browser.

Download in other formats: