#include <cassert>
#include <cerrno>
#include <climits>
#include <cstdint>
#include <cstdio>
#include <string>
#include <vector>

#include <time.h> // timespec
#include <sys/time.h> // timeval
|
---|
| 8 |
|
---|
// 128-bit state of the Lehmer-style generator below.
using __lehmer64_state_t = __uint128_t;

// Multiplies `state` in place by a fixed 64-bit constant (the product wraps at
// 128 bits) and returns the upper 64 bits of the new state.
static inline uint64_t __lehmer64( __lehmer64_state_t & state ) {
	const __lehmer64_state_t next = state * 0xda942042e4dd58b5;
	state = next;
	return static_cast<uint64_t>( next >> 64 );
}
|
---|
| 14 |
|
---|
// Ticks per second: nanosecond granularity, except for timeval.
enum { TIMEGRAN = 1000000000LL };


// ---- Benchmark configuration and shared run state ----

// Stop flag; not referenced in the visible part of this file.
volatile bool stop = false;

// true: the run is bounded by `duration`; false: by `stop_count` (set by BENCH_OPT_PARSE).
bool clock_mode;

// Requested run time in seconds (-d/--duration); a value <= 0 means "not given".
double duration = -1;

// Requested iteration count (-i/--iterations); 0 means "not given".
unsigned long long stop_count = 0;

// Number of processors (-p/--nprocs) and threads (-t/--nthreads) to use.
unsigned nprocs = 1;
unsigned nthreads = 1;

// wait() leaves its polling loop in iteration mode once this reads 0.
volatile unsigned long long threads_left;
|
---|
| 26 |
|
---|
// Rows for an option_t table binding -d/-i/-t/-p to the global benchmark
// settings; each row is { short flag, long name, help text, target variable }.
#define BENCH_OPT \
	{'d', "duration",   "Duration of the experiments in seconds",  duration   }, \
	{'i', "iterations", "Number of iterations of the experiments", stop_count }, \
	{'t', "nthreads",   "Number of threads to use",                nthreads   }, \
	{'p', "nprocs",     "Number of processors to use",             nprocs     }
|
---|
| 32 |
|
---|
// Parses the command line with the `opt` table visible at the expansion site
// (`argc` and `argv` must be visible there too), then decides how the run ends:
//   - both --duration and --iterations given: report the conflict, print usage (which exits);
//   - only --iterations: iteration-bound run;
//   - only --duration: time-bound run, stop_count is raised to its maximum value;
//   - neither: time-bound run with a default duration of 5 seconds.
// `name` must be a string literal; it is concatenated onto the usage header.
#define BENCH_OPT_PARSE(name) \
	{ \
		int opt_cnt = sizeof(opt) / sizeof(option_t); \
		char ** left; \
		parse_args( argc, argv, opt, opt_cnt, "[OPTIONS]...\n" name, &left ); \
		const bool timed = duration > 0; \
		const bool counted = stop_count > 0; \
		if( timed && counted ) { \
			fprintf(stderr, "--duration and --iterations cannot be used together\n"); \
			print_args_usage(argc, argv, opt, opt_cnt, "[OPTIONS]...\n" name, true); \
		} else if( counted ) { \
			clock_mode = false; \
			printf("Running for %llu iterations\n", stop_count); \
		} else { \
			if( timed ) { stop_count = 0xFFFFFFFFFFFFFFFF; } \
			else { duration = 5; } \
			clock_mode = true; \
			printf("Running for %lf seconds\n", duration); \
		} \
	}
|
---|
| 53 |
|
---|
[e54d0c3] | 54 | uint64_t timeHiRes() {
|
---|
[2c7eee0] | 55 | timespec curr;
|
---|
| 56 | clock_gettime( CLOCK_REALTIME, &curr );
|
---|
| 57 | return (int64_t)curr.tv_sec * TIMEGRAN + curr.tv_nsec;
|
---|
| 58 | }
|
---|
| 59 |
|
---|
| 60 | uint64_t to_miliseconds( uint64_t durtn ) { return durtn / (TIMEGRAN / 1000LL); }
|
---|
| 61 | double to_fseconds(uint64_t durtn ) { return durtn / (double)TIMEGRAN; }
|
---|
| 62 | uint64_t from_fseconds(double sec) { return sec * TIMEGRAN; }
|
---|
| 63 |
|
---|
[f9b2e73] | 64 | template<typename Sleeper>
|
---|
[2c7eee0] | 65 | void wait(const uint64_t & start, bool is_tty) {
|
---|
| 66 | for(;;) {
|
---|
[f9b2e73] | 67 | Sleeper::usleep(100000);
|
---|
[e54d0c3] | 68 | uint64_t end = timeHiRes();
|
---|
[2c7eee0] | 69 | uint64_t delta = end - start;
|
---|
| 70 | if(is_tty) {
|
---|
| 71 | printf(" %.1f\r", to_fseconds(delta));
|
---|
| 72 | fflush(stdout);
|
---|
| 73 | }
|
---|
| 74 | if( clock_mode && delta >= from_fseconds(duration) ) {
|
---|
| 75 | break;
|
---|
| 76 | }
|
---|
| 77 | else if( !clock_mode && threads_left == 0 ) {
|
---|
| 78 | break;
|
---|
| 79 | }
|
---|
| 80 | }
|
---|
| 81 | }
|
---|
| 82 |
|
---|
// Fibre runtime hooks used below; they are only declared here.
class Fibre;
int fibre_park();
int fibre_unpark( Fibre * );
Fibre * fibre_self();

// Single-slot semaphore built on one pointer word. `ptr` is always one of:
//   nullptr          - no pending post and no waiter;
//   the `ready` tag  - (address 1) a post arrived while nobody was waiting;
//   anything else    - the fibre that registered itself in wait().
class __attribute__((aligned(128))) bench_sem {
	Fibre * volatile ptr = nullptr;
public:
	// Consumes a pending post when there is one and returns false without
	// parking. Otherwise registers the calling fibre in `ptr`, calls
	// fibre_park() and returns true.
	inline bool wait() {
		static Fibre * const ready = reinterpret_cast<Fibre *>(1ull);
		for(;;) {
			Fibre * seen = this->ptr;
			if(seen != ready) {
				/* paranoid */ assert( seen == nullptr );
				if(__atomic_compare_exchange_n(&this->ptr, &seen, fibre_self(), false, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST)) {
					fibre_park();
					return true;
				}
				continue; // lost the race: reload and retry
			}

			if(__atomic_compare_exchange_n(&this->ptr, &seen, nullptr, false, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST)) {
				return false;
			}
		}
	}

	// Hands a post to the semaphore. Returns true when a registered fibre was
	// taken out of `ptr` and passed to fibre_unpark(); returns false when the
	// post was merely recorded (or one was already recorded).
	inline bool post() {
		static Fibre * const ready = reinterpret_cast<Fibre *>(1ull);
		for(;;) {
			Fibre * seen = this->ptr;
			if(seen == ready) return false;

			const bool had_waiter = seen != nullptr;
			Fibre * const next = had_waiter ? nullptr : ready;
			if(__atomic_compare_exchange_n(&this->ptr, &seen, next, false, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST)) {
				if(!had_waiter) return false;
				fibre_unpark( seen );
				return true;
			}
		}
	}
};
|
---|
| 130 |
|
---|
[2c7eee0] | 131 | // ==========================================================================================
|
---|
[f9b2e73] | 132 | #include <cstdlib>
|
---|
[2c7eee0] | 133 | #include <cstring>
|
---|
| 134 |
|
---|
[f9b2e73] | 135 | #include <algorithm>
|
---|
| 136 |
|
---|
[2c7eee0] | 137 | //-----------------------------------------------------------------------------
|
---|
| 138 | // Typed argument parsing
|
---|
// Accepts exactly "yes" or "no" and stores the matching boolean in `value`.
// Returns false, leaving `value` untouched, for any other text.
bool parse_yesno(const char * arg, bool & value ) {
	const bool is_yes = strcmp(arg, "yes") == 0;
	if( !is_yes && strcmp(arg, "no") != 0 ) return false;

	value = is_yes;
	return true;
}
|
---|
| 152 |
|
---|
// Accepts exactly "true" or "false" and stores the matching boolean in `value`.
// Returns false, leaving `value` untouched, for any other text.
bool parse_truefalse(const char * arg, bool & value) {
	if( 0 == strcmp(arg, "true") ) {
		value = true;
	} else if( 0 == strcmp(arg, "false") ) {
		value = false;
	} else {
		return false;
	}
	return true;
}
|
---|
| 166 |
|
---|
// Flag handler: ignores the argument text, sets `value` to true and always
// reports success. parse_args treats options using this handler as taking no argument.
bool parse_settrue (const char *, bool & value ) {
	return (value = true);
}
|
---|
| 171 |
|
---|
// Flag handler: ignores the argument text, clears `value` and always reports
// success. parse_args treats options using this handler as taking no argument.
bool parse_setfalse(const char * /* unused */, bool & value ) {
	value = false;

	const bool ok = true;
	return ok;
}
|
---|
| 176 |
|
---|
// String option: stores the argument pointer itself in `value` (the text is
// not copied) and always reports success.
bool parse(const char * arg, const char * & value ) {
	const char * const text = arg;
	value = text;
	return true;
}
|
---|
| 181 |
|
---|
// Parses a base-10 signed integer into `value`.
// Returns true on success. Returns false, leaving `value` untouched, when
// `arg` contains no number (e.g. it is empty), has trailing characters, or
// holds a number that does not fit in an int.
bool parse(const char * arg, int & value) {
	char * end;
	const long long r = strtoll(arg, &end, 10);
	if(end == arg) return false;     // nothing was converted
	if(*end != '\0') return false;   // trailing characters after the number

	// Also catches strtoll overflow: it saturates at LLONG_MIN/LLONG_MAX,
	// which lie outside the int range wherever long long is wider than int.
	if(r < INT_MIN || r > INT_MAX) return false;

	value = static_cast<int>(r);
	return true;
}
|
---|
| 190 |
|
---|
// Shared worker for the unsigned overloads in this group: parses a base-10
// number no larger than `max` into `out`.
// Returns false, leaving `out` untouched, when `arg` contains no number, has
// trailing characters, is out of range, or carries a minus sign. The sign is
// rejected explicitly because strtoull accepts it and negates the result, so
// "-1" would otherwise come back as ULLONG_MAX.
static bool parse_unsigned_checked(const char * arg, unsigned long long max, unsigned long long & out) {
	if(strchr(arg, '-') != nullptr) return false;

	char * end;
	errno = 0; // strtoull reports overflow only through errno
	const unsigned long long r = strtoull(arg, &end, 10);
	if(end == arg) return false;     // nothing was converted
	if(*end != '\0') return false;   // trailing characters after the number
	if(errno == ERANGE) return false;
	if(r > max) return false;

	out = r;
	return true;
}

// Parses a base-10 number into an unsigned; see parse_unsigned_checked for
// the inputs that are rejected. `value` is only written on success.
bool parse(const char * arg, unsigned & value) {
	unsigned long long r;
	if(!parse_unsigned_checked(arg, UINT_MAX, r)) return false;

	value = static_cast<unsigned>(r);
	return true;
}

// Parses a base-10 number into an unsigned long; see parse_unsigned_checked
// for the inputs that are rejected. `value` is only written on success.
bool parse(const char * arg, unsigned long & value) {
	unsigned long long r;
	if(!parse_unsigned_checked(arg, ULONG_MAX, r)) return false;

	value = static_cast<unsigned long>(r);
	return true;
}

// Parses a base-10 number into an unsigned long long; see
// parse_unsigned_checked for the inputs that are rejected. `value` is only
// written on success.
bool parse(const char * arg, unsigned long long & value) {
	unsigned long long r;
	if(!parse_unsigned_checked(arg, ULLONG_MAX, r)) return false;

	value = r;
	return true;
}
|
---|
| 220 |
|
---|
// Parses a floating-point number (anything strtod accepts) into `value`.
// Returns true on success. Returns false, leaving `value` untouched, when
// `arg` contains no number (e.g. it is empty) or has trailing characters.
bool parse(const char * arg, double & value) {
	char * end;
	const double r = strtod(arg, &end);
	if(end == arg) return false;     // nothing was converted
	if(*end != '\0') return false;   // trailing characters after the number

	value = r;
	return true;
}
|
---|
| 229 |
|
---|
| 230 | //-----------------------------------------------------------------------------
|
---|
| 231 | struct option_t {
|
---|
| 232 | char short_name;
|
---|
| 233 | const char * long_name;
|
---|
| 234 | const char * help;
|
---|
| 235 | void * variable;
|
---|
| 236 | bool (*parse_fun)(const char *, void * );
|
---|
| 237 |
|
---|
| 238 | template<typename T>
|
---|
| 239 | inline option_t( char short_name, const char * long_name, const char * help, T & variable ) {
|
---|
| 240 | this->short_name = short_name;
|
---|
| 241 | this->long_name = long_name;
|
---|
| 242 | this->help = help;
|
---|
| 243 | this->variable = reinterpret_cast<void*>(&variable);
|
---|
[56ac392] | 244 | #pragma GCC diagnostic push
|
---|
| 245 | #pragma GCC diagnostic ignored "-Wcast-function-type"
|
---|
| 246 | this->parse_fun = reinterpret_cast<bool (*)(const char *, void * )>(static_cast<bool (*)(const char *, T & )>(parse));
|
---|
| 247 | #pragma GCC diagnostic pop
|
---|
[2c7eee0] | 248 | }
|
---|
| 249 |
|
---|
| 250 | template<typename T>
|
---|
| 251 | inline option_t( char short_name, const char * long_name, const char * help, T & variable, bool (*parse)(const char *, T & )) {
|
---|
| 252 | this->short_name = short_name;
|
---|
| 253 | this->long_name = long_name;
|
---|
| 254 | this->help = help;
|
---|
| 255 | this->variable = reinterpret_cast<void*>(&variable);
|
---|
[56ac392] | 256 | #pragma GCC diagnostic push
|
---|
| 257 | #pragma GCC diagnostic ignored "-Wcast-function-type"
|
---|
| 258 | this->parse_fun = reinterpret_cast<bool (*)(const char *, void * )>(parse);
|
---|
| 259 | #pragma GCC diagnostic pop
|
---|
[2c7eee0] | 260 | }
|
---|
| 261 | };
|
---|
| 262 |
|
---|
| 263 | extern option_t last_option;
|
---|
| 264 |
|
---|
| 265 |
|
---|
| 266 | //-----------------------------------------------------------------------------
|
---|
| 267 | #include <cstdint>
|
---|
| 268 | #include <climits>
|
---|
| 269 | #include <errno.h>
|
---|
| 270 | #include <unistd.h>
|
---|
| 271 | extern "C" {
|
---|
| 272 | #include <getopt.h>
|
---|
| 273 | #include <sys/ioctl.h>
|
---|
| 274 |
|
---|
| 275 | extern FILE * stderr;
|
---|
| 276 | extern FILE * stdout;
|
---|
| 277 |
|
---|
| 278 | extern int fileno(FILE *stream);
|
---|
| 279 |
|
---|
| 280 | extern int fprintf ( FILE * stream, const char * format, ... );
|
---|
| 281 |
|
---|
| 282 | extern long long int strtoll (const char* str, char** endptr, int base);
|
---|
| 283 | extern unsigned long long int strtoull(const char* str, char** endptr, int base);
|
---|
| 284 | extern double strtod (const char* str, char** endptr);
|
---|
| 285 | }
|
---|
| 286 |
|
---|
| 287 | static void usage(char * cmd, option_t options[], size_t opt_count, const char * usage, FILE * out) __attribute__ ((noreturn));
|
---|
| 288 |
|
---|
| 289 | //-----------------------------------------------------------------------------
|
---|
| 290 | // getopt_long wrapping
|
---|
| 291 | void parse_args(
|
---|
| 292 | int argc,
|
---|
| 293 | char * argv[],
|
---|
| 294 | option_t options[],
|
---|
| 295 | size_t opt_count,
|
---|
| 296 | const char * usage_msg,
|
---|
| 297 | char ** * left
|
---|
| 298 | ) {
|
---|
| 299 | struct option optarr[opt_count + 2];
|
---|
| 300 | {
|
---|
| 301 | int idx = 0;
|
---|
[c4241b6] | 302 | for(size_t i = 0; i < opt_count; i++) {
|
---|
[2c7eee0] | 303 | if(options[i].long_name) {
|
---|
| 304 | optarr[idx].name = options[i].long_name;
|
---|
| 305 | optarr[idx].flag = nullptr;
|
---|
| 306 | optarr[idx].val = options[i].short_name;
|
---|
| 307 | if( ((intptr_t)options[i].parse_fun) == ((intptr_t)parse_settrue)
|
---|
| 308 | || ((intptr_t)options[i].parse_fun) == ((intptr_t)parse_setfalse) ) {
|
---|
| 309 | optarr[idx].has_arg = no_argument;
|
---|
| 310 | } else {
|
---|
| 311 | optarr[idx].has_arg = required_argument;
|
---|
| 312 | }
|
---|
| 313 | idx++;
|
---|
| 314 | }
|
---|
| 315 | }
|
---|
| 316 | optarr[idx+0].name = "help";
|
---|
| 317 | optarr[idx+0].has_arg = no_argument;
|
---|
| 318 | optarr[idx+0].flag = 0;
|
---|
| 319 | optarr[idx+0].val = 'h';
|
---|
| 320 | optarr[idx+1].name = 0;
|
---|
| 321 | optarr[idx+1].has_arg = no_argument;
|
---|
| 322 | optarr[idx+1].flag = 0;
|
---|
| 323 | optarr[idx+1].val = 0;
|
---|
| 324 | }
|
---|
| 325 |
|
---|
| 326 | char optstring[opt_count * 3];
|
---|
| 327 | for(auto & o : optstring) {
|
---|
| 328 | o = '\0';
|
---|
| 329 | }
|
---|
| 330 | {
|
---|
| 331 | int idx = 0;
|
---|
[c4241b6] | 332 | for(size_t i = 0; i < opt_count; i++) {
|
---|
[2c7eee0] | 333 | optstring[idx] = options[i].short_name;
|
---|
| 334 | idx++;
|
---|
| 335 | if( ((intptr_t)options[i].parse_fun) != ((intptr_t)parse_settrue)
|
---|
| 336 | && ((intptr_t)options[i].parse_fun) != ((intptr_t)parse_setfalse) ) {
|
---|
| 337 | optstring[idx] = ':';
|
---|
| 338 | idx++;
|
---|
| 339 | }
|
---|
| 340 | }
|
---|
| 341 | optstring[idx+0] = 'h';
|
---|
| 342 | optstring[idx+1] = '\0';
|
---|
| 343 | }
|
---|
| 344 |
|
---|
| 345 | FILE * out = stderr;
|
---|
| 346 | for(;;) {
|
---|
| 347 | int idx = 0;
|
---|
| 348 | int opt = getopt_long(argc, argv, optstring, optarr, &idx);
|
---|
| 349 | switch(opt) {
|
---|
| 350 | case -1:
|
---|
| 351 | if(left != nullptr) *left = argv + optind;
|
---|
| 352 | return;
|
---|
| 353 | case 'h':
|
---|
| 354 | out = stdout;
|
---|
[c4241b6] | 355 | [[fallthrough]];
|
---|
[2c7eee0] | 356 | case '?':
|
---|
| 357 | usage(argv[0], options, opt_count, usage_msg, out);
|
---|
| 358 | default:
|
---|
[c4241b6] | 359 | for(size_t i = 0; i < opt_count; i++) {
|
---|
[2c7eee0] | 360 | if(opt == options[i].short_name) {
|
---|
| 361 | const char * arg = optarg ? optarg : "";
|
---|
[c4241b6] | 362 | if( arg[0] == '=' ) { arg++; }
|
---|
[2c7eee0] | 363 | bool success = options[i].parse_fun( arg, options[i].variable );
|
---|
| 364 | if(success) goto NEXT_ARG;
|
---|
| 365 |
|
---|
| 366 | fprintf(out, "Argument '%s' for option %c could not be parsed\n\n", arg, (char)opt);
|
---|
| 367 | usage(argv[0], options, opt_count, usage_msg, out);
|
---|
| 368 | }
|
---|
| 369 | }
|
---|
| 370 | std::abort();
|
---|
| 371 | }
|
---|
| 372 | NEXT_ARG:;
|
---|
| 373 | }
|
---|
| 374 | }
|
---|
| 375 |
|
---|
| 376 | //-----------------------------------------------------------------------------
|
---|
| 377 | // Print usage
|
---|
// Prints one option of the usage text to `out`.
//   width - column width reserved for the long name
//   max   - total output width in columns
//   sn/ln - short and long option names (a null `ln` is printed as empty)
//   help  - help text (a null `help` is printed as empty)
// The first line carries the names and as much help text as fits in the
// remaining columns; the rest of the help text continues on following lines,
// each indented by width + 11 columns.
static void printopt(FILE * out, int width, int max, char sn, const char * ln, const char * help) {
	// Never hand a null pointer to %s or strlen.
	if(ln == nullptr) ln = "";
	if(help == nullptr) help = "";

	int hwidth = max - (11 + width);
	if(hwidth <= 0) hwidth = max;
	// `max` itself can be 0 (a terminal may report 0 columns). A zero-width
	// chunk would never consume the help text and the loop below would never
	// end, so give up on wrapping instead.
	if(hwidth <= 0) hwidth = INT_MAX;

	fprintf(out, " -%c, --%-*s %.*s\n", sn, width, ln, hwidth, help);
	for(;;) {
		help += std::min<size_t>(strlen(help), (size_t)hwidth);
		if('\0' == *help) break;
		fprintf(out, "%*s%.*s\n", width + 11, "", hwidth, help);
	}
}
|
---|
| 389 |
|
---|
| 390 | __attribute__((noreturn)) void print_args_usage(int , char * argv[], option_t options[], size_t opt_count, const char * usage_msg, bool error) {
|
---|
| 391 | usage(argv[0], options, opt_count, usage_msg, error ? stderr : stdout);
|
---|
| 392 | }
|
---|
| 393 |
|
---|
| 394 | static __attribute__((noreturn)) void usage(char * cmd, option_t options[], size_t opt_count, const char * help, FILE * out) {
|
---|
| 395 | int width = 0;
|
---|
| 396 | {
|
---|
[c4241b6] | 397 | for(size_t i = 0; i < opt_count; i++) {
|
---|
[2c7eee0] | 398 | if(options[i].long_name) {
|
---|
| 399 | int w = strlen(options[i].long_name);
|
---|
| 400 | if(w > width) width = w;
|
---|
| 401 | }
|
---|
| 402 | }
|
---|
| 403 | }
|
---|
| 404 |
|
---|
| 405 | int max_width = 1000000;
|
---|
| 406 | int outfd = fileno(out);
|
---|
| 407 | if(isatty(outfd)) {
|
---|
| 408 | struct winsize size;
|
---|
| 409 | int ret = ioctl(outfd, TIOCGWINSZ, &size);
|
---|
| 410 | if(ret < 0) abort(); // "ioctl error: (%d) %s\n", (int)errno, strerror(errno)
|
---|
| 411 | max_width = size.ws_col;
|
---|
| 412 | }
|
---|
| 413 |
|
---|
| 414 | fprintf(out, "Usage:\n %s %s\n", cmd, help);
|
---|
| 415 |
|
---|
[c4241b6] | 416 | for(size_t i = 0; i < opt_count; i++) {
|
---|
[2c7eee0] | 417 | printopt(out, width, max_width, options[i].short_name, options[i].long_name, options[i].help);
|
---|
| 418 | }
|
---|
| 419 | fprintf(out, " -%c, --%-*s %s\n", 'h', width, "help", "print this help message");
|
---|
| 420 | exit(out == stdout ? 0 : 1);
|
---|
| 421 | }
|
---|
| 422 |
|
---|