// NOTE(review): the names of the three system headers below were missing from
// the reviewed copy of this file. <unistd.h> follows from the *_FILENO comment;
// <stdint.h> and <stdlib.h> are a best guess -- confirm against version control.
#include <stdint.h>
#include <stdlib.h>

#include <unistd.h>								// STDOUT_FILENO
#include "bits/debug.hfa"
#include "stats.hfa"

#if !defined(__CFA_NO_STATISTICS__)
	// Divide num by den, yielding 0 when den is 0.
	// Counters that were never incremented would otherwise make the report
	// print nan/inf; returning 0 matches what the look_avg/alloc_avg
	// averages in __print_stats already did for an empty sample.
	static inline double __stats_ratio( double num, double den ) {
		return den != 0.0 ? num / den : 0.0;
	}

	// Reset every counter in *stats to zero.
	// The io.* counters only exist (and are only reset) when
	// HAVE_LINUX_IO_URING_H is defined.
	void __init_stats( struct __stats_t * stats ) {
		stats->ready.pick.push.attempt  = 0;
		stats->ready.pick.push.success  = 0;
		stats->ready.pick.push.local    = 0;
		stats->ready.pick.push.lsuccess = 0;
		stats->ready.pick.pop .probe    = 0;
		stats->ready.pick.pop .attempt  = 0;
		stats->ready.pick.pop .success  = 0;
		stats->ready.pick.pop .local    = 0;
		stats->ready.pick.pop .lsuccess = 0;
		stats->ready.threads.migration  = 0;
		stats->ready.sleep.halts        = 0;
		stats->ready.sleep.cancels      = 0;
		stats->ready.sleep.wakes        = 0;
		stats->ready.sleep.exits        = 0;

		#if defined(HAVE_LINUX_IO_URING_H)
			stats->io.submit_q.submit_avg.rdy          = 0;
			stats->io.submit_q.submit_avg.csm          = 0;
			stats->io.submit_q.submit_avg.avl          = 0;
			stats->io.submit_q.submit_avg.cnt          = 0;
			stats->io.submit_q.look_avg.val            = 0;
			stats->io.submit_q.look_avg.cnt            = 0;
			stats->io.submit_q.look_avg.block          = 0;
			stats->io.submit_q.alloc_avg.val           = 0;
			stats->io.submit_q.alloc_avg.cnt           = 0;
			stats->io.submit_q.alloc_avg.block         = 0;
			stats->io.complete_q.completed_avg.val      = 0;
			stats->io.complete_q.completed_avg.slow_cnt = 0;
			stats->io.complete_q.completed_avg.fast_cnt = 0;
		#endif
	}

	// Add every counter of *proc into the matching counter of *cltr.
	// Each addition is an individual sequentially-consistent atomic
	// fetch-add on the cltr field; the proc fields are read with plain loads
	// and are left unchanged.
	void __tally_stats( struct __stats_t * cltr, struct __stats_t * proc ) {
		__atomic_fetch_add( &cltr->ready.pick.push.attempt , proc->ready.pick.push.attempt , __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.pick.push.success , proc->ready.pick.push.success , __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.pick.push.local   , proc->ready.pick.push.local   , __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.pick.push.lsuccess, proc->ready.pick.push.lsuccess, __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.pick.pop .probe   , proc->ready.pick.pop .probe   , __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.pick.pop .attempt , proc->ready.pick.pop .attempt , __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.pick.pop .success , proc->ready.pick.pop .success , __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.pick.pop .local   , proc->ready.pick.pop .local   , __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.pick.pop .lsuccess, proc->ready.pick.pop .lsuccess, __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.threads.migration, proc->ready.threads.migration, __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.sleep.halts  , proc->ready.sleep.halts  , __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.sleep.cancels, proc->ready.sleep.cancels, __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.sleep.wakes  , proc->ready.sleep.wakes  , __ATOMIC_SEQ_CST );
		__atomic_fetch_add( &cltr->ready.sleep.exits  , proc->ready.sleep.exits  , __ATOMIC_SEQ_CST );

		#if defined(HAVE_LINUX_IO_URING_H)
			__atomic_fetch_add( &cltr->io.submit_q.submit_avg.rdy          , proc->io.submit_q.submit_avg.rdy          , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.submit_q.submit_avg.csm          , proc->io.submit_q.submit_avg.csm          , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.submit_q.submit_avg.avl          , proc->io.submit_q.submit_avg.avl          , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.submit_q.submit_avg.cnt          , proc->io.submit_q.submit_avg.cnt          , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.submit_q.look_avg.val            , proc->io.submit_q.look_avg.val            , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.submit_q.look_avg.cnt            , proc->io.submit_q.look_avg.cnt            , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.submit_q.look_avg.block          , proc->io.submit_q.look_avg.block          , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.submit_q.alloc_avg.val           , proc->io.submit_q.alloc_avg.val           , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.submit_q.alloc_avg.cnt           , proc->io.submit_q.alloc_avg.cnt           , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.submit_q.alloc_avg.block         , proc->io.submit_q.alloc_avg.block         , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.complete_q.completed_avg.val     , proc->io.complete_q.completed_avg.val     , __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.complete_q.completed_avg.slow_cnt, proc->io.complete_q.completed_avg.slow_cnt, __ATOMIC_SEQ_CST );
			__atomic_fetch_add( &cltr->io.complete_q.completed_avg.fast_cnt, proc->io.complete_q.completed_avg.fast_cnt, __ATOMIC_SEQ_CST );
		#endif
	}

	// Print a report of the counters in *stats to STDOUT_FILENO through
	// __cfaabi_bits_print_safe.
	//
	//   stats   - counters to report
	//   flags   - bit mask selecting sections: CFA_STATS_READY_Q prints the
	//             ready-queue section, CFA_STATS_IO prints the I/O section
	//             (the latter only when HAVE_LINUX_IO_URING_H is defined)
	//   cluster - selects the "Cluster" (true) or "Processor" (false) label
	//             in each section header
	//   name/id - printed verbatim in each section header as "%s" and %p
	//
	// Every derived ratio goes through __stats_ratio, so a zero denominator
	// is reported as 0.00 rather than nan/inf.
	void __print_stats( struct __stats_t * stats, int flags, bool cluster, const char * name, void * id ) with( *stats ) {
		const char * kind = cluster ? "Cluster" : "Processor";

		if( flags & CFA_STATS_READY_Q ) {
			// *_sur : successes as a percentage of attempts
			// *_len : attempts per success
			double push_sur  = __stats_ratio( 100.0 * ready.pick.push.success , ready.pick.push.attempt  );
			double pop_sur   = __stats_ratio( 100.0 * ready.pick.pop .success , ready.pick.pop .attempt  );

			double push_len  = __stats_ratio( ready.pick.push.attempt, ready.pick.push.success  );
			double pop_len   = __stats_ratio( ready.pick.pop .attempt, ready.pick.pop .success  );

			// Same two figures for the "local" counters.
			double lpush_sur = __stats_ratio( 100.0 * ready.pick.push.lsuccess, ready.pick.push.local    );
			double lpop_sur  = __stats_ratio( 100.0 * ready.pick.pop .lsuccess, ready.pick.pop .local    );

			double lpush_len = __stats_ratio( ready.pick.push.local  , ready.pick.push.lsuccess );
			double lpop_len  = __stats_ratio( ready.pick.pop .local  , ready.pick.pop .lsuccess );

			__cfaabi_bits_print_safe( STDOUT_FILENO,
				"----- %s \"%s\" (%p) - Ready Q Stats -----\n"
				"- total threads run : %'15lu\n"
				"- total threads scheduled: %'15lu\n"
				"- push average probe len : %'18.2lf, %'18.2lf%% (%'15lu attempts)\n"
				"- pop average probe len : %'18.2lf, %'18.2lf%% (%'15lu attempts)\n"
				"- local push avg prb len : %'18.2lf, %'18.2lf%% (%'15lu attempts)\n"
				"- local pop avg prb len : %'18.2lf, %'18.2lf%% (%'15lu attempts)\n"
				"- thread migrations : %'15lu\n"
				"- Idle Sleep -\n"
				"-- halts : %'15lu\n"
				"-- cancelled halts : %'15lu\n"
				"-- schedule wake : %'15lu\n"
				"-- wake on exit : %'15lu\n"
				"\n"
				, kind, name, id
				, ready.pick.pop.success
				, ready.pick.push.success
				, push_len, push_sur, ready.pick.push.attempt
				, pop_len , pop_sur , ready.pick.pop .attempt
				, lpush_len, lpush_sur, ready.pick.push.local
				, lpop_len , lpop_sur , ready.pick.pop .local
				, ready.threads.migration
				, ready.sleep.halts, ready.sleep.cancels, ready.sleep.wakes, ready.sleep.exits
			);
		}

		#if defined(HAVE_LINUX_IO_URING_H)
			if( flags & CFA_STATS_IO ) {
				// Per-submit-call averages.
				double avgrdy = __stats_ratio( io.submit_q.submit_avg.rdy, io.submit_q.submit_avg.cnt );
				double avgcsm = __stats_ratio( io.submit_q.submit_avg.csm, io.submit_q.submit_avg.cnt );
				double avgavl = __stats_ratio( io.submit_q.submit_avg.avl, io.submit_q.submit_avg.cnt );

				// Per-search averages for the "ready" (look) and "alloc" searches.
				double lavgv = __stats_ratio( io.submit_q.look_avg.val  , io.submit_q.look_avg.cnt );
				double lavgb = __stats_ratio( io.submit_q.look_avg.block, io.submit_q.look_avg.cnt );

				double aavgv = __stats_ratio( io.submit_q.alloc_avg.val  , io.submit_q.alloc_avg.cnt );
				double aavgb = __stats_ratio( io.submit_q.alloc_avg.block, io.submit_q.alloc_avg.cnt );

				// Completions per wait call, over slow and fast waits combined.
				double avgcomp = __stats_ratio( io.complete_q.completed_avg.val
					, io.complete_q.completed_avg.slow_cnt + io.complete_q.completed_avg.fast_cnt );

				__cfaabi_bits_print_safe( STDOUT_FILENO,
					"----- %s \"%s\" (%p) - I/O Stats -----\n"
					"- total submit calls : %'15lu\n"
					"- avg ready entries : %'18.2lf\n"
					"- avg submitted entries : %'18.2lf\n"
					"- avg available entries : %'18.2lf\n"
					"- total ready search : %'15lu\n"
					"- avg ready search len : %'18.2lf\n"
					"- avg ready search block : %'18.2lf\n"
					"- total alloc search : %'15lu\n"
					"- avg alloc search len : %'18.2lf\n"
					"- avg alloc search block : %'18.2lf\n"
					"- total wait calls : %'15lu (%'lu slow, %'lu fast)\n"
					"- avg completion/wait : %'18.2lf\n"
					"\n"
					, kind, name, id
					, io.submit_q.submit_avg.cnt
					, avgrdy, avgcsm, avgavl
					, io.submit_q.look_avg.cnt
					, lavgv, lavgb
					, io.submit_q.alloc_avg.cnt
					, aavgv, aavgb
					, io.complete_q.completed_avg.slow_cnt + io.complete_q.completed_avg.fast_cnt
					, io.complete_q.completed_avg.slow_cnt, io.complete_q.completed_avg.fast_cnt
					, avgcomp
				);
			}
		#endif
	}
#endif