1 | #include <stdint.h> |
---|
2 | #include <stdlib.hfa> |
---|
3 | |
---|
4 | #include <unistd.h> // STDERR_FILENO |
---|
5 | #include <inttypes.h> |
---|
6 | #include "bits/debug.hfa" |
---|
7 | #include "bits/locks.hfa" |
---|
8 | #include "stats.hfa" |
---|
9 | #include "strstream.hfa" |
---|
10 | |
---|
11 | #if !defined(__CFA_NO_STATISTICS__) |
---|
// Resets every counter of `stats` to zero. When CFA_STATS_ARRAY is defined, also
// allocates the sample buffer (via alloc(CFA_STATS_ARRAY)) and empties it.
void __init_stats( struct __stats_t * stats ) with( *stats ) {
	// Ready queue: push attempts / successes per target.
	ready.push.local.attempt = 0;
	ready.push.local.success = 0;
	ready.push.share.attempt = 0;
	ready.push.share.success = 0;
	ready.push.extrn.attempt = 0;
	ready.push.extrn.success = 0;

	// Ready queue: pop attempts / successes per strategy.
	ready.pop.local .attempt = 0;
	ready.pop.local .success = 0;
	ready.pop.help  .attempt = 0;
	ready.pop.help  .success = 0;
	ready.pop.steal .attempt = 0;
	ready.pop.steal .success = 0;
	ready.pop.search.attempt = 0;
	ready.pop.search.success = 0;

	// Thread bookkeeping.
	ready.threads.migration      = 0;
	ready.threads.extunpark      = 0;
	ready.threads.threads        = 0;
	ready.threads.cthreads       = 0;
	ready.threads.preempt.yield  = 0;
	ready.threads.preempt.rllfwd = 0;

	// Idle sleep.
	ready.sleep.halts   = 0;
	ready.sleep.cancels = 0;
	ready.sleep.early   = 0;
	ready.sleep.wakes   = 0;
	ready.sleep.seen    = 0;
	ready.sleep.exits   = 0;

	#if defined(CFA_HAVE_LINUX_IO_URING_H)
		// I/O: allocation and submission paths.
		io.alloc.fast   = 0;
		io.alloc.slow   = 0;
		io.alloc.fail   = 0;
		io.alloc.revoke = 0;
		io.alloc.block  = 0;
		io.submit.fast  = 0;
		io.submit.slow  = 0;

		// I/O: flush reasons.
		io.flush.external = 0;
		io.flush.dirty    = 0;
		io.flush.full     = 0;
		io.flush.idle     = 0;
		io.flush.eager    = 0;

		// I/O: system-call counters.
		io.calls.flush       = 0;
		io.calls.submitted   = 0;
		io.calls.drain       = 0;
		io.calls.completed   = 0;
		io.calls.locked      = 0;
		io.calls.helped      = 0;
		io.calls.errors.busy = 0;

		// I/O: per-operation counters.
		io.ops.sockread  = 0;
		io.ops.epllread  = 0;
		io.ops.sockwrite = 0;
		io.ops.epllwrite = 0;
	#endif

	#if defined(CFA_STATS_ARRAY)
		stats->array.values = alloc(CFA_STATS_ARRAY);
		stats->array.cnt = 0;
	#endif
}
---|
71 | |
---|
// Moves an unsigned counter into its aggregate: atomically swaps *val with zero,
// then atomically adds the value that was swapped out to *agg.
// Both operations use relaxed ordering; each is atomic on its own, not as a pair.
static inline void tally_one( volatile uint64_t * agg, volatile uint64_t * val) {
	const uint64_t drained = __atomic_exchange_n(val, 0_l64u, __ATOMIC_RELAXED);
	__atomic_fetch_add(agg, drained, __ATOMIC_RELAXED);
}
---|
76 | |
---|
// Signed counterpart: atomically swaps *val with zero, then atomically adds the
// value that was swapped out to *agg.
// Both operations use relaxed ordering; each is atomic on its own, not as a pair.
static inline void tally_one( volatile int64_t * agg, volatile int64_t * val) {
	const int64_t drained = __atomic_exchange_n(val, 0_l64, __ATOMIC_RELAXED);
	__atomic_fetch_add(agg, drained, __ATOMIC_RELAXED);
}
---|
81 | |
---|
// Folds every counter of `proc` into the matching counter of `cltr`. Each `proc`
// counter is reset to zero as it is folded (see tally_one).
void __tally_stats( struct __stats_t * cltr, struct __stats_t * proc ) {
	// Each field is named exactly once so the source and destination cannot drift
	// apart (the sleep.seen aggregate used to be fed from sleep.wakes by mistake).
	#define TALLY( field ) tally_one( &cltr->field, &proc->field )

	TALLY( ready.push.local.attempt );
	TALLY( ready.push.local.success );
	TALLY( ready.push.share.attempt );
	TALLY( ready.push.share.success );
	TALLY( ready.push.extrn.attempt );
	TALLY( ready.push.extrn.success );
	TALLY( ready.pop.local .attempt );
	TALLY( ready.pop.local .success );
	TALLY( ready.pop.help  .attempt );
	TALLY( ready.pop.help  .success );
	TALLY( ready.pop.steal .attempt );
	TALLY( ready.pop.steal .success );
	TALLY( ready.pop.search.attempt );
	TALLY( ready.pop.search.success );
	TALLY( ready.threads.migration );
	TALLY( ready.threads.extunpark );
	TALLY( ready.threads.threads );
	TALLY( ready.threads.cthreads );
	TALLY( ready.threads.preempt.yield );
	TALLY( ready.threads.preempt.rllfwd );
	TALLY( ready.sleep.halts );
	TALLY( ready.sleep.cancels );
	TALLY( ready.sleep.early );
	TALLY( ready.sleep.wakes );
	TALLY( ready.sleep.seen );
	TALLY( ready.sleep.exits );

	#if defined(CFA_HAVE_LINUX_IO_URING_H)
		TALLY( io.alloc.fast );
		TALLY( io.alloc.slow );
		TALLY( io.alloc.fail );
		TALLY( io.alloc.revoke );
		TALLY( io.alloc.block );
		TALLY( io.submit.fast );
		TALLY( io.submit.slow );
		TALLY( io.flush.external );
		TALLY( io.flush.dirty );
		TALLY( io.flush.full );
		TALLY( io.flush.idle );
		TALLY( io.flush.eager );
		TALLY( io.calls.flush );
		TALLY( io.calls.submitted );
		TALLY( io.calls.drain );
		TALLY( io.calls.completed );
		TALLY( io.calls.locked );
		TALLY( io.calls.helped );
		TALLY( io.calls.errors.busy );
		TALLY( io.ops.sockread );
		TALLY( io.ops.epllread );
		TALLY( io.ops.sockwrite );
		TALLY( io.ops.epllwrite );
	#endif

	#undef TALLY
}
---|
136 | |
---|
// Shorthand for the ws/unit/eng manipulator stack applied to every counter printed below.
#define eng3(X) (ws(3, 3, unit(eng( X ))))

// Formats the counters of `stats` into a 1024-byte stack buffer and writes it to
// stdout in one call.
//   flags : bit mask selecting sections; CFA_STATS_READY_Q prints the ready-queue
//           section and, when io_uring support is compiled in, CFA_STATS_IO prints
//           the I/O section. Nothing is written when flags is 0.
//   type, name, id : printed verbatim in each section header.
// Ratios and percentages are reported as 0 when their denominator is 0.
void __print_stats( struct __stats_t * stats, int flags, const char * type, const char * name, void * id ) with( *stats ) {

	char buf[1024];
	ostrstream sstr = { buf, 1024 };

	if( flags & CFA_STATS_READY_Q ) {

		sstr | "----- " | type | " \"" | name | "\" (" | "" | id | "" | ") - Ready Q Stats -----";

		uint64_t totalR = ready.pop.local.success + ready.pop.help.success + ready.pop.steal.success + ready.pop.search.success;
		uint64_t totalS = ready.push.local.success + ready.push.share.success + ready.push.extrn.success;
		sstr | "- totals : " | eng3(totalR) | "run," | eng3(totalS) | "schd (" | eng3(ready.push.extrn.success) | "ext,"
		     | eng3(ready.threads.migration) | "mig," | eng3(ready.threads.extunpark) | " eupk," | ready.threads.threads | " t," | ready.threads.cthreads | " cthr)";

		// Average attempts per successful push; guarded like the per-kind ratios so an
		// idle processor prints 0 instead of nan/inf.
		double push_len = totalS ? ((double)ready.push.local.attempt + ready.push.share.attempt + ready.push.extrn.attempt) / totalS : 0;
		double sLcl_len = ready.push.local.success ? ((double)ready.push.local.attempt) / ready.push.local.success : 0;
		double sOth_len = ready.push.share.success ? ((double)ready.push.share.attempt) / ready.push.share.success : 0;
		double sExt_len = ready.push.extrn.success ? ((double)ready.push.extrn.attempt) / ready.push.extrn.success : 0;
		sstr | "- push avg : " | ws(3, 3, push_len)
		     | "- l: " | eng3(ready.push.local.attempt) | " (" | ws(3, 3, sLcl_len) | ")"
		     | ", s: " | eng3(ready.push.share.attempt) | " (" | ws(3, 3, sOth_len) | ")"
		     | ", e: " | eng3(ready.push.extrn.attempt) | " (" | ws(3, 3, sExt_len) | ")";

		// Share of successful pops per strategy, as a percentage of all successful pops.
		double rLcl_pc = totalR ? (100.0 * (double)ready.pop.local .success) / totalR : 0;
		sstr | "- local : " | eng3(ready.pop.local .success) | "-"| ws(3, 3, rLcl_pc) | '%'
		     | " (" | eng3(ready.pop.local .attempt) | " try)";
		double rHlp_pc = totalR ? (100.0 * (double)ready.pop.help  .success) / totalR : 0;
		sstr | "- help : " | eng3(ready.pop.help  .success) | "-"| ws(3, 3, rHlp_pc) | '%'
		     | " (" | eng3(ready.pop.help  .attempt) | " try)";
		double rStl_pc = totalR ? (100.0 * (double)ready.pop.steal .success) / totalR : 0;
		sstr | "- steal : " | eng3(ready.pop.steal .success) | "-"| ws(3, 3, rStl_pc) | '%'
		     | " (" | eng3(ready.pop.steal .attempt) | " try)";
		double rSch_pc = totalR ? (100.0 * (double)ready.pop.search.success) / totalR : 0;
		sstr | "- search : " | eng3(ready.pop.search.success) | "-"| ws(3, 3, rSch_pc) | '%'
		     | " (" | eng3(ready.pop.search.attempt) | " try)";

		sstr | "- Idle Slp : " | eng3(ready.sleep.halts) | "halt," | eng3(ready.sleep.cancels) | "cancel,"
		     | eng3(ready.sleep.wakes + ready.sleep.early) | '(' | eng3(ready.sleep.early) | ',' | eng3(ready.sleep.seen) | ')' | " wake(early, seen),"
		     | eng3(ready.sleep.exits) | "exit";
		sstr | "- Preemption : " | eng3(ready.threads.preempt.yield) | "yields," | eng3(ready.threads.preempt.rllfwd) | "delayed";
		sstr | nl;
	}

	#if defined(CFA_HAVE_LINUX_IO_URING_H)
		if( flags & CFA_STATS_IO ) {
			sstr | "----- " | type | " \"" | name | "\" (" | "" | id | "" | ") - I/O Stats -----";

			uint64_t total_allocs = io.alloc.fast + io.alloc.slow;

			uint64_t total_submits = io.submit.fast + io.submit.slow;
			sstr | "- totals : allc" | eng3(io.alloc .fast) | nonl;
			if(io.alloc.slow) {
				// total_allocs >= io.alloc.slow > 0 here, so the division is safe.
				double avgfasta = (100.0 * (double)io.alloc.fast) / total_allocs;
				sstr | "fast," | eng3(io.alloc .slow) | "slow (" | ws(3, 3, avgfasta) | "%)" | nonl;
			}
			sstr | " - subm" | eng3(io.submit.fast) | nonl;
			// Keyed on the submit counter (was io.alloc.slow): the breakdown belongs to
			// submissions, and this also guarantees total_submits > 0 below.
			if(io.submit.slow) {
				double avgfasts = (100.0 * (double)io.submit.fast) / total_submits;
				sstr | "fast," | eng3(io.submit.slow) | "slow (" | ws(3, 3, avgfasts) | "%)" | nonl;
			}
			sstr | nl;

			if(io.alloc.fail || io.alloc.revoke || io.alloc.block)
				sstr | "- failures : " | eng3(io.alloc.fail) | "oom, " | eng3(io.alloc.revoke) | "rvk, " | eng3(io.alloc.block) | "blk";

			// Averages per flush/drain call; 0 when no such call was made.
			double avgsubs = io.calls.flush ? ((double)io.calls.submitted) / io.calls.flush : 0;
			double avgcomp = io.calls.drain ? ((double)io.calls.completed) / io.calls.drain : 0;
			sstr | "- syscll : "
			     | " sub " | eng3(io.calls.submitted) | "/" | eng3(io.calls.flush) | "(" | ws(3, 3, avgsubs) | "/flush)"
			     | " - cmp " | eng3(io.calls.completed) | "/" | eng3(io.calls.drain) | "(" | ws(3, 3, avgcomp) | "/drain)"
			     | " - cmp " | eng3(io.calls.locked) | "locked, " | eng3(io.calls.helped) | "helped"
			     | " - " | eng3(io.calls.errors.busy) | " EBUSY";
			sstr | " - sub: " | eng3(io.flush.full) | "full, " | eng3(io.flush.dirty) | "drty, " | eng3(io.flush.idle) | "idle, " | eng3(io.flush.eager) | "eagr, " | eng3(io.flush.external) | "ext";
			sstr | "- ops blk: "
			     | " sk rd: " | eng3(io.ops.sockread) | "epll: " | eng3(io.ops.epllread)
			     | " sk wr: " | eng3(io.ops.sockwrite) | "epll: " | eng3(io.ops.epllwrite);
			sstr | nl;
		}
	#endif

	if(flags) write( sstr, stdout );
}
---|
223 | |
---|
224 | #if defined(CFA_STATS_ARRAY) |
---|
225 | extern "C" { |
---|
226 | #include <stdio.h> |
---|
227 | #include <errno.h> |
---|
228 | #include <sys/stat.h> |
---|
229 | #include <fcntl.h> |
---|
230 | } |
---|
231 | |
---|
// Appends every buffered sample of `this` to the file ".cfadata/<name><handle>.data"
// (created on demand, along with the ".cfadata" directory), one "<ts>, <value>" line
// per sample, then resets the sample count to zero.
// Aborts if the directory or file cannot be created, or if a line cannot be
// formatted or fully written.
// NOTE(review): the file name is built in a 100-byte buffer and is silently
// truncated for long names -- confirm callers only pass short names.
void __flush_stat( struct __stats_t * this, const char * name, void * handle) {
	int ret = mkdir(".cfadata", 0755);
	if(ret < 0 && errno != EEXIST) abort("Failed to create directory .cfadata: %d\n", errno);

	char filename[100];
	snprintf(filename, 100, ".cfadata/%s%p.data", name, handle);

	int fd = open(filename, O_WRONLY | O_APPEND | O_CREAT, 0644);
	if(fd < 0) abort("Failed to create file %s: %d\n", filename, errno);

	for(i; this->array.cnt) {
		char line[100];
		// Explicit casts keep the arguments in step with the %llu / %lld specifiers.
		int len = snprintf(line, 100, "%llu, %lld\n", (unsigned long long)this->array.values[i].ts, (long long)this->array.values[i].value);
		if(len < 0 || len >= 100) abort("Failed to format sample for file %s\n", filename);

		// write() may be interrupted or write fewer bytes than asked: keep going
		// until the whole line is out, and fail loudly instead of dropping samples.
		int done = 0;
		while(done < len) {
			ssize_t w = write(fd, line + done, len - done);
			if(w < 0 && errno == EINTR) continue;
			if(w <= 0) abort("Failed to write to file %s: %d\n", filename, errno);
			done += w;
		}
	}

	this->array.cnt = 0;
	close(fd);
}
---|
251 | |
---|
// Taken by __push_stat for callers that pass external == true.
static __spinlock_t stats_lock;

// Records one timestamped sample (rdtscl(), value) in the sample buffer of `this`.
// When the buffer already holds CFA_STATS_ARRAY samples it is first flushed to
// disk through __flush_stat( this, name, handle ).
//   external : when true, the whole operation runs under stats_lock.
void __push_stat( struct __stats_t * this, int64_t value, bool external, const char * name, void * handle ) {
	if(external) lock(stats_lock __cfaabi_dbg_ctx2);

	if( this->array.cnt >= CFA_STATS_ARRAY ) __flush_stat( this, name, handle );

	size_t idx = this->array.cnt;
	this->array.cnt++;

	// Fill the slot before releasing the lock: __flush_stat dumps every slot below
	// cnt, so a slot that is counted but not yet written could otherwise be flushed
	// by a concurrent external push.
	this->array.values[idx].ts = rdtscl();
	this->array.values[idx].value = value;

	if(external) unlock(stats_lock);
}
---|
267 | #endif |
---|
268 | #endif |
---|