| 1 | // | 
|---|
| 2 | // Cforall Version 1.0.0 Copyright (C) 2021 University of Waterloo | 
|---|
| 3 | // | 
|---|
| 4 | // The contents of this file are covered under the licence agreement in the | 
|---|
| 5 | // file "LICENCE" distributed with Cforall. | 
|---|
| 6 | // | 
|---|
| 7 | // cpu.cfa -- checks that libcfa correctly counts the number of cpus. | 
|---|
| 8 | // | 
|---|
| 9 | // Author           : Thierry Delisle | 
|---|
| 10 | // Created On       : Mon Jun 14 13:59:01 2021 | 
|---|
| 11 | // Last Modified By : | 
|---|
| 12 | // Last Modified On : | 
|---|
| 13 | // Update Count     : | 
|---|
| 14 | // | 
|---|
| 15 |  | 
|---|
| 16 |  | 
|---|
| 17 | #include <fstream.hfa> | 
|---|
| 18 | #include <device/cpu.hfa> | 
|---|
| 19 | #include <stdlib.hfa> | 
|---|
| 20 |  | 
|---|
| 21 | #include <errno.h> | 
|---|
| 22 | #include <stdio.h> | 
|---|
| 23 | #include <string.h> | 
|---|
| 24 | #include <unistd.h> | 
|---|
| 25 |  | 
|---|
| 26 | extern "C" { | 
|---|
| 27 | #include <dirent.h> | 
|---|
| 28 | #include <sys/types.h> | 
|---|
| 29 | #include <sys/stat.h> | 
|---|
| 30 | #include <sys/sysinfo.h> | 
|---|
| 31 | #include <fcntl.h> | 
|---|
| 32 | } | 
|---|
| 33 |  | 
|---|
// Go through the directory 'path', calling 'fn' on each entry (including '.' and '..').
// Returns 0 on success, otherwise the errno value reported by opendir or readdir.
static int iterate_dir( const char * path, void (*fn)(struct dirent * ent) ) {
	// open the directory, reporting the actual cause on failure
	DIR * dir = opendir(path);
	if(dir == 0p) { return errno; }

	// call fn for each entry
	int err = 0;
	for(;;) {
		// readdir returns null both at the end of the directory and on error,
		// errno is the only way to tell them apart, so reset it before every call
		// (fn is free to change errno in between)
		errno = 0;
		struct dirent * ent = readdir(dir);
		if(ent == 0p) {
			err = errno;
			break;
		}
		fn( ent );
	}

	// no longer need this
	closedir(dir);
	return err;
}
|---|
| 50 |  | 
|---|
// Count the entries of 'path' that are directories named '[prefix]N', where prefix
// is the parameter and N is a non-negative base 10 integer.
// Also verifies that the highest N found is exactly one less than the number of matches.
// Returns the number of matching directories, which is 0 if no entry could be read.
static int count_prefix_dirs(const char * path, const char * prefix) {
	const size_t prefix_len = strlen(prefix);

	// highest number seen and number of matches, both updated by the nested routine
	int max = -1;
	int count = 0;
	void lambda(struct dirent * ent) {
		// we are looking for prefixN, where N is a number
		// check that the name starts with the prefix
		if(strncmp(ent->d_name, prefix, prefix_len) != 0) { return; }

		// check that the next part is a number
		// insist on a leading digit: strtol alone would accept an empty suffix (parsed as 0),
		// a sign or leading white space
		char * s = ent->d_name + prefix_len;
		if(*s < '0' || *s > '9') { return; }

		char * end;
		long int val = strtol(s, &end, 10);
		if(*end != '\0' || val < 0) { return; }

		// check that it's a directory
		if(ent->d_type != DT_DIR) { return; }

		// it's a match!
		max = max(val, max);
		count++;
	}
	iterate_dir(path, lambda);

	/* paranoid */ verifyf(count == max + 1, "Inconsistent %s count, counted %d, but max %s was %d", prefix, count, prefix, (int)max);

	return count;
}
|---|
| 85 |  | 
|---|
// Count the number of cache *indexes* in the system.
// An index is not the same thing as a level: a Data and an Instruction cache
// can sit at the same level but never share an index.
// PITFALL: only cpu0 is inspected, all other cpus are assumed to have the same indexes.
static int count_cache_indexes(void) {
	const char * cache_dir = "/sys/devices/system/cpu/cpu0/cache";
	const char * entry_prefix = "index";
	return count_prefix_dirs(cache_dir, entry_prefix);
}
|---|
| 93 |  | 
|---|
// Read the file 'file' describing cache index 'idx' of cpu 'cpu' into the output buffer.
// 'out' must hold 'out_len' bytes; the result is always NUL-terminated, a single trailing
// newline is stripped and contents that do not fit are truncated.
// Returns the length of the string stored in 'out', 0 if nothing could be read.
// Failures are additionally reported through the verify checks, when those are enabled.
static size_t read_cpuidxinfo_into(unsigned cpu, unsigned idx, const char * file, char * out, size_t out_len) {
	/* paranoid */ verifyf(out_len > 1, "Output buffer for '%s' must hold at least one character and a terminator", file);
	if(out_len == 0) { return 0; }
	out[0] = '\0';

	// Pick the file we want, making sure the name was not truncated
	char buf[128];
	int len = snprintf(buf, sizeof(buf), "/sys/devices/system/cpu/cpu%u/cache/index%u/%s", cpu, idx, file);
	/* paranoid */ verifyf(len > 0 && (size_t)len < sizeof(buf), "Could not generate '%s' filename for cpu %u, index %u", file, cpu, idx);
	if(len <= 0 || (size_t)len >= sizeof(buf)) { return 0; }

	// the flags are the second argument of open
	// 0 is a valid file descriptor, only negative values signal a failure
	int fd = open(buf, O_RDONLY);
	/* paranoid */ verifyf(fd >= 0, "Could not open file '%s'", buf);
	if(fd < 0) { return 0; }

	// and read it, keeping one byte for the terminator
	ssize_t r = read(fd, out, out_len - 1);
	/* paranoid */ verifyf(r > 0, "Could not read file '%s'", buf);

	/* paranoid */ __attribute__((unused)) int ret =
	close(fd);
	/* paranoid */ verifyf(ret == 0, "Could not close file '%s'", buf);

	// never index the buffer with a failed or empty read
	if(r <= 0) { return 0; }

	// drop the trailing newline, if any, and terminate the string
	size_t n = r;
	if(out[n - 1] == '\n') { n -= 1; }
	out[n] = '\0';
	return n;
}
|---|
| 115 |  | 
|---|
// Find the cache index of cpu 0 with the highest cache level.
// Indexes are visited from last to first and only a strictly higher level replaces
// the current pick, so among indexes sharing the highest level the last one wins.
unsigned find_idx() {
	const int index_count = count_cache_indexes();

	unsigned best_level = 0;
	unsigned found = -1u;
	for(int remaining = index_count; remaining > 0; remaining -= 1) {
		const unsigned idx = remaining - 1;

		// Level is the cache level: higher means bigger and slower
		char text[32];
		read_cpuidxinfo_into(0, idx, "level", text, 32);

		char * end;
		unsigned long level = strtoul(text, &end, 10);
		/* paranoid */ verifyf(level <= 250, "Cpu %u has more than 250 levels of cache, that doesn't sound right", 0);
		/* paranoid */ verify(*end == '\0');

		if(level > best_level) {
			best_level = level;
			found = idx;
		}
	}

	/* paranoid */ verify(found != -1u);
	return found;
}
|---|
| 141 |  | 
|---|
// Checks that the cpu_info of libcfa agrees with what the operating system reports:
//  1. the hardware thread count matches get_nprocs()
//  2. every cpu has a unique 'self' id, which falls inside its own llc map range
//  3. two cpus have the same llc map range exactly when their 'shared_cpu_list' files,
//     for the cache index picked by find_idx, have the same contents
// Besides the result of the first check, only discrepancies are printed.
int main() {
	//-----------------------------------------------------------------------
	// Compare the hardware thread count of libcfa with the processor count of linux
	int ret1 = get_nprocs();
	int ret2 = cpu_info.hthrd_count;
	if(ret1 != ret2) {
		sout | "No match! libcfa says" | ret2 | "hardware threads but linux counts" | ret1 | "processors";
	}
	else {
		sout | "Match!";
	}

	//-----------------------------------------------------------------------
	// Make sure no one has the same self
	for(ime; cpu_info.hthrd_count) {
		unsigned me = cpu_info.llc_map[ime].self;
		{
			// self must fall inside [start, start + count)
			unsigned s = cpu_info.llc_map[ime].start;
			unsigned e = s + cpu_info.llc_map[ime].count;
			if(me < s || me >= e) {
				sout | "CPU" | ime | "outside of it's own map: " | s | "<=" | me | "<" | e;
			}
		}

		for(ithem; cpu_info.hthrd_count) {
			if(ime == ithem) continue;

			unsigned them = cpu_info.llc_map[ithem].self;
			if(me == them) {
				sout | "CPU" | ime | "has conflicting self id with" | ithem | "(" | me | ")";
			}
		}
	}

	//-----------------------------------------------------------------------
	unsigned idx = find_idx();
	// For all procs check mapping is consistent
	for(cpu_me; cpu_info.hthrd_count) {
		char buf_me[32];
		size_t len_me = read_cpuidxinfo_into(cpu_me, idx, "shared_cpu_list", buf_me, 32);
		for(cpu_them; cpu_info.hthrd_count) {
			if(cpu_me == cpu_them) continue;
			char buf_them[32];
			size_t len_them = read_cpuidxinfo_into(cpu_them, idx, "shared_cpu_list", buf_them, 32);

			// the files agree when they list the same cpus, cpu_info agrees when the ranges are the same
			bool match_file = len_them == len_me && 0 == strncmp(buf_them, buf_me, len_me);
			bool match_info = cpu_info.llc_map[cpu_me].start == cpu_info.llc_map[cpu_them].start && cpu_info.llc_map[cpu_me].count == cpu_info.llc_map[cpu_them].count;

			if(match_file != match_info) {
				sout | "CPU" | cpu_me | "and" | cpu_them | "have inconsitent file and cpu_info";
				// one line per cpu, each labelled with the cpu whose data it shows
				sout | cpu_me   | ": <" | cpu_info.llc_map[cpu_me  ].start | "," | cpu_info.llc_map[cpu_me  ].count | "> '" | buf_me   | "'";
				sout | cpu_them | ": <" | cpu_info.llc_map[cpu_them].start | "," | cpu_info.llc_map[cpu_them].count | "> '" | buf_them | "'";
			}
		}
	}
}
|---|