starpu_perfmodel_recdump.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2011-2021 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
  4. * Copyright (C) 2011 Télécom-SudParis
  5. * Copyright (C) 2020 Federal University of Rio Grande do Sul (UFRGS)
  6. *
  7. * StarPU is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU Lesser General Public License as published by
  9. * the Free Software Foundation; either version 2.1 of the License, or (at
  10. * your option) any later version.
  11. *
  12. * StarPU is distributed in the hope that it will be useful, but
  13. * WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  15. *
  16. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  17. */
  18. #if !defined(_WIN32) || defined(__MINGW32__) || defined(__CYGWIN__)
  19. #include <dirent.h>
  20. #include <sys/stat.h>
  21. #endif
  22. #include <config.h>
  23. #include <assert.h>
  24. #include <getopt.h>
  25. #include <unistd.h>
  26. #include <stdio.h>
  27. #include <starpu.h>
  28. #include <common/utils.h>
  29. #include <common/uthash.h>
  30. #include <core/perfmodel/perfmodel.h> // we need to browse the list associated to history-based models
  31. // just like in starpu_perfmodel_plot
  32. #define STRHEADCMP(s, head) strncmp(s, head, strlen(head))
  33. #if defined(_WIN32) && !defined(__CYGWIN__)
  34. #include <windows.h>
  35. #endif
  36. #define PROGNAME "starpu_perfmodel_recdump"
  37. struct _footprint_list
  38. {
  39. struct _footprint_list* next;
  40. uint32_t footprint;
  41. };
  42. struct _footprint_list* add_footprint(struct _footprint_list* list, uint32_t footprint)
  43. {
  44. struct _footprint_list * l = list;
  45. while(l)
  46. {
  47. if(l->footprint == footprint) break;
  48. l = l->next;
  49. }
  50. if(l) return list;
  51. else
  52. {
  53. struct _footprint_list *res;
  54. _STARPU_MALLOC(res, sizeof(struct _footprint_list));
  55. res->footprint = footprint;
  56. res->next = list;
  57. return res;
  58. }
  59. }
  60. static struct model
  61. {
  62. UT_hash_handle hh;
  63. char *name;
  64. struct starpu_perfmodel model;
  65. struct _footprint_list* footprints;
  66. } *models;
  67. void get_comb_name(int comb, char* name, int name_size)
  68. {
  69. struct starpu_perfmodel_arch *arch_comb = starpu_perfmodel_arch_comb_fetch(comb);
  70. STARPU_ASSERT_MSG(arch_comb->ndevices == 1, "Cannot work with multi-device workers\n");
  71. snprintf(name, name_size, "%s%d", starpu_perfmodel_get_archtype_name(arch_comb->devices[0].type), arch_comb->devices[0].devid);
  72. }
  73. void print_archs(FILE* output)
  74. {
  75. int nb_workers = 0;
  76. unsigned workerid, node, src, dst; int comb, old_comb = -1;
  77. fprintf(output, "%%rec: worker_count\n\n");
  78. for (workerid = 0; workerid < starpu_worker_get_count(); workerid++)
  79. {
  80. struct starpu_perfmodel_arch* arch = starpu_worker_get_perf_archtype(workerid, STARPU_NMAX_SCHED_CTXS);
  81. comb = starpu_perfmodel_arch_comb_get(arch->ndevices, arch->devices);
  82. if (comb < 0) continue; // Ignore architecture which is not present in any perfmodel
  83. if(comb != old_comb)
  84. {
  85. if(nb_workers > 0)
  86. {
  87. char name[32];
  88. get_comb_name(old_comb, name, 32);
  89. fprintf(output, "Architecture: %s\n", name);
  90. fprintf(output, "NbWorkers: %d\n\n", nb_workers);
  91. }
  92. old_comb = comb;
  93. nb_workers = 1;
  94. }
  95. else
  96. {
  97. nb_workers += 1;
  98. }
  99. }
  100. if(nb_workers > 0)
  101. {
  102. char name[32];
  103. get_comb_name(old_comb, name, 32);
  104. fprintf(output, "Architecture: %s\n", name);
  105. fprintf(output, "NbWorkers: %d\n\n", nb_workers);
  106. }
  107. fprintf(output, "%%rec: memory_workers\n\n");
  108. for (node = 0; node < starpu_memory_nodes_get_count(); node++)
  109. {
  110. unsigned printed = 0;
  111. char name[32];
  112. fprintf(output, "MemoryNode: %u\n", node);
  113. starpu_memory_node_get_name(node, name, sizeof(name));
  114. fprintf(output, "Name: %s\n", name);
  115. fprintf(output, "Size: %ld\n", (long) starpu_memory_get_total(node));
  116. for (workerid = 0; workerid < starpu_worker_get_count(); workerid++)
  117. {
  118. if (starpu_worker_get_memory_node(workerid) == node)
  119. {
  120. if (!printed)
  121. {
  122. fprintf(output, "Workers:");
  123. printed = 1;
  124. }
  125. fprintf(output, " %u", workerid);
  126. }
  127. }
  128. if (printed)
  129. fprintf(output, "\n");
  130. fprintf(output, "\n");
  131. }
  132. fprintf(output, "%%rec: memory_performance\n\n");
  133. for (src = 0; src < starpu_memory_nodes_get_count(); src++)
  134. {
  135. for (dst = 0; dst < starpu_memory_nodes_get_count(); dst++)
  136. {
  137. if (src != dst)
  138. {
  139. fprintf(output, "MemoryNodeSrc: %u\n", src);
  140. fprintf(output, "MemoryNodeDst: %u\n", dst);
  141. fprintf(output, "Bandwidth: %f\n", starpu_transfer_bandwidth(src, dst));
  142. fprintf(output, "Latency: %f\n", starpu_transfer_latency(src, dst));
  143. fprintf(output, "\n");
  144. }
  145. }
  146. }
  147. }
  148. /* output file name */
  149. static char* poutput = NULL;
  150. static char* pinput = NULL;
  151. static void usage()
  152. {
  153. fprintf(stderr, "Dumps perfmodels to a rec file\n\n");
  154. fprintf(stderr, "Usage: %s [ input-file ] [ -o output-file ]\n", PROGNAME);
  155. fprintf(stderr, "\n");
  156. fprintf(stderr, "If input or output file names are not given, stdin and stdout are used.");
  157. fprintf(stderr, "\n");
  158. fprintf(stderr, "Report bugs to <"PACKAGE_BUGREPORT">.");
  159. fprintf(stderr, "\n");
  160. }
  161. static void print_entry(const char *name, const char *archname, FILE *output, struct starpu_perfmodel_history_entry *entry)
  162. {
  163. fprintf(output, "Model: %s\n", name);
  164. fprintf(output, "Architecture: %s\n", archname);
  165. fprintf(output, "Footprint: %08x\n", entry->footprint);
  166. fprintf(output, "Size: %lu\n", (unsigned long) entry->size);
  167. if (!isnan(entry->flops))
  168. fprintf(output, "Flops: %-15e\n", entry->flops);
  169. fprintf(output, "Mean: %-15e\nStddev: %-15e\n",
  170. entry->mean, entry->deviation);
  171. fprintf(output, "Samples: %u\n", entry->nsample);
  172. fprintf(output, "\n");
  173. }
  174. static void parse_args(int argc, char **argv)
  175. {
  176. int c;
  177. static struct option long_options[] =
  178. {
  179. {"help", no_argument, NULL, 'h'},
  180. {"output", required_argument, NULL, 'o'},
  181. {0, 0, 0, 0}
  182. };
  183. int option_index;
  184. while ((c = getopt_long(argc, argv, "ho:", long_options, &option_index)) != -1)
  185. {
  186. switch (c)
  187. {
  188. case 'h': /* display help */
  189. usage();
  190. exit(EXIT_SUCCESS);
  191. break;
  192. case 'o':
  193. poutput = optarg;
  194. break;
  195. case '?':
  196. default:
  197. fprintf(stderr, "Unrecognized option: -%c\n", optopt);
  198. }
  199. }
  200. if(optind < argc)
  201. {
  202. pinput = argv[optind++];
  203. if(optind < argc)
  204. {
  205. fprintf(stderr, "Unrecognized argument: %s\n", argv[optind]);
  206. exit(EXIT_FAILURE);
  207. }
  208. }
  209. }
  210. int main(int argc, char **argv)
  211. {
  212. #if defined(_WIN32) && !defined(__CYGWIN__) && !defined(__MINGW32__)
  213. WSADATA wsadata;
  214. WSAStartup(MAKEWORD(1,0), &wsadata);
  215. _STARPU_MSG("Listing perfmodels is not implemented on pure Windows yet\n");
  216. return 1;
  217. #else
  218. FILE* output;
  219. parse_args(argc, argv);
  220. if(poutput != NULL)
  221. {
  222. output = fopen(poutput, "w+");
  223. if (!output)
  224. {
  225. fprintf(stderr, "couldn't open %s for write: %s\n", poutput, strerror(errno));
  226. exit(EXIT_FAILURE);
  227. }
  228. }
  229. else
  230. {
  231. output = stdout;
  232. }
  233. if (starpu_init(NULL) != 0)
  234. {
  235. fprintf(stderr, "StarPU initialization failure\n");
  236. exit(EXIT_FAILURE);
  237. }
  238. starpu_pause();
  239. if(pinput)
  240. {
  241. FILE* input = fopen(pinput, "r");
  242. char s[1024], *c;
  243. struct model *model, *tmp=NULL;
  244. uint32_t footprint = 0;
  245. char *model_name = NULL;
  246. int ret;
  247. if (!input)
  248. {
  249. fprintf(stderr, "couldn't open %s for read: %s\n", pinput, strerror(errno));
  250. exit(EXIT_FAILURE);
  251. }
  252. while (fgets(s, sizeof(s), input))
  253. {
  254. if (strlen(s) == sizeof(s) - 1)
  255. {
  256. fprintf(stderr, "oops, very long line '%s', it's odd\n", s);
  257. exit(EXIT_FAILURE);
  258. }
  259. if (s[0] == '\n')
  260. {
  261. /* empty line, end of task */
  262. if (model_name)
  263. {
  264. /* Try to get already-loaded model */
  265. HASH_FIND_STR(models, model_name, model);
  266. if (model == NULL)
  267. {
  268. _STARPU_MALLOC(model, sizeof(*model));
  269. model->name = model_name;
  270. model->footprints = NULL;
  271. memset(&model->model, 0, sizeof(model->model));
  272. model->model.type = STARPU_PERFMODEL_INVALID;
  273. ret = starpu_perfmodel_load_symbol(model_name, &model->model);
  274. if (ret == 1)
  275. {
  276. fprintf(stderr, "The performance model for the symbol <%s> could not be loaded\n", model_name);
  277. exit(EXIT_FAILURE);
  278. }
  279. HASH_ADD_STR(models, name, model);
  280. }
  281. else
  282. {
  283. free(model_name);
  284. }
  285. model->footprints = add_footprint(model->footprints, footprint);
  286. model_name = NULL;
  287. }
  288. continue;
  289. }
  290. /* Get rec field name */
  291. c = strchr(s, ':');
  292. if (!c)
  293. {
  294. fprintf(stderr, "odd line '%s'\n", s);
  295. exit(EXIT_FAILURE);
  296. }
  297. if (!STRHEADCMP(s, "Footprint: "))
  298. {
  299. footprint = strtoul(s + strlen("Footprint: "), NULL, 16);
  300. }
  301. else if (!STRHEADCMP(s, "Model: "))
  302. {
  303. model_name = strdup(s + strlen("Model: "));
  304. model_name[strlen(model_name) - 1] = '\0'; /* Drop '\n' */
  305. }
  306. }
  307. /* All models loaded */
  308. {
  309. print_archs(output);
  310. fprintf(output, "%%rec: timing\n\n");
  311. int nb_combs = starpu_perfmodel_get_narch_combs();
  312. HASH_ITER(hh, models, model, tmp)
  313. {
  314. struct _footprint_list* l = model->footprints, *ltmp;
  315. int comb;
  316. while(l)
  317. {
  318. for(comb = 0; comb < nb_combs; comb++)
  319. {
  320. char archname[32];
  321. get_comb_name(comb, archname, 32);
  322. if(!model->model.state || model->model.state->nimpls[comb] == 0)
  323. {
  324. _STARPU_DISP("Symbol %s does not have any implementation on comb %d, not dumping\n", model->name, comb);
  325. continue;
  326. }
  327. if(model->model.state->nimpls[comb] > 1)
  328. _STARPU_DISP("Warning, more than one implementations in comb %d of symbol %s, using only the first one\n", comb, model->name);
  329. struct starpu_perfmodel_per_arch *arch_model = &model->model.state->per_arch[comb][0];
  330. struct starpu_perfmodel_history_list *ptr;
  331. ptr = arch_model->list;
  332. if(!ptr)
  333. _STARPU_DISP("Implementation %d of symbol %s does not have history based model, not dumping\n", comb, model->name);
  334. else while(ptr)
  335. {
  336. struct starpu_perfmodel_history_entry *entry = ptr->entry;
  337. if(entry->footprint == l->footprint)
  338. {
  339. print_entry(model->name, archname, output, entry);
  340. break;
  341. }
  342. ptr=ptr->next;
  343. }
  344. }
  345. ltmp = l->next;
  346. free(l);
  347. l = ltmp;
  348. }
  349. starpu_perfmodel_unload_model(&model->model);
  350. free(model->name);
  351. HASH_DEL(models, model);
  352. free(model);
  353. }
  354. }
  355. fclose(input);
  356. }
  357. else
  358. {
  359. fprintf(output, "%%rec: timing\n\n");
  360. char *path;
  361. DIR *dp;
  362. struct dirent *ep;
  363. path = _starpu_get_perf_model_dir_codelet();
  364. dp = opendir(path);
  365. if (dp != NULL)
  366. {
  367. while ((ep = readdir(dp)))
  368. {
  369. if (strcmp(ep->d_name, ".") && strcmp(ep->d_name, ".."))
  370. {
  371. int comb, nb_combs;
  372. char* symbol = strdup(ep->d_name);
  373. char *dot = strrchr(symbol, '.');
  374. struct starpu_perfmodel model = {.type = STARPU_PERFMODEL_INVALID };
  375. if(dot) *dot = '\0';
  376. if (starpu_perfmodel_load_symbol(symbol, &model) != 0)
  377. {
  378. free(symbol);
  379. continue;
  380. }
  381. if(model.state == NULL)
  382. {
  383. free(symbol);
  384. continue;
  385. }
  386. _STARPU_DISP("Dumping %s\n", symbol);
  387. nb_combs = starpu_perfmodel_get_narch_combs();
  388. for(comb = 0; comb < nb_combs; ++comb)
  389. {
  390. char name[32];
  391. get_comb_name(comb, name, 32);
  392. if(!model.state || model.state->nimpls[comb] == 0)
  393. {
  394. _STARPU_DISP("Symbol %s does not have any implementation on comb %d, not dumping\n", symbol, comb);
  395. fprintf(output, "\n");
  396. continue;
  397. }
  398. struct starpu_perfmodel_per_arch *arch_model = &model.state->per_arch[comb][0];
  399. struct starpu_perfmodel_history_list *ptr;
  400. ptr = arch_model->list;
  401. if(!ptr)
  402. _STARPU_DISP("Symbol %s for comb %d does not have history based model, not dumping\n", symbol, comb);
  403. else while(ptr)
  404. {
  405. print_entry(symbol, name, output, ptr->entry);
  406. ptr=ptr->next;
  407. }
  408. }
  409. starpu_perfmodel_unload_model(&model);
  410. free(symbol);
  411. }
  412. }
  413. closedir (dp);
  414. }
  415. else
  416. {
  417. _STARPU_DISP("Could not open the perfmodel directory <%s>: %s\n", path, strerror(errno));
  418. }
  419. print_archs(output);
  420. }
  421. starpu_resume();
  422. starpu_shutdown();
  423. fclose(output);
  424. return 0;
  425. #endif
  426. }