starpu_perfmodel_recdump.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2017 Inria
  4. * Copyright (C) 2011-2014,2016-2017 CNRS
  5. * Copyright (C) 2011,2013-2014,2017 Université de Bordeaux
  6. * Copyright (C) 2011 Télécom-SudParis
  7. *
  8. * StarPU is free software; you can redistribute it and/or modify
  9. * it under the terms of the GNU Lesser General Public License as published by
  10. * the Free Software Foundation; either version 2.1 of the License, or (at
  11. * your option) any later version.
  12. *
  13. * StarPU is distributed in the hope that it will be useful, but
  14. * WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  16. *
  17. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  18. */
  19. #if !defined(_WIN32) || defined(__MINGW32__) || defined(__CYGWIN__)
  20. #include <dirent.h>
  21. #include <sys/stat.h>
  22. #endif
  23. #include <config.h>
  24. #include <assert.h>
  25. #include <getopt.h>
  26. #include <unistd.h>
  27. #include <stdio.h>
  28. #include <starpu.h>
  29. #include <common/utils.h>
  30. #include <common/uthash.h>
  31. #include <core/perfmodel/perfmodel.h> // we need to browse the list associated to history-based models
  32. // just like in starpu_perfmodel_plot
  33. #define STRHEADCMP(s, head) strncmp(s, head, strlen(head))
  34. #if defined(_WIN32) && !defined(__CYGWIN__)
  35. #include <windows.h>
  36. #endif
  37. #define PROGNAME "starpu_perfmodel_recdump"
  38. struct _footprint_list
  39. {
  40. struct _footprint_list* next;
  41. uint32_t footprint;
  42. };
  43. struct _footprint_list* add_footprint(struct _footprint_list* list, uint32_t footprint)
  44. {
  45. struct _footprint_list * l = list;
  46. while(l)
  47. {
  48. if(l->footprint == footprint) break;
  49. l = l->next;
  50. }
  51. if(l) return list;
  52. else
  53. {
  54. struct _footprint_list * res = malloc(sizeof(struct _footprint_list));
  55. res->footprint = footprint;
  56. res->next = list;
  57. return res;
  58. }
  59. }
  60. static struct model
  61. {
  62. UT_hash_handle hh;
  63. char *name;
  64. struct starpu_perfmodel model;
  65. struct _footprint_list* footprints;
  66. } *models;
  67. void get_comb_name(int comb, char* name, int name_size)
  68. {
  69. struct starpu_perfmodel_arch *arch_comb = starpu_perfmodel_arch_comb_fetch(comb);
  70. STARPU_ASSERT_MSG(arch_comb->ndevices == 1, "Cannot work with multi-device workers\n");
  71. snprintf(name, name_size, "%s%d", starpu_perfmodel_get_archtype_name(arch_comb->devices[0].type), arch_comb->devices[0].devid);
  72. }
  73. void print_archs(FILE* output)
  74. {
  75. int nb_workers = 0;
  76. unsigned workerid; int comb, old_comb = -1;
  77. fprintf(output, "%%rec: worker_count\n\n");
  78. for (workerid = 0; workerid < starpu_worker_get_count(); workerid++)
  79. {
  80. struct starpu_perfmodel_arch* arch = starpu_worker_get_perf_archtype(workerid, STARPU_NMAX_SCHED_CTXS);
  81. comb = starpu_perfmodel_arch_comb_get(arch->ndevices, arch->devices);
  82. STARPU_ASSERT(comb >= 0);
  83. if(comb != old_comb) {
  84. if(nb_workers > 0) {
  85. char name[32];
  86. get_comb_name(old_comb, name, 32);
  87. fprintf(output, "Architecture: %s\n", name);
  88. fprintf(output, "NbWorkers: %d\n\n", nb_workers);
  89. }
  90. old_comb = comb;
  91. nb_workers = 1;
  92. } else {
  93. nb_workers += 1;
  94. }
  95. }
  96. if(nb_workers > 0) {
  97. char name[32];
  98. get_comb_name(old_comb, name, 32);
  99. fprintf(output, "Architecture: %s\n", name);
  100. fprintf(output, "NbWorkers: %d\n\n", nb_workers);
  101. }
  102. }
  103. /* output file name */
  104. static char* poutput = NULL;
  105. static char* pinput = NULL;
  106. static void usage()
  107. {
  108. fprintf(stderr, "Dumps perfmodels to a rec file\n\n");
  109. fprintf(stderr, "Usage: %s [ output-file ]\n", PROGNAME);
  110. fprintf(stderr, "\n");
  111. fprintf(stderr, "If input or output file names are not given, stdin and stdout are used.");
  112. fprintf(stderr, "\n");
  113. fprintf(stderr, "Report bugs to <"PACKAGE_BUGREPORT">.");
  114. fprintf(stderr, "\n");
  115. }
  116. static void parse_args(int argc, char **argv)
  117. {
  118. int c;
  119. static struct option long_options[] =
  120. {
  121. {"help", no_argument, NULL, 'h'},
  122. {"output", required_argument, NULL, 'o'},
  123. {0, 0, 0, 0}
  124. };
  125. int option_index;
  126. while ((c = getopt_long(argc, argv, "ho:", long_options, &option_index)) != -1)
  127. {
  128. switch (c)
  129. {
  130. case 'h': /* display help */
  131. usage();
  132. exit(EXIT_SUCCESS);
  133. break;
  134. case 'o':
  135. poutput = optarg;
  136. break;
  137. case '?':
  138. default:
  139. fprintf(stderr, "Unrecognized option: -%c\n", optopt);
  140. }
  141. }
  142. if(optind < argc)
  143. {
  144. pinput = argv[optind++];
  145. if(optind < argc)
  146. {
  147. fprintf(stderr, "Unrecognized argument: %s\n", argv[optind]);
  148. exit(EXIT_FAILURE);
  149. }
  150. }
  151. }
  152. int main(int argc, char **argv)
  153. {
  154. #if defined(_WIN32) && !defined(__CYGWIN__) && !defined(__MINGW32__)
  155. WSADATA wsadata;
  156. WSAStartup(MAKEWORD(1,0), &wsadata);
  157. _STARPU_MSG("Listing perfmodels is not implemented on pure Windows yet\n");
  158. return 1;
  159. #else
  160. FILE* output;
  161. parse_args(argc, argv);
  162. if(poutput != NULL)
  163. {
  164. output = fopen(poutput, "w+");
  165. if (!output)
  166. {
  167. fprintf(stderr, "couldn't open %s for write: %s\n", poutput, strerror(errno));
  168. exit(EXIT_FAILURE);
  169. }
  170. }
  171. else
  172. {
  173. output = stdout;
  174. }
  175. if (starpu_init(NULL) != 0)
  176. {
  177. fprintf(stderr, "StarPU initialization failure\n");
  178. exit(EXIT_FAILURE);
  179. }
  180. starpu_pause();
  181. if(pinput)
  182. {
  183. FILE* input = fopen(pinput, "r");
  184. char s[1024], *c;
  185. struct model *model, *tmp;
  186. uint32_t footprint = 0;
  187. char *model_name = NULL;
  188. int ret;
  189. if (!input)
  190. {
  191. fprintf(stderr, "couldn't open %s for read: %s\n", pinput, strerror(errno));
  192. exit(EXIT_FAILURE);
  193. }
  194. while (fgets(s, sizeof(s), input))
  195. {
  196. if (strlen(s) == sizeof(s) - 1)
  197. {
  198. fprintf(stderr, "oops, very long line '%s', it's odd\n", s);
  199. exit(EXIT_FAILURE);
  200. }
  201. if (s[0] == '\n')
  202. {
  203. /* empty line, end of task */
  204. if (model_name)
  205. {
  206. /* Try to get already-loaded model */
  207. HASH_FIND_STR(models, model_name, model);
  208. if (model == NULL)
  209. {
  210. model = malloc(sizeof(*model));
  211. model->name = model_name;
  212. model->footprints = NULL;
  213. memset(&model->model, 0, sizeof(model->model));
  214. model->model.type = STARPU_PERFMODEL_INVALID;
  215. ret = starpu_perfmodel_load_symbol(model_name, &model->model);
  216. if (ret == 1)
  217. {
  218. fprintf(stderr, "The performance model for the symbol <%s> could not be loaded\n", model_name);
  219. exit(EXIT_FAILURE);
  220. }
  221. HASH_ADD_STR(models, name, model);
  222. }
  223. else
  224. {
  225. free(model_name);
  226. }
  227. model->footprints = add_footprint(model->footprints, footprint);
  228. model_name = NULL;
  229. }
  230. continue;
  231. }
  232. /* Get rec field name */
  233. c = strchr(s, ':');
  234. if (!c)
  235. {
  236. fprintf(stderr, "odd line '%s'\n", s);
  237. exit(EXIT_FAILURE);
  238. }
  239. if (!STRHEADCMP(s, "Footprint: "))
  240. {
  241. footprint = strtoul(s + strlen("Footprint: "), NULL, 16);
  242. }
  243. else if (!STRHEADCMP(s, "Model: "))
  244. {
  245. model_name = strdup(s + strlen("Model: "));
  246. model_name[strlen(model_name) - 1] = '\0'; /* Drop '\n' */
  247. }
  248. }
  249. /* All models loaded */
  250. {
  251. print_archs(output);
  252. fprintf(output, "%%rec: timing\n\n");
  253. int nb_combs = starpu_perfmodel_get_narch_combs();
  254. HASH_ITER(hh, models, model, tmp)
  255. {
  256. struct _footprint_list* l = model->footprints, *ltmp;
  257. int comb;
  258. while(l)
  259. {
  260. for(comb = 0; comb < nb_combs; comb++)
  261. {
  262. char archname[32];
  263. get_comb_name(comb, archname, 32);
  264. if(!model->model.state || model->model.state->nimpls[comb] == 0)
  265. {
  266. _STARPU_DISP("Symbol %s does not have any implementation on comb %d, not dumping\n", model->name, comb);
  267. continue;
  268. }
  269. if(model->model.state->nimpls[comb] > 1)
  270. _STARPU_DISP("Warning, more than one implementations in comb %d of symbol %s, using only the first one\n", comb, model->name);
  271. struct starpu_perfmodel_per_arch *arch_model = &model->model.state->per_arch[comb][0];
  272. struct starpu_perfmodel_history_list *ptr;
  273. ptr = arch_model->list;
  274. if(!ptr)
  275. _STARPU_DISP("Implementation %d of symbol %s does not have history based model, not dumping\n", comb, model->name);
  276. else while(ptr)
  277. {
  278. struct starpu_perfmodel_history_entry *entry = ptr->entry;
  279. if(entry->footprint == l->footprint)
  280. {
  281. fprintf(output, "Name: %s\n", model->name);
  282. fprintf(output, "Architecture: %s\n", archname);
  283. fprintf(output, "Footprint: %08x\n", l->footprint);
  284. fprintf(output, "Mean: %-15e\nStddev: %-15e\n",
  285. entry->mean, entry->deviation);
  286. fprintf(output, "\n");
  287. break;
  288. }
  289. ptr=ptr->next;
  290. }
  291. }
  292. ltmp = l->next;
  293. free(l);
  294. l = ltmp;
  295. }
  296. free(model->name);
  297. HASH_DEL(models, model);
  298. }
  299. }
  300. fclose(input);
  301. }
  302. else
  303. {
  304. fprintf(output, "%%rec: timing\n\n");
  305. char *path;
  306. DIR *dp;
  307. struct dirent *ep;
  308. path = _starpu_get_perf_model_dir_codelet();
  309. dp = opendir(path);
  310. if (dp != NULL)
  311. {
  312. while ((ep = readdir(dp)))
  313. {
  314. if (strcmp(ep->d_name, ".") && strcmp(ep->d_name, ".."))
  315. {
  316. int comb, nb_combs;
  317. char* symbol = strdup(ep->d_name);
  318. char *dot = strrchr(symbol, '.');
  319. struct starpu_perfmodel model = {.type = STARPU_PERFMODEL_INVALID };
  320. if(dot) *dot = '\0';
  321. if (starpu_perfmodel_load_symbol(symbol, &model) != 0)
  322. {
  323. free(symbol);
  324. continue;
  325. }
  326. if(model.state == NULL)
  327. {
  328. free(symbol);
  329. continue;
  330. }
  331. _STARPU_DISP("Dumping %s\n", symbol);
  332. nb_combs = starpu_perfmodel_get_narch_combs();
  333. for(comb = 0; comb < nb_combs; ++comb)
  334. {
  335. char name[32];
  336. get_comb_name(comb, name, 32);
  337. if(!model.state || model.state->nimpls[comb] == 0)
  338. {
  339. _STARPU_DISP("Symbol %s does not have any implementation on comb %d, not dumping\n", symbol, comb);
  340. fprintf(output, "\n");
  341. continue;
  342. }
  343. struct starpu_perfmodel_per_arch *arch_model = &model.state->per_arch[comb][0];
  344. struct starpu_perfmodel_history_list *ptr;
  345. ptr = arch_model->list;
  346. if(!ptr)
  347. _STARPU_DISP("Symbol %s for comb %d does not have history based model, not dumping\n", symbol, comb);
  348. else while(ptr)
  349. {
  350. struct starpu_perfmodel_history_entry *entry = ptr->entry;
  351. fprintf(output, "Name: %s\n", symbol);
  352. fprintf(output, "Architecture: %s\n", name);
  353. fprintf(output, "Footprint: %08x\nMean: %-15e\nStddev: %-15e\n",
  354. entry->footprint, entry->mean, entry->deviation);
  355. fprintf(output, "\n");
  356. ptr=ptr->next;
  357. }
  358. }
  359. starpu_perfmodel_unload_model(&model);
  360. free(symbol);
  361. }
  362. }
  363. closedir (dp);
  364. }
  365. else
  366. {
  367. _STARPU_DISP("Could not open the perfmodel directory <%s>: %s\n", path, strerror(errno));
  368. }
  369. print_archs(output);
  370. }
  371. starpu_resume();
  372. starpu_shutdown();
  373. fclose(output);
  374. return 0;
  375. #endif
  376. }