starpu_perfmodel_plot.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2011-2012 Université de Bordeaux 1
  4. * Copyright (C) 2011, 2012 Centre National de la Recherche Scientifique
  5. * Copyright (C) 2011 Télécom-SudParis
  6. *
  7. * StarPU is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU Lesser General Public License as published by
  9. * the Free Software Foundation; either version 2.1 of the License, or (at
  10. * your option) any later version.
  11. *
  12. * StarPU is distributed in the hope that it will be useful, but
  13. * WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  15. *
  16. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  17. */
  18. #include <config.h>
  19. #include <assert.h>
  20. #include <unistd.h>
  21. #include <stdio.h>
  22. #include <sys/stat.h>
  23. #include <limits.h>
  24. #include <starpu.h>
  25. #include <core/perfmodel/perfmodel.h> // we need to browse the list associated to history-based models
  26. #ifdef __MINGW32__
  27. #include <windows.h>
  28. #endif
  29. #define PROGNAME "starpu_perfmodel_plot"
  30. static struct starpu_perfmodel model;
  31. /* display all available models */
  32. static int list = 0;
  33. /* what kernel ? */
  34. static char *symbol = NULL;
  35. /* which architecture ? (NULL = all)*/
  36. static char *arch = NULL;
  37. /* Unless a FxT file is specified, we just display the model */
  38. static int no_fxt_file = 1;
  39. #ifdef STARPU_USE_FXT
  40. static struct starpu_fxt_codelet_event *dumped_codelets;
  41. static long dumped_codelets_count;
  42. static struct starpu_fxt_options options;
  43. #endif
  44. #ifdef STARPU_USE_FXT
  45. static int archtype_is_found[STARPU_NARCH_VARIATIONS];
  46. static char data_file_name[256];
  47. #endif
  48. static char avg_file_name[256];
  49. static char gnuplot_file_name[256];
  50. static void usage(char **argv)
  51. {
  52. fprintf(stderr, "Draw a graph corresponding to the execution time of a \
  53. given perfmodel\n");
  54. fprintf(stderr, "Usage: %s [ options ]\n", PROGNAME);
  55. fprintf(stderr, "\n");
  56. fprintf(stderr, "One must specify a symbol with the -s option or use -l\n");
  57. fprintf(stderr, "Options:\n");
  58. fprintf(stderr, " -l display all available models\n");
  59. fprintf(stderr, " -s <symbol> specify the symbol\n");
  60. fprintf(stderr, " -i <Fxt files> input FxT files generated by StarPU\n");
  61. fprintf(stderr, " -a <arch> specify the architecture (e.g. cpu, cpu:k, cuda_k, gordon)\n");
  62. fprintf(stderr, " -h, --help display this help and exit\n");
  63. fprintf(stderr, " -v, --version output version information and exit\n\n");
  64. fprintf(stderr, "Report bugs to <%s>.", PACKAGE_BUGREPORT);
  65. fprintf(stderr, "\n");
  66. }
  67. static void parse_args(int argc, char **argv)
  68. {
  69. #ifdef STARPU_USE_FXT
  70. /* Default options */
  71. starpu_fxt_options_init(&options);
  72. options.out_paje_path = NULL;
  73. options.activity_path = NULL;
  74. options.distrib_time_path = NULL;
  75. options.dag_path = NULL;
  76. options.dumped_codelets = &dumped_codelets;
  77. #endif
  78. /* We want to support arguments such as "-i trace_*" */
  79. unsigned reading_input_filenames = 0;
  80. int i;
  81. for (i = 1; i < argc; i++) {
  82. if (strcmp(argv[i], "-s") == 0) {
  83. symbol = argv[++i];
  84. continue;
  85. }
  86. if (strcmp(argv[i], "-i") == 0) {
  87. reading_input_filenames = 1;
  88. #ifdef STARPU_USE_FXT
  89. options.filenames[options.ninputfiles++] = argv[++i];
  90. no_fxt_file = 0;
  91. #else
  92. fprintf(stderr, "Warning: FxT support was not enabled in StarPU: FxT traces will thus be ignored!\n");
  93. #endif
  94. continue;
  95. }
  96. if (strcmp(argv[i], "-l") == 0) {
  97. list = 1;
  98. continue;
  99. }
  100. if (strcmp(argv[i], "-a") == 0) {
  101. arch = argv[++i];
  102. continue;
  103. }
  104. if (strcmp(argv[i], "-h") == 0 ||
  105. strcmp(argv[i], "--help") == 0) {
  106. usage(argv);
  107. exit(EXIT_SUCCESS);
  108. }
  109. if (strcmp(argv[i], "-v") == 0 ||
  110. strcmp(argv[i], "--version") == 0) {
  111. (void) fprintf(stdout, "%s %d.%d\n",
  112. PROGNAME, STARPU_MAJOR_VERSION,
  113. STARPU_MINOR_VERSION);
  114. exit(EXIT_SUCCESS);
  115. }
  116. /* If the reading_input_filenames flag is set, and that the
  117. * argument does not match an option, we assume this may be
  118. * another filename */
  119. if (reading_input_filenames)
  120. {
  121. #ifdef STARPU_USE_FXT
  122. options.filenames[options.ninputfiles++] = argv[i];
  123. #endif
  124. continue;
  125. }
  126. }
  127. if (!symbol && !list)
  128. {
  129. fprintf(stderr, "Incorrect usage, aborting\n");
  130. usage(argv);
  131. exit(-1);
  132. }
  133. }
  /* Separate successive items of the gnuplot "plot" command.
   * The first call only clears *first; every later call writes a comma, a
   * backslash line continuation, a newline and a tab to gnuplot_file. */
  static void print_comma(FILE *gnuplot_file, int *first)
  {
      if (!*first) {
          fputs(",\\\n\t", gnuplot_file);
          return;
      }
      *first = 0;
  }
  144. static void display_perf_model(FILE *gnuplot_file, struct starpu_perfmodel *model, enum starpu_perf_archtype arch, int *first, unsigned nimpl)
  145. {
  146. char arch_name[256];
  147. starpu_perfmodel_get_arch_name(arch, arch_name, 256, nimpl);
  148. struct starpu_perfmodel_per_arch *arch_model =
  149. &model->per_arch[arch][nimpl];
  150. if (arch_model->regression.valid || arch_model->regression.nl_valid)
  151. fprintf(stderr,"Arch: %s\n", arch_name);
  152. #ifdef STARPU_USE_FXT
  153. if (!no_fxt_file && archtype_is_found[arch])
  154. {
  155. print_comma(gnuplot_file, first);
  156. fprintf(gnuplot_file, "\"< grep -w \\^%d %s\" using 2:3 title \"%s\"", arch, data_file_name, arch_name);
  157. }
  158. #endif
  159. /* Only display the regression model if we could actually build a model */
  160. if (arch_model->regression.valid && !arch_model->regression.nl_valid)
  161. {
  162. print_comma(gnuplot_file, first);
  163. fprintf(stderr, "\tLinear: y = alpha size ^ beta\n");
  164. fprintf(stderr, "\t\talpha = %e\n", arch_model->regression.alpha * 0.001);
  165. fprintf(stderr, "\t\tbeta = %e\n", arch_model->regression.beta);
  166. fprintf(gnuplot_file, "0.001 * %f * x ** %f title \"Linear Regression %s\"",
  167. arch_model->regression.alpha, arch_model->regression.beta, arch_name);
  168. }
  169. if (arch_model->regression.nl_valid)
  170. {
  171. print_comma(gnuplot_file, first);
  172. fprintf(stderr, "\tNon-Linear: y = a size ^b + c\n");
  173. fprintf(stderr, "\t\ta = %e\n", arch_model->regression.a * 0.001);
  174. fprintf(stderr, "\t\tb = %e\n", arch_model->regression.b);
  175. fprintf(stderr, "\t\tc = %e\n", arch_model->regression.c * 0.001);
  176. fprintf(gnuplot_file, "0.001 * %f * x ** %f + 0.001 * %f title \"Non-Linear Regression %s\"",
  177. arch_model->regression.a, arch_model->regression.b, arch_model->regression.c, arch_name);
  178. }
  179. }
  180. static void display_history_based_perf_models(FILE *gnuplot_file, struct starpu_perfmodel *model, enum starpu_perf_archtype arch1, enum starpu_perf_archtype arch2, int *first)
  181. {
  182. char *command;
  183. FILE *datafile;
  184. unsigned arch;
  185. struct starpu_perfmodel_history_list *ptr;
  186. char archname[32];
  187. int col;
  188. int len;
  189. unsigned long last, minimum = 0;
  190. len = 10 + strlen(avg_file_name) + 1;
  191. command = (char *) malloc(len);
  192. datafile = fopen(avg_file_name, "w");
  193. free(command);
  194. col = 2;
  195. unsigned implid;
  196. for (arch = arch1; arch < arch2; arch++) {
  197. for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++) {
  198. struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[arch][implid];
  199. starpu_perfmodel_get_arch_name((enum starpu_perf_archtype) arch, archname, 32, implid);
  200. //ptrs[arch-arch1][implid] = ptr[arch-arch1][implid] = arch_model->list;
  201. if (arch_model->list) {
  202. print_comma(gnuplot_file, first);
  203. fprintf(gnuplot_file, "\"%s\" using 1:%d:%d with errorlines title \"Measured %s\"", avg_file_name, col, col+1, archname);
  204. col += 2;
  205. }
  206. }
  207. }
  208. while (1) {
  209. last = minimum;
  210. minimum = ULONG_MAX;
  211. /* Get the next minimum */
  212. for (arch = arch1; arch < arch2; arch++)
  213. for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++) {
  214. struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[arch][implid];
  215. for (ptr = arch_model->list; ptr; ptr = ptr->next) {
  216. unsigned long size = ptr->entry->size;
  217. if (size > last && size < minimum)
  218. minimum = size;
  219. }
  220. }
  221. if (minimum == ULONG_MAX)
  222. break;
  223. fprintf(stderr, "%lu ", minimum);
  224. fprintf(datafile, "%-15lu ", minimum);
  225. for (arch = arch1; arch < arch2; arch++) {
  226. for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++) {
  227. struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[arch][implid];
  228. for (ptr = arch_model->list; ptr; ptr = ptr->next) {
  229. struct starpu_perfmodel_history_entry *entry = ptr->entry;
  230. if (entry->size == minimum) {
  231. fprintf(datafile, "\t%-15le\t%-15le", 0.001*entry->mean, 0.001*entry->deviation);
  232. break;
  233. }
  234. }
  235. if (!ptr && arch_model->list)
  236. /* No value for this arch. */
  237. fprintf(datafile, "\t\"\"\t\"\"");
  238. }
  239. }
  240. fprintf(datafile, "\n");
  241. }
  242. fprintf(stderr, "\n");
  243. fclose(datafile);
  244. }
  245. static void display_perf_models(FILE *gnuplot_file, struct starpu_perfmodel *model, enum starpu_perf_archtype arch1, enum starpu_perf_archtype arch2, int *first)
  246. {
  247. unsigned arch;
  248. unsigned implid;
  249. for (arch = arch1; arch < arch2; arch++) {
  250. for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++) {
  251. display_perf_model(gnuplot_file, model, (enum starpu_perf_archtype) arch, first,
  252. implid);
  253. }
  254. }
  255. display_history_based_perf_models(gnuplot_file, model, arch1, arch2, first);
  256. }
  257. #ifdef STARPU_USE_FXT
  258. static void dump_data_file(FILE *data_file)
  259. {
  260. memset(archtype_is_found, 0, STARPU_NARCH_VARIATIONS*sizeof(int));
  261. int i;
  262. for (i = 0; i < options.dumped_codelets_count; i++)
  263. {
  264. /* Dump only if the symbol matches user's request */
  265. if (strcmp(dumped_codelets[i].symbol, symbol) == 0) {
  266. enum starpu_perf_archtype archtype = dumped_codelets[i].archtype;
  267. archtype_is_found[archtype] = 1;
  268. size_t size = dumped_codelets[i].size;
  269. float time = dumped_codelets[i].time;
  270. fprintf(data_file, "%d %f %f\n", archtype, (float)size, time);
  271. }
  272. }
  273. }
  274. #endif
  275. static void display_selected_models(FILE *gnuplot_file, struct starpu_perfmodel *model)
  276. {
  277. fprintf(gnuplot_file, "#!/usr/bin/gnuplot -persist\n");
  278. fprintf(gnuplot_file, "\n");
  279. fprintf(gnuplot_file, "set term postscript eps enhanced color\n");
  280. fprintf(gnuplot_file, "set output \"starpu_%s.eps\"\n", symbol);
  281. fprintf(gnuplot_file, "set title \"Model for codelet %s\"\n", symbol);
  282. fprintf(gnuplot_file, "set xlabel \"Total data size\"\n");
  283. fprintf(gnuplot_file, "set ylabel \"Time (ms)\"\n");
  284. fprintf(gnuplot_file, "\n");
  285. fprintf(gnuplot_file, "set key top left\n");
  286. fprintf(gnuplot_file, "set logscale x\n");
  287. fprintf(gnuplot_file, "set logscale y\n");
  288. fprintf(gnuplot_file, "\n");
  289. /* If no input data is given to gnuplot, we at least need to specify an
  290. * arbitrary range. */
  291. if (no_fxt_file)
  292. fprintf(gnuplot_file, "set xrange [1:10**9]\n\n");
  293. int first = 1;
  294. fprintf(gnuplot_file, "plot\t");
  295. if (arch == NULL)
  296. {
  297. /* display all architectures */
  298. display_perf_models(gnuplot_file, model, (enum starpu_perf_archtype) 0, (enum starpu_perf_archtype) STARPU_NARCH_VARIATIONS, &first);
  299. }
  300. else {
  301. if (strcmp(arch, "cpu") == 0) {
  302. unsigned impl;
  303. for (impl = 0; impl < STARPU_MAXIMPLEMENTATIONS; impl++) {
  304. display_perf_model(gnuplot_file, model,
  305. STARPU_CPU_DEFAULT,
  306. &first, impl);
  307. }
  308. return;
  309. }
  310. int k;
  311. if (sscanf(arch, "cpu:%d", &k) == 1)
  312. {
  313. /* For combined CPU workers */
  314. if ((k < 1) || (k > STARPU_MAXCPUS))
  315. {
  316. fprintf(stderr, "Invalid CPU size\n");
  317. exit(-1);
  318. }
  319. display_perf_models(gnuplot_file, model, (enum starpu_perf_archtype) (STARPU_CPU_DEFAULT + k - 1), (enum starpu_perf_archtype) (STARPU_CPU_DEFAULT + k), &first);
  320. return;
  321. }
  322. if (strcmp(arch, "cuda") == 0) {
  323. display_perf_models(gnuplot_file, model, STARPU_CUDA_DEFAULT, (enum starpu_perf_archtype) (STARPU_CUDA_DEFAULT + STARPU_MAXCUDADEVS), &first);
  324. return;
  325. }
  326. /* There must be a cleaner way ! */
  327. int gpuid;
  328. int nmatched;
  329. nmatched = sscanf(arch, "cuda_%d", &gpuid);
  330. if (nmatched == 1)
  331. {
  332. unsigned archid = STARPU_CUDA_DEFAULT+ gpuid;
  333. display_perf_models(gnuplot_file, model, (enum starpu_perf_archtype) archid, (enum starpu_perf_archtype) (archid + 1), &first);
  334. return;
  335. }
  336. if (strcmp(arch, "gordon") == 0) {
  337. display_perf_models(gnuplot_file, model, STARPU_GORDON_DEFAULT, (enum starpu_perf_archtype) (STARPU_GORDON_DEFAULT + 1), &first);
  338. return;
  339. }
  340. fprintf(stderr, "Unknown architecture requested, aborting.\n");
  341. exit(-1);
  342. }
  343. }
  344. int main(int argc, char **argv)
  345. {
  346. int ret;
  347. #ifdef __MINGW32__
  348. WSADATA wsadata;
  349. WSAStartup(MAKEWORD(1,0), &wsadata);
  350. #endif
  351. parse_args(argc, argv);
  352. if (list) {
  353. int ret = starpu_perfmodel_list(stdout);
  354. if (ret) {
  355. fprintf(stderr, "The performance model directory is invalid\n");
  356. return 1;
  357. }
  358. return 0;
  359. }
  360. /* Load the performance model associated to the symbol */
  361. ret = starpu_perfmodel_load_symbol(symbol, &model);
  362. if (ret == 1)
  363. {
  364. fprintf(stderr, "The performance model for the symbol <%s> could not be loaded\n", symbol);
  365. return 1;
  366. }
  367. /* If some FxT input was specified, we put the points on the graph */
  368. #ifdef STARPU_USE_FXT
  369. if (!no_fxt_file)
  370. {
  371. starpu_fxt_generate_trace(&options);
  372. snprintf(data_file_name, 256, "starpu_%s.data", symbol);
  373. FILE *data_file = fopen(data_file_name, "w+");
  374. STARPU_ASSERT(data_file);
  375. dump_data_file(data_file);
  376. fclose(data_file);
  377. }
  378. #endif
  379. snprintf(gnuplot_file_name, 256, "starpu_%s.gp", symbol);
  380. snprintf(avg_file_name, 256, "starpu_%s_avg.data", symbol);
  381. FILE *gnuplot_file = fopen(gnuplot_file_name, "w+");
  382. STARPU_ASSERT(gnuplot_file);
  383. display_selected_models(gnuplot_file, &model);
  384. fclose(gnuplot_file);
  385. /* Retrieve the current mode of the gnuplot executable */
  386. struct stat sb;
  387. ret = stat(gnuplot_file_name, &sb);
  388. if (ret)
  389. {
  390. perror("stat");
  391. STARPU_ABORT();
  392. }
  393. /* Make the gnuplot scrit executable for the owner */
  394. ret = chmod(gnuplot_file_name, sb.st_mode|S_IXUSR);
  395. if (ret)
  396. {
  397. perror("chmod");
  398. STARPU_ABORT();
  399. }
  400. return 0;
  401. }