/* StarPU --- Runtime system for heterogeneous multicore architectures. * * Copyright (C) 2011-2013 Université de Bordeaux 1 * Copyright (C) 2011, 2012, 2013 Centre National de la Recherche Scientifique * Copyright (C) 2011 Télécom-SudParis * * StarPU is free software; you can redistribute it and/or modify * it under the terms of the GNU Lesser General Public License as published by * the Free Software Foundation; either version 2.1 of the License, or (at * your option) any later version. * * StarPU is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. * * See the GNU Lesser General Public License in COPYING.LGPL for more details. */ #include #include #include #include #include #include #ifdef STARPU_USE_FXT #include #endif #include #include #include // we need to browse the list associated to history-based models #ifdef __MINGW32__ #include #endif #define PROGNAME "starpu_perfmodel_plot" /* display all available models */ static int list = 0; /* what kernel ? */ static char *symbol = NULL; /* which architecture ? (NULL = all)*/ static char *archname = NULL; /* Unless a FxT file is specified, we just display the model */ static int no_fxt_file = 1; static int gflops = 0; #ifdef STARPU_USE_FXT static struct starpu_fxt_codelet_event *dumped_codelets; static struct starpu_fxt_options options; #endif #ifdef STARPU_USE_FXT static int archtype_is_found[STARPU_NARCH_VARIATIONS]; static char data_file_name[256]; #endif static char avg_file_name[256]; static char gnuplot_file_name[256]; static void usage() { fprintf(stderr, "Draw a graph corresponding to the execution time of a \ given perfmodel\n"); fprintf(stderr, "Usage: %s [ options ]\n", PROGNAME); fprintf(stderr, "\n"); fprintf(stderr, "One must specify a symbol with the -s option or use -l\n"); fprintf(stderr, "Options:\n"); fprintf(stderr, " -l display all available models\n"); fprintf(stderr, " -s specify the symbol\n"); fprintf(stderr, " -f draw GFlops instead of time\n"); fprintf(stderr, " -i input FxT files generated by StarPU\n"); fprintf(stderr, " -a specify the architecture (e.g. cpu, cpu:x, cuda, cuda_d, opencl, opencl_d)\n"); fprintf(stderr, " -h, --help display this help and exit\n"); fprintf(stderr, " -v, --version output version information and exit\n\n"); fprintf(stderr, "Report bugs to <%s>.", PACKAGE_BUGREPORT); fprintf(stderr, "\n"); } static void parse_args(int argc, char **argv) { #ifdef STARPU_USE_FXT /* Default options */ starpu_fxt_options_init(&options); options.out_paje_path = NULL; options.activity_path = NULL; options.distrib_time_path = NULL; options.dag_path = NULL; options.dumped_codelets = &dumped_codelets; #endif /* We want to support arguments such as "-i trace_*" */ unsigned reading_input_filenames = 0; int i; for (i = 1; i < argc; i++) { if (strcmp(argv[i], "-s") == 0) { symbol = argv[++i]; continue; } if (strcmp(argv[i], "-i") == 0) { reading_input_filenames = 1; #ifdef STARPU_USE_FXT options.filenames[options.ninputfiles++] = argv[++i]; no_fxt_file = 0; #else fprintf(stderr, "Warning: FxT support was not enabled in StarPU: FxT traces will thus be ignored!\n"); #endif continue; } if (strcmp(argv[i], "-l") == 0) { list = 1; continue; } if (strcmp(argv[i], "-f") == 0) { gflops = 1; continue; } if (strcmp(argv[i], "-a") == 0) { archname = argv[++i]; continue; } if (strcmp(argv[i], "-h") == 0 || strcmp(argv[i], "--help") == 0) { usage(); exit(EXIT_SUCCESS); } if (strcmp(argv[i], "-v") == 0 || strcmp(argv[i], "--version") == 0) { fputs(PROGNAME " (" PACKAGE_NAME ") " PACKAGE_VERSION "\n", stderr); exit(EXIT_SUCCESS); } /* If the reading_input_filenames flag is set, and that the * argument does not match an option, we assume this may be * another filename */ if (reading_input_filenames) { #ifdef STARPU_USE_FXT options.filenames[options.ninputfiles++] = argv[i]; #endif continue; } } if (!symbol && !list) { fprintf(stderr, "Incorrect usage, aborting\n"); usage(argv); exit(-1); } } static void print_comma(FILE *gnuplot_file, int *first) { if (*first) { *first = 0; } else { fprintf(gnuplot_file, ",\\\n\t"); } } static void display_perf_model(FILE *gnuplot_file, struct starpu_perfmodel *model, enum starpu_perfmodel_archtype arch, int *first, unsigned nimpl) { char arch_name[256]; starpu_perfmodel_get_arch_name(arch, arch_name, 256, nimpl); struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[arch][nimpl]; if (arch_model->regression.valid || arch_model->regression.nl_valid) fprintf(stderr,"Arch: %s\n", arch_name); #ifdef STARPU_USE_FXT if (!gflops && !no_fxt_file && archtype_is_found[arch] && nimpl == 0) { print_comma(gnuplot_file, first); fprintf(gnuplot_file, "\"< grep -w \\^%d %s\" using 2:3 title \"Profiling %s\"", arch, data_file_name, arch_name); } #endif /* Only display the regression model if we could actually build a model */ if (!gflops && arch_model->regression.valid && !arch_model->regression.nl_valid) { print_comma(gnuplot_file, first); fprintf(stderr, "\tLinear: y = alpha size ^ beta\n"); fprintf(stderr, "\t\talpha = %e\n", arch_model->regression.alpha * 0.001); fprintf(stderr, "\t\tbeta = %e\n", arch_model->regression.beta); fprintf(gnuplot_file, "0.001 * %f * x ** %f title \"Linear Regression %s\"", arch_model->regression.alpha, arch_model->regression.beta, arch_name); } if (!gflops && arch_model->regression.nl_valid) { print_comma(gnuplot_file, first); fprintf(stderr, "\tNon-Linear: y = a size ^b + c\n"); fprintf(stderr, "\t\ta = %e\n", arch_model->regression.a * 0.001); fprintf(stderr, "\t\tb = %e\n", arch_model->regression.b); fprintf(stderr, "\t\tc = %e\n", arch_model->regression.c * 0.001); fprintf(gnuplot_file, "0.001 * %f * x ** %f + 0.001 * %f title \"Non-Linear Regression %s\"", arch_model->regression.a, arch_model->regression.b, arch_model->regression.c, arch_name); } } static void display_history_based_perf_models(FILE *gnuplot_file, struct starpu_perfmodel *model, enum starpu_perfmodel_archtype arch1, enum starpu_perfmodel_archtype arch2, int *first) { char *command; FILE *datafile; unsigned arch; struct starpu_perfmodel_history_list *ptr; char arch_name[32]; int col; size_t len; unsigned long last, minimum = 0; len = 10 + strlen(avg_file_name) + 1; command = (char *) malloc(len); datafile = fopen(avg_file_name, "w"); free(command); col = 2; unsigned implid; for (arch = arch1; arch < arch2; arch++) { for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++) { struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[arch][implid]; starpu_perfmodel_get_arch_name((enum starpu_perfmodel_archtype) arch, arch_name, 32, implid); //ptrs[arch-arch1][implid] = ptr[arch-arch1][implid] = arch_model->list; if (arch_model->list) { print_comma(gnuplot_file, first); fprintf(gnuplot_file, "\"%s\" using 1:%d:%d with errorlines title \"Average %s\"", avg_file_name, col, col+1, arch_name); col += 2; } } } while (1) { last = minimum; minimum = ULONG_MAX; /* Get the next minimum */ for (arch = arch1; arch < arch2; arch++) for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++) { struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[arch][implid]; for (ptr = arch_model->list; ptr; ptr = ptr->next) { unsigned long size = ptr->entry->size; if (size > last && size < minimum) minimum = size; } } if (minimum == ULONG_MAX) break; fprintf(stderr, "%lu ", minimum); fprintf(datafile, "%-15lu ", minimum); for (arch = arch1; arch < arch2; arch++) { for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++) { struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[arch][implid]; for (ptr = arch_model->list; ptr; ptr = ptr->next) { struct starpu_perfmodel_history_entry *entry = ptr->entry; if (entry->size == minimum) { if (gflops) fprintf(datafile, "\t%-15le\t%-15le", entry->flops / (entry->mean * 1000), entry->flops / ((entry->mean + entry->deviation) * 1000) - entry->flops / (entry->mean * 1000) ); else fprintf(datafile, "\t%-15le\t%-15le", 0.001*entry->mean, 0.001*entry->deviation); break; } } if (!ptr && arch_model->list) /* No value for this arch. */ fprintf(datafile, "\t\"\"\t\"\""); } } fprintf(datafile, "\n"); } fprintf(stderr, "\n"); fclose(datafile); } static void display_perf_models(FILE *gnuplot_file, struct starpu_perfmodel *model, enum starpu_perfmodel_archtype arch1, enum starpu_perfmodel_archtype arch2, int *first) { unsigned arch; unsigned implid; for (arch = arch1; arch < arch2; arch++) { for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++) { display_perf_model(gnuplot_file, model, (enum starpu_perfmodel_archtype) arch, first, implid); } } display_history_based_perf_models(gnuplot_file, model, arch1, arch2, first); } #ifdef STARPU_USE_FXT static void dump_data_file(FILE *data_file) { memset(archtype_is_found, 0, STARPU_NARCH_VARIATIONS*sizeof(int)); int i; for (i = 0; i < options.dumped_codelets_count; i++) { /* Dump only if the symbol matches user's request */ if (strncmp(dumped_codelets[i].symbol, symbol, (FXT_MAX_PARAMS - 4)*sizeof(unsigned long)-1) == 0) { enum starpu_perfmodel_archtype archtype = dumped_codelets[i].archtype; archtype_is_found[archtype] = 1; size_t size = dumped_codelets[i].size; float time = dumped_codelets[i].time; fprintf(data_file, "%d %f %f\n", archtype, (float)size, time); } } } #endif static void display_selected_models(FILE *gnuplot_file, struct starpu_perfmodel *model) { fprintf(gnuplot_file, "#!/usr/bin/gnuplot -persist\n"); fprintf(gnuplot_file, "\n"); fprintf(gnuplot_file, "set term postscript eps enhanced color\n"); fprintf(gnuplot_file, "set output \"starpu_%s.eps\"\n", symbol); fprintf(gnuplot_file, "set title \"Model for codelet %s\"\n", symbol); fprintf(gnuplot_file, "set xlabel \"Total data size\"\n"); if (gflops) fprintf(gnuplot_file, "set ylabel \"GFlops\"\n"); else fprintf(gnuplot_file, "set ylabel \"Time (ms)\"\n"); fprintf(gnuplot_file, "\n"); fprintf(gnuplot_file, "set key top left\n"); fprintf(gnuplot_file, "set logscale x\n"); fprintf(gnuplot_file, "set logscale y\n"); fprintf(gnuplot_file, "\n"); /* If no input data is given to gnuplot, we at least need to specify an * arbitrary range. */ if (no_fxt_file) fprintf(gnuplot_file, "set xrange [1:10**9]\n\n"); int first = 1; fprintf(gnuplot_file, "plot\t"); if (archname == NULL) { /* display all architectures */ display_perf_models(gnuplot_file, model, (enum starpu_perfmodel_archtype) 0, (enum starpu_perfmodel_archtype) STARPU_NARCH_VARIATIONS, &first); } else { if (strcmp(archname, "cpu") == 0) { unsigned impl; for (impl = 0; impl < STARPU_MAXIMPLEMENTATIONS; impl++) { display_perf_model(gnuplot_file, model, STARPU_CPU_DEFAULT, &first, impl); } return; } int k; if (sscanf(archname, "cpu:%d", &k) == 1) { /* For combined CPU workers */ if ((k < 1) || (k > STARPU_MAXCPUS)) { fprintf(stderr, "Invalid CPU size\n"); exit(-1); } display_perf_models(gnuplot_file, model, (enum starpu_perfmodel_archtype) (STARPU_CPU_DEFAULT + k - 1), (enum starpu_perfmodel_archtype) (STARPU_CPU_DEFAULT + k), &first); return; } if (strcmp(archname, "cuda") == 0) { display_perf_models(gnuplot_file, model, STARPU_CUDA_DEFAULT, (enum starpu_perfmodel_archtype) (STARPU_CUDA_DEFAULT + STARPU_MAXCUDADEVS), &first); return; } /* There must be a cleaner way ! */ int gpuid; int nmatched; nmatched = sscanf(archname, "cuda_%d", &gpuid); if (nmatched == 1) { int archid = STARPU_CUDA_DEFAULT+ gpuid; if (archid < STARPU_OPENCL_DEFAULT) { display_perf_models(gnuplot_file, model, (enum starpu_perfmodel_archtype) archid, (enum starpu_perfmodel_archtype) (archid + 1), &first); return; } else { fprintf(stderr, "Invalid CUDA device %d (last valid one is %d)\n", gpuid, STARPU_MAXCUDADEVS-1); exit(-1); } } if (strcmp(archname, "opencl") == 0) { display_perf_models(gnuplot_file, model, STARPU_OPENCL_DEFAULT, (enum starpu_perfmodel_archtype) (STARPU_OPENCL_DEFAULT + STARPU_MAXOPENCLDEVS), &first); return; } /* There must be a cleaner way ! */ nmatched = sscanf(archname, "opencl_%d", &gpuid); if (nmatched == 1) { int archid = STARPU_OPENCL_DEFAULT+ gpuid; if (archid < STARPU_NARCH_VARIATIONS) { display_perf_models(gnuplot_file, model, (enum starpu_perfmodel_archtype) archid, (enum starpu_perfmodel_archtype) (archid + 1), &first); return; } else { fprintf(stderr, "Invalid OpenCL device %d (last valid one is %d)\n", gpuid, STARPU_MAXOPENCLDEVS-1); exit(-1); } } fprintf(stderr, "Unknown architecture requested, aborting.\n"); exit(-1); } } int main(int argc, char **argv) { int ret; struct starpu_perfmodel model; #ifdef __MINGW32__ WSADATA wsadata; WSAStartup(MAKEWORD(1,0), &wsadata); #endif parse_args(argc, argv); if (list) { ret = starpu_perfmodel_list(stdout); if (ret) { fprintf(stderr, "The performance model directory is invalid\n"); return 1; } return 0; } /* Load the performance model associated to the symbol */ ret = starpu_perfmodel_load_symbol(symbol, &model); if (ret == 1) { fprintf(stderr, "The performance model for the symbol <%s> could not be loaded\n", symbol); return 1; } /* If some FxT input was specified, we put the points on the graph */ #ifdef STARPU_USE_FXT if (!no_fxt_file) { starpu_fxt_generate_trace(&options); snprintf(data_file_name, 256, "starpu_%s.data", symbol); FILE *data_file = fopen(data_file_name, "w+"); STARPU_ASSERT(data_file); dump_data_file(data_file); fclose(data_file); } #endif snprintf(gnuplot_file_name, 256, "starpu_%s.gp", symbol); snprintf(avg_file_name, 256, "starpu_%s_avg.data", symbol); FILE *gnuplot_file = fopen(gnuplot_file_name, "w+"); STARPU_ASSERT(gnuplot_file); display_selected_models(gnuplot_file, &model); fclose(gnuplot_file); /* Retrieve the current mode of the gnuplot executable */ struct stat sb; ret = stat(gnuplot_file_name, &sb); if (ret) { perror("stat"); STARPU_ABORT(); } /* Make the gnuplot scrit executable for the owner */ ret = chmod(gnuplot_file_name, sb.st_mode|S_IXUSR); if (ret) { perror("chmod"); STARPU_ABORT(); } _STARPU_DISP("Gnuplot file <%s> generated\n", gnuplot_file_name); return 0; }