| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710 | /* StarPU --- Runtime system for heterogeneous multicore architectures. * * Copyright (C) 2011-2013  Université de Bordeaux 1 * Copyright (C) 2011, 2012, 2013  Centre National de la Recherche Scientifique * Copyright (C) 2011  Télécom-SudParis * * StarPU is free software; you can redistribute it and/or modify * it under the terms of the GNU Lesser General Public License as published by * the Free Software Foundation; either version 2.1 of the License, or (at * your option) any later version. * * StarPU is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. * * See the GNU Lesser General Public License in COPYING.LGPL for more details. */#include <config.h>#include <assert.h>#include <unistd.h>#include <stdio.h>#include <sys/stat.h>#include <limits.h>#ifdef STARPU_USE_FXT#include <common/fxt.h>#endif#include <common/utils.h>#include <starpu.h>#include <core/perfmodel/perfmodel.h> // we need to browse the list associated to history-based models#include <core/workers.h>#ifdef __MINGW32__#include <windows.h>#endif#define PROGNAME "starpu_perfmodel_plot"/* display all available models */static int list = 0;/* what kernel ? */static char *symbol = NULL;/* which architecture ? (NULL = all)*/static char *archname = NULL;/* Unless a FxT file is specified, we just display the model */static int no_fxt_file = 1;static int gflops = 0;#ifdef STARPU_USE_FXTstatic struct starpu_fxt_codelet_event *dumped_codelets;static struct starpu_fxt_options options;#endif#ifdef STARPU_USE_FXTstatic int **archtype_is_found[STARPU_NARCH];static char data_file_name[256];#endifstatic char avg_file_name[256];static char gnuplot_file_name[256];static void usage(){	fprintf(stderr, "Draw a graph corresponding to the execution time of a \given perfmodel\n");	fprintf(stderr, "Usage: %s [ options ]\n", PROGNAME);        fprintf(stderr, "\n");	fprintf(stderr, "One must specify a symbol with the -s option or use -l\n");        fprintf(stderr, "Options:\n");        fprintf(stderr, "   -l                  display all available models\n");        fprintf(stderr, "   -s <symbol>         specify the symbol\n");	fprintf(stderr, "   -f                  draw GFlops instead of time\n");	fprintf(stderr, "   -i <Fxt files>      input FxT files generated by StarPU\n");        fprintf(stderr, "   -a <arch>           specify the architecture (e.g. cpu, cpu:x, cuda, cuda_d, opencl, opencl_d)\n");	fprintf(stderr, "   -h, --help          display this help and exit\n");	fprintf(stderr, "   -v, --version       output version information and exit\n\n");        fprintf(stderr, "Report bugs to <%s>.", PACKAGE_BUGREPORT);        fprintf(stderr, "\n");}static void parse_args(int argc, char **argv){#ifdef STARPU_USE_FXT	/* Default options */	starpu_fxt_options_init(&options);	options.out_paje_path = NULL;	options.activity_path = NULL;	options.distrib_time_path = NULL;	options.dag_path = NULL;	options.dumped_codelets = &dumped_codelets;#endif	/* We want to support arguments such as "-i trace_*" */	unsigned reading_input_filenames = 0;	int i;	for (i = 1; i < argc; i++)	{		if (strcmp(argv[i], "-s") == 0)		{			symbol = argv[++i];			continue;		}		if (strcmp(argv[i], "-i") == 0)		{			reading_input_filenames = 1;#ifdef STARPU_USE_FXT			options.filenames[options.ninputfiles++] = argv[++i];			no_fxt_file = 0;#else			fprintf(stderr, "Warning: FxT support was not enabled in StarPU: FxT traces will thus be ignored!\n");#endif			continue;		}		if (strcmp(argv[i], "-l") == 0)		{			list = 1;			continue;		}		if (strcmp(argv[i], "-f") == 0)		{			gflops = 1;			continue;		}		if (strcmp(argv[i], "-a") == 0)		{			archname = argv[++i];			continue;		}		if (strcmp(argv[i], "-h") == 0 ||		    strcmp(argv[i], "--help") == 0)		{			usage();			exit(EXIT_SUCCESS);		}		if (strcmp(argv[i], "-v") == 0 ||		    strcmp(argv[i], "--version") == 0)                {		        fputs(PROGNAME " (" PACKAGE_NAME ") " PACKAGE_VERSION "\n", stderr);			exit(EXIT_SUCCESS);		}		/* If the reading_input_filenames flag is set, and that the		 * argument does not match an option, we assume this may be		 * another filename */		if (reading_input_filenames)		{#ifdef STARPU_USE_FXT			options.filenames[options.ninputfiles++] = argv[i];#endif			continue;		}	}	if (!symbol && !list)	{		fprintf(stderr, "Incorrect usage, aborting\n");                usage();		exit(-1);	}}static void print_comma(FILE *gnuplot_file, int *first){	if (*first)	{		*first = 0;	}	else	{		fprintf(gnuplot_file, ",\\\n\t");	}}static void display_perf_model(FILE *gnuplot_file, struct starpu_perfmodel *model, struct starpu_perfmodel_arch* arch, int *first, unsigned nimpl){	char arch_name[256];	starpu_perfmodel_get_arch_name(arch, arch_name, 256, nimpl);	struct starpu_perfmodel_per_arch *arch_model =		&model->per_arch[arch->type][arch->devid][arch->ncore][nimpl];	if (arch_model->regression.valid || arch_model->regression.nl_valid)		fprintf(stderr,"Arch: %s\n", arch_name);#ifdef STARPU_USE_FXT	if (!gflops && !no_fxt_file && archtype_is_found[arch->type][arch->devid][arch->ncore] && nimpl == 0)	{		print_comma(gnuplot_file, first);		fprintf(gnuplot_file, "\"< grep -w \\^%d_%d_%d %s\" using 2:3 title \"Profiling %s\"", arch->type, arch->devid, arch->ncore, data_file_name, arch_name);	}#endif	/* Only display the regression model if we could actually build a model */	if (!gflops && arch_model->regression.valid && !arch_model->regression.nl_valid)	{		print_comma(gnuplot_file, first);		fprintf(stderr, "\tLinear: y = alpha size ^ beta\n");		fprintf(stderr, "\t\talpha = %e\n", arch_model->regression.alpha * 0.001);		fprintf(stderr, "\t\tbeta = %e\n", arch_model->regression.beta);		fprintf(gnuplot_file, "0.001 * %f * x ** %f title \"Linear Regression %s\"",			arch_model->regression.alpha, arch_model->regression.beta, arch_name);	}	if (!gflops && arch_model->regression.nl_valid)	{		print_comma(gnuplot_file, first);		fprintf(stderr, "\tNon-Linear: y = a size ^b + c\n");		fprintf(stderr, "\t\ta = %e\n", arch_model->regression.a * 0.001);		fprintf(stderr, "\t\tb = %e\n", arch_model->regression.b);		fprintf(stderr, "\t\tc = %e\n", arch_model->regression.c * 0.001);		fprintf(gnuplot_file, "0.001 * %f * x ** %f + 0.001 * %f title \"Non-Linear Regression %s\"",			arch_model->regression.a, arch_model->regression.b,  arch_model->regression.c, arch_name);	}}static void display_history_based_perf_models(FILE *gnuplot_file, struct starpu_perfmodel *model, enum starpu_worker_archtype* type, int* devid, int* ncore, int *first){	char *command;	FILE *datafile;	struct starpu_perfmodel_history_list *ptr;	char arch_name[32];	int col;	size_t len;	unsigned long last, minimum = 0;	len = 10 + strlen(avg_file_name) + 1;	command = (char *) malloc(len);	datafile = fopen(avg_file_name, "w");	free(command);	col = 2;	unsigned implid;	unsigned archmin, archmax, devmin, devmax, coremin, coremax;	if(type != NULL)	{		archmin = *type;		archmax = *type +1;		if(devid != NULL)		{			devmin = *devid;			devmax = *devid +1;			if(ncore != NULL)			{				coremin = *ncore;				coremax = *ncore +1;			}			else			{				coremin = 0;				coremax = 0;			}		}		else		{			devmin = 0;			devmax = 0;			coremin = 0;			coremax = 0;		}	}	else	{		archmin = 0;		archmax = STARPU_NARCH;		devmin = 0;		devmax = 0;		coremin = 0;		coremax = 0;	}	struct starpu_perfmodel_arch arch;	unsigned archtype, dev, core;	for (archtype = archmin; archtype < archmax; archtype++)	{		arch.type = archtype;		if(model->per_arch[archtype]!=NULL)		{			for(dev = devmin; model->per_arch[archtype][dev] != NULL && (devmax == 0 || dev < devmax);dev++)			{				arch.devid = dev;				for(core = coremin; model->per_arch[archtype][dev][core] != NULL && (coremax == 0 || core < coremax); core++)				{					arch.ncore = core;					for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++)					{						struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[archtype][dev][core][implid];						starpu_perfmodel_get_arch_name(&arch, arch_name, 32, implid);						//ptrs[arch-arch1][implid] = ptr[arch-arch1][implid] = arch_model->list;						if (arch_model->list)						{							print_comma(gnuplot_file, first);							fprintf(gnuplot_file, "\"%s\" using 1:%d:%d with errorlines title \"Average %s\"", avg_file_name, col, col+1, arch_name);							col += 2;						}					}				}			}		}	}	/* Dump entries in size order */	while (1)	{		last = minimum;		minimum = ULONG_MAX;		/* Get the next minimum */		for (archtype = archmin; archtype < archmax; archtype++)		{			if(model->per_arch[archtype]!=NULL)			{				for(dev = devmin; model->per_arch[archtype][dev] != NULL && (devmax == 0 || dev < devmax);dev++)				{					for(core = coremin; model->per_arch[archtype][dev][core] != NULL && (coremax == 0 || core < coremax); core++)									{						for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++)						{							struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[archtype][dev][core][implid];							for (ptr = arch_model->list; ptr; ptr = ptr->next)							{								unsigned long size = ptr->entry->size;								if (size > last && size < minimum)									minimum = size;							}						}					}				}			}		}		if (minimum == ULONG_MAX)			break;		fprintf(stderr, "%lu ", minimum);		fprintf(datafile, "%-15lu ", minimum);		for (archtype = archmin; archtype < archmax; archtype++)			if(model->per_arch[archtype]!=NULL)				for(dev = devmin; model->per_arch[archtype][dev] != NULL && (devmax == 0 || dev < devmax);dev++)					for(core = coremin; model->per_arch[archtype][dev][core] != NULL && (coremax == 0 || core < coremax); core++)						for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++)						{							struct starpu_perfmodel_per_arch *arch_model = &model->per_arch[archtype][dev][core][implid];							for (ptr = arch_model->list; ptr; ptr = ptr->next)							{								struct starpu_perfmodel_history_entry *entry = ptr->entry;								if (entry->size == minimum)								{									if (gflops)										fprintf(datafile, "\t%-15le\t%-15le", entry->flops / (entry->mean * 1000),												entry->flops / ((entry->mean + entry->deviation) * 1000) -												entry->flops / (entry->mean * 1000)										       );									else										fprintf(datafile, "\t%-15le\t%-15le", 0.001*entry->mean, 0.001*entry->deviation);									break;								}							}							if (!ptr && arch_model->list)								/* No value for this arch. */								fprintf(datafile, "\t\"\"\t\"\"");						}		fprintf(datafile, "\n");	}	fprintf(stderr, "\n");	fclose(datafile);}static void display_selected_arch_perf_models(FILE *gnuplot_file, struct starpu_perfmodel *model, struct starpu_perfmodel_arch* arch, int *first){	unsigned implid;	for (implid = 0; implid < STARPU_MAXIMPLEMENTATIONS; implid++)		display_perf_model(gnuplot_file, model, arch, first, implid);}static void display_selected_device_perf_models(FILE *gnuplot_file, struct starpu_perfmodel *model, enum starpu_worker_archtype archtype, int devid, int *first){	unsigned ncore;	struct starpu_perfmodel_arch arch;	arch.type = archtype;	arch.devid = devid;	for(ncore=0; model->per_arch[archtype][devid][ncore] != NULL; ncore++)	{		arch.ncore = ncore;		display_selected_arch_perf_models(gnuplot_file,model,&arch,first);	}}static void display_selected_archtype_perf_models(FILE *gnuplot_file, struct starpu_perfmodel *model, enum starpu_worker_archtype archtype, int *first){	unsigned devid;	for(devid=0; model->per_arch[archtype][devid] != NULL; devid++)		display_selected_device_perf_models(gnuplot_file,model,archtype,devid,first);}static void display_all_perf_models(FILE *gnuplot_file, struct starpu_perfmodel *model, int *first){	unsigned archtype;	for(archtype = 0; archtype < STARPU_NARCH; archtype++)		display_selected_archtype_perf_models(gnuplot_file,model,archtype,first);}#ifdef STARPU_USE_FXTstatic int ** init_archtype_is_found_per_arch(int maxdevid, unsigned* maxncore_table){	int devid, ncore;	int ** archtype_is_found_per_arch = malloc(sizeof(*archtype_is_found_per_arch)*(maxdevid+1));	archtype_is_found_per_arch[maxdevid] = NULL;	for(devid=0; devid<maxdevid; devid++)	{		int maxncore;		if(maxncore_table != NULL)			maxncore = maxncore_table[devid];		else			maxncore = 1;				archtype_is_found_per_arch[devid] = malloc(sizeof(*archtype_is_found_per_arch[devid])*(maxncore+1));		archtype_is_found_per_arch[devid][maxncore] = 0;		for(ncore=0; ncore<maxncore; ncore++)			archtype_is_found_per_arch[devid][ncore] = 0;	}	return archtype_is_found_per_arch;}static void init_archtype_is_found(struct starpu_perfmodel *model){	unsigned archtype, devid, ndevice, ncore, *maxncore;	for(archtype = 0; archtype < STARPU_NARCH; archtype++)	{			for(devid=0; model->per_arch[archtype][devid] != NULL; devid++);		ndevice = devid;		if(ndevice != 0)		{			maxncore = malloc(sizeof(*maxncore)*ndevice);			for(devid=0; devid < ndevice; devid++);			{							for(ncore=0; model->per_arch[archtype][devid][ncore] != NULL; ncore++);				maxncore[devid] = ncore;			}		}		else		{			maxncore = NULL;		}		archtype_is_found[archtype] = init_archtype_is_found_per_arch(ndevice,maxncore);		if(maxncore != NULL)			free(maxncore);	}}static void dump_data_file(FILE *data_file, struct starpu_perfmodel *model){	init_archtype_is_found(model);	int i;	for (i = 0; i < options.dumped_codelets_count; i++)	{		/* Dump only if the symbol matches user's request */		if (strncmp(dumped_codelets[i].symbol, symbol, (FXT_MAX_PARAMS - 4)*sizeof(unsigned long)-1) == 0)		{			struct starpu_perfmodel_arch* arch = &dumped_codelets[i].arch;			archtype_is_found[arch->type][arch->devid][arch->ncore] = 1;			size_t size = dumped_codelets[i].size;			float time = dumped_codelets[i].time;			fprintf(data_file, "%d_%d_%d	%f	%f\n", arch->type, arch->devid, arch->ncore, (float)size, time);		}	}}#endifstatic void display_selected_models(FILE *gnuplot_file, struct starpu_perfmodel *model){	fprintf(gnuplot_file, "#!/usr/bin/gnuplot -persist\n");	fprintf(gnuplot_file, "\n");	fprintf(gnuplot_file, "set term postscript eps enhanced color\n");	fprintf(gnuplot_file, "set output \"starpu_%s.eps\"\n", symbol);	fprintf(gnuplot_file, "set title \"Model for codelet %s\"\n", symbol);	fprintf(gnuplot_file, "set xlabel \"Total data size\"\n");	if (gflops)		fprintf(gnuplot_file, "set ylabel \"GFlops\"\n");	else		fprintf(gnuplot_file, "set ylabel \"Time (ms)\"\n");	fprintf(gnuplot_file, "\n");	fprintf(gnuplot_file, "set key top left\n");	fprintf(gnuplot_file, "set logscale x\n");	fprintf(gnuplot_file, "set logscale y\n");	fprintf(gnuplot_file, "\n");	/* If no input data is given to gnuplot, we at least need to specify an	 * arbitrary range. */	if (no_fxt_file)		fprintf(gnuplot_file, "set xrange [1:10**9]\n\n");	int first = 1;	fprintf(gnuplot_file, "plot\t");	struct starpu_perfmodel_arch arch;	struct _starpu_machine_config *conf = _starpu_get_machine_config();	if (archname == NULL)	{		/* display all architectures */		display_all_perf_models(gnuplot_file, model, &first);		display_history_based_perf_models(gnuplot_file, model, NULL, NULL, NULL, &first);	}	else	{		if (strcmp(archname, "cpu") == 0)		{						arch.type = STARPU_CPU_WORKER;			arch.devid = 1;			arch.ncore = 0;			display_selected_arch_perf_models(gnuplot_file, model, &arch, &first); 			display_history_based_perf_models(gnuplot_file, model,  &arch.type, &arch.devid, &arch.ncore, &first);			return;		}		unsigned k;		if (sscanf(archname, "cpu:%u", &k) == 1)		{			/* For combined CPU workers */			if ((k < 1) || (k > conf->topology.ncpus))			{				fprintf(stderr, "Invalid CPU size\n");				exit(-1);			}			arch.type = STARPU_CPU_WORKER;			arch.devid = 1;			arch.ncore = k - 1;			display_selected_arch_perf_models(gnuplot_file, model, &arch, &first); 			display_history_based_perf_models(gnuplot_file, model,  &arch.type, &arch.devid, &arch.ncore, &first);			return;		}		if (strcmp(archname, "cuda") == 0)		{			unsigned archtype = STARPU_CUDA_WORKER;			display_selected_archtype_perf_models(gnuplot_file, model, archtype, &first);			display_history_based_perf_models(gnuplot_file, model,  &archtype, NULL, NULL, &first);			return;		}		/* There must be a cleaner way ! */		unsigned gpuid;		int nmatched;		nmatched = sscanf(archname, "cuda_%u", &gpuid);		if (nmatched == 1)		{			if (gpuid < conf->topology.ncudagpus)			{				arch.type = STARPU_CUDA_WORKER;				arch.devid = gpuid;				arch.ncore = 0;				display_selected_arch_perf_models(gnuplot_file, model, &arch, &first);				display_history_based_perf_models(gnuplot_file, model,  &arch.type, &arch.devid, &arch.ncore, &first);				return;			}			else			{				fprintf(stderr, "Invalid CUDA device %d (last valid one is %d)\n", gpuid, STARPU_MAXCUDADEVS-1);				exit(-1);			}		}		if (strcmp(archname, "opencl") == 0)		{			unsigned archtype = STARPU_OPENCL_WORKER;			display_selected_archtype_perf_models(gnuplot_file, model, archtype, &first);			display_history_based_perf_models(gnuplot_file, model,  &archtype, NULL, NULL, &first);			return;		}		/* There must be a cleaner way ! */		nmatched = sscanf(archname, "opencl_%u", &gpuid);		if (nmatched == 1)		{			if (gpuid < conf->topology.nopenclgpus)			{				arch.type = STARPU_OPENCL_WORKER;				arch.devid = gpuid;				arch.ncore = 0;						display_selected_arch_perf_models(gnuplot_file, model, &arch, &first);				display_history_based_perf_models(gnuplot_file, model,  &arch.type, &arch.devid, &arch.ncore, &first);				return;			}			else			{				fprintf(stderr, "Invalid OpenCL device %d (last valid one is %d)\n", gpuid, STARPU_MAXOPENCLDEVS-1);				exit(-1);			}		}		fprintf(stderr, "Unknown architecture requested, aborting.\n");		exit(-1);	}}int main(int argc, char **argv){	int ret;	struct starpu_perfmodel model;#ifdef __MINGW32__	WSADATA wsadata;	WSAStartup(MAKEWORD(1,0), &wsadata);#endif	parse_args(argc, argv);        if (list)	{                ret = starpu_perfmodel_list(stdout);                if (ret)		{                        fprintf(stderr, "The performance model directory is invalid\n");                        return 1;                }		return 0;        }	/* Load the performance model associated to the symbol */	ret = starpu_perfmodel_load_symbol(symbol, &model);	if (ret == 1)	{		fprintf(stderr, "The performance model for the symbol <%s> could not be loaded\n", symbol);		return 1;	}	/* If some FxT input was specified, we put the points on the graph */#ifdef STARPU_USE_FXT	if (!no_fxt_file)	{		starpu_fxt_generate_trace(&options);		snprintf(data_file_name, 256, "starpu_%s.data", symbol);		FILE *data_file = fopen(data_file_name, "w+");		STARPU_ASSERT(data_file);		dump_data_file(data_file, &model);		fclose(data_file);	}#endif	snprintf(gnuplot_file_name, 256, "starpu_%s.gp", symbol);	snprintf(avg_file_name, 256, "starpu_%s_avg.data", symbol);	FILE *gnuplot_file = fopen(gnuplot_file_name, "w+");	STARPU_ASSERT(gnuplot_file);	display_selected_models(gnuplot_file, &model);	fclose(gnuplot_file);	/* Retrieve the current mode of the gnuplot executable */	struct stat sb;	ret = stat(gnuplot_file_name, &sb);	if (ret)	{		perror("stat");		STARPU_ABORT();	}	/* Make the gnuplot scrit executable for the owner */	ret = chmod(gnuplot_file_name, sb.st_mode|S_IXUSR);	if (ret)	{		perror("chmod");		STARPU_ABORT();	}	_STARPU_DISP("Gnuplot file <%s> generated\n", gnuplot_file_name);	return 0;}
 |