| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248 | 
							- /* StarPU --- Runtime system for heterogeneous multicore architectures.
 
-  *
 
-  * Copyright (C) 2019-2020  Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
 
-  *
 
-  * StarPU is free software; you can redistribute it and/or modify
 
-  * it under the terms of the GNU Lesser General Public License as published by
 
-  * the Free Software Foundation; either version 2.1 of the License, or (at
 
-  * your option) any later version.
 
-  *
 
-  * StarPU is distributed in the hope that it will be useful, but
 
-  * WITHOUT ANY WARRANTY; without even the implied warranty of
 
-  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 
-  *
 
-  * See the GNU Lesser General Public License in COPYING.LGPL for more details.
 
-  */
 
- #include <starpu.h>
 
- #include <assert.h>
 
- #include <inttypes.h>
 
- #define FPRINTF(ofile, fmt, ...) do { if (!getenv("STARPU_SSILENT")) {fprintf(ofile, fmt, ## __VA_ARGS__); }} while(0)
 
- /* global counters */
 
- static int id_g_total_submitted;
 
- static int id_g_peak_submitted;
 
- static int id_g_peak_ready;
 
- /* per worker counters */
 
- static int id_w_total_executed;
 
- static int id_w_cumul_execution_time;
 
- /* per_codelet counters */
 
- static int id_c_total_submitted;
 
- static int id_c_peak_submitted;
 
- static int id_c_peak_ready;
 
- static int id_c_total_executed;
 
- static int id_c_cumul_execution_time;
 
- void g_listener_cb(struct starpu_perf_counter_listener *listener, struct starpu_perf_counter_sample *sample, void *context)
 
- {
 
- 	(void) listener;
 
- 	(void) context;
 
- 	int64_t g_total_submitted = starpu_perf_counter_sample_get_int64_value(sample, id_g_total_submitted);
 
- 	int64_t g_peak_submitted = starpu_perf_counter_sample_get_int64_value(sample, id_g_peak_submitted);
 
- 	int64_t g_peak_ready = starpu_perf_counter_sample_get_int64_value(sample, id_g_peak_ready);
 
- 	printf("global: g_total_submitted = %"PRId64", g_peak_submitted = %"PRId64", g_peak_ready = %"PRId64"\n", g_total_submitted, g_peak_submitted, g_peak_ready);
 
- }
 
- void w_listener_cb(struct starpu_perf_counter_listener *listener, struct starpu_perf_counter_sample *sample, void *context)
 
- {
 
- 	(void) listener;
 
- 	(void) context;
 
- 	int workerid = starpu_worker_get_id();
 
- 	int64_t w_total_executed = starpu_perf_counter_sample_get_int64_value(sample, id_w_total_executed);
 
- 	double w_cumul_execution_time = starpu_perf_counter_sample_get_double_value(sample, id_w_cumul_execution_time);
 
- 	printf("worker[%d]: w_total_executed = %"PRId64", w_cumul_execution_time = %lf\n", workerid, w_total_executed, w_cumul_execution_time);
 
- }
 
- void c_listener_cb(struct starpu_perf_counter_listener *listener, struct starpu_perf_counter_sample *sample, void *context)
 
- {
 
- 	(void) listener;
 
- 	struct starpu_codelet *cl = context;
 
- 	int64_t c_total_submitted = starpu_perf_counter_sample_get_int64_value(sample, id_c_total_submitted);
 
- 	int64_t c_peak_submitted = starpu_perf_counter_sample_get_int64_value(sample, id_c_peak_submitted);
 
- 	int64_t c_peak_ready = starpu_perf_counter_sample_get_int64_value(sample, id_c_peak_ready);
 
- 	int64_t c_total_executed = starpu_perf_counter_sample_get_int64_value(sample, id_c_total_executed);
 
- 	double c_cumul_execution_time = starpu_perf_counter_sample_get_double_value(sample, id_c_cumul_execution_time);
 
- 	if (cl->name != NULL)
 
- 	{
 
- 		printf("codelet[%s]: c_total_submitted = %"PRId64", c_peak_submitted = %"PRId64", c_peak_ready = %"PRId64", c_total_executed = %"PRId64", c_cumul_execution_time = %lf\n", cl->name, c_total_submitted, c_peak_submitted, c_peak_ready, c_total_executed, c_cumul_execution_time);
 
- 	}
 
- 	else
 
- 	{
 
- 		printf("codelet[%p]: c_total_submitted = %"PRId64", c_peak_submitted = %"PRId64", c_peak_ready = %"PRId64", c_total_executed = %"PRId64", c_cumul_execution_time = %lf\n", cl, c_total_submitted, c_peak_submitted, c_peak_ready, c_total_executed, c_cumul_execution_time);
 
- 	}
 
- }
 
- void f(void *buffers[], void *cl_args)
 
- {
 
- 	int *int_vector = (int*)STARPU_VECTOR_GET_PTR(buffers[0]);
 
- 	int NX = (int)STARPU_VECTOR_GET_NX(buffers[0]);
 
- 	const int niters;
 
- 	starpu_codelet_unpack_args(cl_args, &niters);
 
- 	int i;
 
- 	for (i=0; i<niters; i++)
 
- 	{
 
- 		int_vector[i % NX] += i;
 
- 	}
 
- }
 
- struct starpu_codelet cl =
 
- {
 
- 	.cpu_funcs      = {f},
 
- 	.cpu_funcs_name = {"f"},
 
- 	.nbuffers       = 1,
 
- 	.name           = "perf_counter_f"
 
- };
 
- const enum starpu_perf_counter_scope g_scope = starpu_perf_counter_scope_global;
 
- const enum starpu_perf_counter_scope w_scope = starpu_perf_counter_scope_per_worker;
 
- const enum starpu_perf_counter_scope c_scope = starpu_perf_counter_scope_per_codelet;
 
- #define NVECTORS 5
 
- #define NTASKS 1000
 
- #define NITER 1000
 
- #define VECTOR_LEN 2
 
- int main(int argc, char **argv)
 
- {
 
- 	struct starpu_conf conf;
 
- 	starpu_conf_init(&conf);
 
- 	
 
- 	/* Start collecting perfomance counter right after initialization */
 
- 	conf.start_perf_counter_collection = 1;
 
- 	int ret;
 
- 	ret = starpu_init(&conf);
 
- 	if (ret == -ENODEV)
 
- 		return 77;
 
- 	STARPU_CHECK_RETURN_VALUE(ret, "starpu_init");
 
- 	struct starpu_perf_counter_set *g_set = starpu_perf_counter_set_alloc(g_scope);
 
- 	STARPU_ASSERT(g_set != NULL);
 
- 	struct starpu_perf_counter_set *w_set = starpu_perf_counter_set_alloc(w_scope);
 
- 	STARPU_ASSERT(w_set != NULL);
 
- 	struct starpu_perf_counter_set *c_set = starpu_perf_counter_set_alloc(c_scope);
 
- 	STARPU_ASSERT(c_set != NULL);
 
- 	id_g_total_submitted = starpu_perf_counter_name_to_id(g_scope, "starpu.task.g_total_submitted");
 
- 	STARPU_ASSERT(id_g_total_submitted != -1);
 
- 	id_g_peak_submitted = starpu_perf_counter_name_to_id(g_scope, "starpu.task.g_peak_submitted");
 
- 	STARPU_ASSERT(id_g_peak_submitted != -1);
 
- 	id_g_peak_ready = starpu_perf_counter_name_to_id(g_scope, "starpu.task.g_peak_ready");
 
- 	STARPU_ASSERT(id_g_peak_ready != -1);
 
- 	id_w_total_executed = starpu_perf_counter_name_to_id(w_scope, "starpu.task.w_total_executed");
 
- 	STARPU_ASSERT(id_w_total_executed != -1);
 
- 	id_w_cumul_execution_time = starpu_perf_counter_name_to_id(w_scope, "starpu.task.w_cumul_execution_time");
 
- 	STARPU_ASSERT(id_w_cumul_execution_time != -1);
 
- 	id_c_total_submitted = starpu_perf_counter_name_to_id(c_scope, "starpu.task.c_total_submitted");
 
- 	STARPU_ASSERT(id_c_total_submitted != -1);
 
- 	id_c_peak_submitted = starpu_perf_counter_name_to_id(c_scope, "starpu.task.c_peak_submitted");
 
- 	STARPU_ASSERT(id_c_peak_submitted != -1);
 
- 	id_c_peak_ready = starpu_perf_counter_name_to_id(c_scope, "starpu.task.c_peak_ready");
 
- 	STARPU_ASSERT(id_c_peak_ready != -1);
 
- 	id_c_total_executed = starpu_perf_counter_name_to_id(c_scope, "starpu.task.c_total_executed");
 
- 	STARPU_ASSERT(id_c_total_executed != -1);
 
- 	id_c_cumul_execution_time = starpu_perf_counter_name_to_id(c_scope, "starpu.task.c_cumul_execution_time");
 
- 	STARPU_ASSERT(id_c_cumul_execution_time != -1);
 
- 	starpu_perf_counter_set_enable_id(g_set, id_g_total_submitted);
 
- 	starpu_perf_counter_set_enable_id(g_set, id_g_peak_submitted);
 
- 	starpu_perf_counter_set_enable_id(g_set, id_g_peak_ready);
 
- 	starpu_perf_counter_set_enable_id(w_set, id_w_total_executed);
 
- 	starpu_perf_counter_set_enable_id(w_set, id_w_cumul_execution_time);
 
- 	starpu_perf_counter_set_enable_id(c_set, id_c_total_submitted);
 
- 	starpu_perf_counter_set_enable_id(c_set, id_c_peak_submitted);
 
- 	starpu_perf_counter_set_enable_id(c_set, id_c_peak_ready);
 
- 	starpu_perf_counter_set_enable_id(c_set, id_c_total_executed);
 
- 	starpu_perf_counter_set_enable_id(c_set, id_c_cumul_execution_time);
 
- 	struct starpu_perf_counter_listener * g_listener = starpu_perf_counter_listener_init(g_set, g_listener_cb, (void *)(uintptr_t)42);
 
- 	struct starpu_perf_counter_listener * w_listener = starpu_perf_counter_listener_init(w_set, w_listener_cb, (void *)(uintptr_t)17);
 
- 	struct starpu_perf_counter_listener * c_listener = starpu_perf_counter_listener_init(c_set, c_listener_cb, (void *)(uintptr_t)76);
 
- 	starpu_perf_counter_set_global_listener(g_listener);
 
- 	starpu_perf_counter_set_all_per_worker_listeners(w_listener);
 
- 	starpu_perf_counter_set_per_codelet_listener(&cl, c_listener);
 
- 	int* vector[NVECTORS];
 
- 	starpu_data_handle_t vector_h[NVECTORS];
 
- 	int v;
 
- 	for (v=0; v<NVECTORS; v++)
 
- 	{
 
- 		vector[v] = calloc(VECTOR_LEN, sizeof(*(vector[v])));
 
- 		STARPU_ASSERT(vector[v] != NULL);
 
- 		{
 
- 			int i;
 
- 			for (i=0; i<VECTOR_LEN; i++)
 
- 			{
 
- 				vector[v][i] = i;
 
- 			}
 
- 		}
 
- 		starpu_vector_data_register(&vector_h[v], STARPU_MAIN_RAM, (uintptr_t)vector[v], VECTOR_LEN, sizeof(*vector[v]));
 
- 	}
 
- 	{
 
- 		int i;
 
- 		for (i=0; i<NTASKS; i++)
 
- 		{
 
- 			v = i % NVECTORS;
 
- 			const int niter = NITER;
 
- 			starpu_insert_task(&cl,
 
- 					STARPU_RW, vector_h[v],
 
- 					STARPU_VALUE, &niter, sizeof(int),
 
- 					0);
 
- 		}
 
- 	}
 
- 	for (v=0; v<NVECTORS; v++)
 
- 	{
 
- 		starpu_data_unregister(vector_h[v]);
 
- 		free(vector[v]);
 
- 	}
 
- 	starpu_perf_counter_unset_per_codelet_listener(&cl);
 
- 	starpu_perf_counter_unset_all_per_worker_listeners();
 
- 	starpu_perf_counter_unset_global_listener();
 
- 	starpu_perf_counter_listener_exit(c_listener);
 
- 	starpu_perf_counter_listener_exit(w_listener);
 
- 	starpu_perf_counter_listener_exit(g_listener);
 
- 	starpu_perf_counter_set_disable_id(c_set, id_c_cumul_execution_time);
 
- 	starpu_perf_counter_set_disable_id(c_set, id_c_total_executed);
 
- 	starpu_perf_counter_set_disable_id(c_set, id_c_peak_ready);
 
- 	starpu_perf_counter_set_disable_id(c_set, id_c_peak_submitted);
 
- 	starpu_perf_counter_set_disable_id(c_set, id_c_total_submitted);
 
- 	starpu_perf_counter_set_disable_id(w_set, id_w_cumul_execution_time);
 
- 	starpu_perf_counter_set_disable_id(w_set, id_w_total_executed);
 
- 	starpu_perf_counter_set_disable_id(g_set, id_g_peak_ready);
 
- 	starpu_perf_counter_set_disable_id(g_set, id_g_peak_submitted);
 
- 	starpu_perf_counter_set_disable_id(g_set, id_g_total_submitted);
 
- 	starpu_perf_counter_set_free(c_set);
 
- 	c_set = NULL;
 
- 	starpu_perf_counter_set_free(w_set);
 
- 	w_set = NULL;
 
- 	starpu_perf_counter_set_free(g_set);
 
- 	g_set = NULL;
 
- 	starpu_shutdown();
 
- 	return 0;
 
- }
 
 
  |