| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186 | /* StarPU --- Runtime system for heterogeneous multicore architectures. * * Copyright (C) 2010-2014, 2016-2017  Université de Bordeaux * Copyright (C) 2010, 2011, 2013  CNRS * * StarPU is free software; you can redistribute it and/or modify * it under the terms of the GNU Lesser General Public License as published by * the Free Software Foundation; either version 2.1 of the License, or (at * your option) any later version. * * StarPU is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. * * See the GNU Lesser General Public License in COPYING.LGPL for more details. */#ifndef __STARPU_PROFILING_H__#define __STARPU_PROFILING_H__#include <starpu.h>#include <errno.h>#include <time.h>#include <starpu_util.h>#ifdef __cplusplusextern "C"{#endif#define STARPU_PROFILING_DISABLE	0#define STARPU_PROFILING_ENABLE		1struct starpu_profiling_task_info{	struct timespec submit_time;	struct timespec push_start_time;	struct timespec push_end_time;	struct timespec pop_start_time;	struct timespec pop_end_time;	struct timespec acquire_data_start_time;	struct timespec acquire_data_end_time;	struct timespec start_time;	struct timespec end_time;	struct timespec release_data_start_time;	struct timespec release_data_end_time;	struct timespec callback_start_time;	struct timespec callback_end_time;	/* TODO add expected length, expected start/end ? */	int workerid;	uint64_t used_cycles;	uint64_t stall_cycles;	double energy_consumed;};struct starpu_profiling_worker_info{	struct timespec start_time;	struct timespec total_time;	struct timespec executing_time;	struct timespec sleeping_time;	int executed_tasks;	uint64_t used_cycles;	uint64_t stall_cycles;	double energy_consumed;	double flops;};struct starpu_profiling_bus_info{	struct timespec start_time;	struct timespec total_time;	int long long transferred_bytes;	int transfer_count;};void starpu_profiling_init(void);void starpu_profiling_set_id(int new_id);int starpu_profiling_status_set(int status);int starpu_profiling_status_get(void);#ifdef BUILDING_STARPU#include <common/utils.h>#ifdef __GNUC__extern int _starpu_profiling;#define starpu_profiling_status_get() ({ \	int __ret; \	ANNOTATE_HAPPENS_AFTER(&_starpu_profiling); \	__ret = _starpu_profiling; \	ANNOTATE_HAPPENS_BEFORE(&_starpu_profiling); \	__ret; \})#endif#endifint starpu_profiling_worker_get_info(int workerid, struct starpu_profiling_worker_info *worker_info);int starpu_bus_get_count(void);int starpu_bus_get_id(int src, int dst);int starpu_bus_get_src(int busid);int starpu_bus_get_dst(int busid);void starpu_bus_set_direct(int busid, int direct);int starpu_bus_get_direct(int busid);void starpu_bus_set_ngpus(int busid, int ngpus);int starpu_bus_get_ngpus(int busid);int starpu_bus_get_profiling_info(int busid, struct starpu_profiling_bus_info *bus_info);/* Some helper functions to manipulate profiling API output *//* Reset timespec */static __starpu_inline void starpu_timespec_clear(struct timespec *tsp){	tsp->tv_sec = 0;	tsp->tv_nsec = 0;}#define STARPU_NS_PER_S 1000000000/* Computes result = a + b */static __starpu_inline void starpu_timespec_add(struct timespec *a,						struct timespec *b,						struct timespec *result){	result->tv_sec = a->tv_sec + b->tv_sec;	result->tv_nsec = a->tv_nsec + b->tv_nsec;	if (result->tv_nsec >= STARPU_NS_PER_S)	{		++(result)->tv_sec;		result->tv_nsec -= STARPU_NS_PER_S;	}}/* Computes res += b */static __starpu_inline void starpu_timespec_accumulate(struct timespec *result,						       struct timespec *a){	result->tv_sec += a->tv_sec;	result->tv_nsec += a->tv_nsec;	if (result->tv_nsec >= STARPU_NS_PER_S)	{		++(result)->tv_sec;		result->tv_nsec -= STARPU_NS_PER_S;	}}/* Computes result = a - b */static __starpu_inline void starpu_timespec_sub(const struct timespec *a,						const struct timespec *b,						struct timespec *result){	result->tv_sec = a->tv_sec - b->tv_sec;	result->tv_nsec = a->tv_nsec - b->tv_nsec;	if ((result)->tv_nsec < 0)	{		--(result)->tv_sec;		result->tv_nsec += STARPU_NS_PER_S;	}}#define starpu_timespec_cmp(a, b, CMP)                          \	(((a)->tv_sec == (b)->tv_sec) ? ((a)->tv_nsec CMP (b)->tv_nsec) : ((a)->tv_sec CMP (b)->tv_sec))double starpu_timing_timespec_delay_us(struct timespec *start, struct timespec *end);double starpu_timing_timespec_to_us(struct timespec *ts);void starpu_profiling_bus_helper_display_summary(void);void starpu_profiling_worker_helper_display_summary(void);#ifdef __cplusplus}#endif#endif /* __STARPU_PROFILING_H__ */
 |