123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193 |
- /* StarPU --- Runtime system for heterogeneous multicore architectures.
- *
- * Copyright (C) 2010-2014,2016,2017 Université de Bordeaux
- * Copyright (C) 2010,2011,2013,2015,2017,2019 CNRS
- * Copyright (C) 2016 Inria
- *
- * StarPU is free software; you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation; either version 2.1 of the License, or (at
- * your option) any later version.
- *
- * StarPU is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- *
- * See the GNU Lesser General Public License in COPYING.LGPL for more details.
- */
- #ifndef __STARPU_PROFILING_H__
- #define __STARPU_PROFILING_H__
/**
   @defgroup API_Profiling Profiling
   @{
*/
- #include <starpu.h>
- #include <errno.h>
- #include <time.h>
- #ifdef __cplusplus
- extern "C"
- {
- #endif
/**
   Profiling status value 0.
   NOTE(review): presumably the "off" argument for
   starpu_profiling_status_set() -- confirm against the implementation.
*/
#define STARPU_PROFILING_DISABLE 0

/**
   Profiling status value 1.
   NOTE(review): presumably the "on" argument for
   starpu_profiling_status_set() -- confirm against the implementation.
*/
#define STARPU_PROFILING_ENABLE 1
/**
   Profiling record attached to a single task: a start/end timestamp pair
   for several stages, the id of a worker, and a few counters.

   NOTE(review): the code that fills this structure is not part of this
   header, so the per-field notes below merely restate the field names --
   confirm units and time origin against the runtime.
*/
struct starpu_profiling_task_info
{
	/** Task submission timestamp. */
	struct timespec submit_time;

	/** Start of the "push" stage. */
	struct timespec push_start_time;
	/** End of the "push" stage. */
	struct timespec push_end_time;

	/** Start of the "pop" stage. */
	struct timespec pop_start_time;
	/** End of the "pop" stage. */
	struct timespec pop_end_time;

	/** Start of data acquisition. */
	struct timespec acquire_data_start_time;
	/** End of data acquisition. */
	struct timespec acquire_data_end_time;

	/** Start timestamp (presumably of the task execution itself). */
	struct timespec start_time;
	/** End timestamp (presumably of the task execution itself). */
	struct timespec end_time;

	/** Start of data release. */
	struct timespec release_data_start_time;
	/** End of data release. */
	struct timespec release_data_end_time;

	/** Start of the callback. */
	struct timespec callback_start_time;
	/** End of the callback. */
	struct timespec callback_end_time;

	/* TODO add expected length, expected start/end ? */

	/** Worker identifier (presumably the worker that ran the task). */
	int workerid;

	/** Used cycle count. */
	uint64_t used_cycles;
	/** Stall cycle count. */
	uint64_t stall_cycles;
	/** Energy consumed (unit not visible in this header). */
	double energy_consumed;
};
/**
   Profiling record for one worker: a few time values, a task counter and
   some hardware/energy counters.

   NOTE(review): the code that fills this structure is not part of this
   header, so the per-field notes below merely restate the field names --
   confirm units and semantics against the runtime.
*/
struct starpu_profiling_worker_info
{
	/** Start timestamp (presumably of the profiling measurement). */
	struct timespec start_time;
	/** Total time. */
	struct timespec total_time;
	/** Time spent executing. */
	struct timespec executing_time;
	/** Time spent sleeping. */
	struct timespec sleeping_time;

	/** Number of executed tasks. */
	int executed_tasks;

	/** Used cycle count. */
	uint64_t used_cycles;
	/** Stall cycle count. */
	uint64_t stall_cycles;
	/** Energy consumed (unit not visible in this header). */
	double energy_consumed;

	/** Floating-point operation figure (exact meaning not visible here). */
	double flops;
};
/**
   Profiling record for one bus: two time values plus byte and transfer
   counters.

   NOTE(review): the code that fills this structure is not part of this
   header, so the per-field notes below merely restate the field names --
   confirm against the runtime.
*/
struct starpu_profiling_bus_info
{
	/** Start timestamp (presumably of the profiling measurement). */
	struct timespec start_time;
	/** Total time. */
	struct timespec total_time;
	/** Number of bytes transferred. */
	long long transferred_bytes;
	/** Number of transfers. */
	int transfer_count;
};
/*
 * NOTE(review): only the prototypes are visible in this header; the
 * summaries below are inferred from the function names and should be
 * confirmed against the implementation.
 */

/**
   Presumably (re)initializes the profiling state.
*/
void starpu_profiling_init(void);

/**
   Presumably sets an identifier used by the profiling layer to \p new_id.
*/
void starpu_profiling_set_id(int new_id);

/**
   Presumably sets the profiling status to \p status (see
   ::STARPU_PROFILING_ENABLE and ::STARPU_PROFILING_DISABLE).
   The meaning of the returned int is not visible here -- TODO confirm.
*/
int starpu_profiling_status_set(int status);

/**
   Returns the current profiling status as an int.
*/
int starpu_profiling_status_get(void);
#ifdef BUILDING_STARPU
#include <common/utils.h>
#if defined(__GNUC__)
/*
 * When StarPU itself is being built with a GNU-compatible compiler,
 * starpu_profiling_status_get() is shadowed by a statement-expression macro
 * that reads the _starpu_profiling variable directly instead of going
 * through a function call.
 *
 * The read is bracketed by ANNOTATE_HAPPENS_AFTER / ANNOTATE_HAPPENS_BEFORE
 * on the variable's address; the order of the three statements is kept
 * exactly as is.
 * NOTE(review): the ANNOTATE_* macros are presumably race-detector
 * annotations provided by <common/utils.h> -- confirm.
 */
extern int _starpu_profiling;
#define starpu_profiling_status_get() ({ \
	int __ret; \
	ANNOTATE_HAPPENS_AFTER(&_starpu_profiling); \
	__ret = _starpu_profiling; \
	ANNOTATE_HAPPENS_BEFORE(&_starpu_profiling); \
	__ret; \
})
#endif /* __GNUC__ */
#endif /* BUILDING_STARPU */
/*
 * NOTE(review): only the prototypes are visible in this header; the
 * summaries below are inferred from the function and parameter names and
 * should be confirmed against the implementation (in particular the
 * meaning of every int return value).
 */

/**
   Presumably fills \p worker_info with the profiling data of worker
   \p workerid.
*/
int starpu_profiling_worker_get_info(int workerid, struct starpu_profiling_worker_info *worker_info);

/**
   Presumably returns the number of buses.
*/
int starpu_bus_get_count(void);

/**
   Presumably returns the id of the bus going from \p src to \p dst.
*/
int starpu_bus_get_id(int src, int dst);

/**
   Presumably returns the source end of bus \p busid.
*/
int starpu_bus_get_src(int busid);

/**
   Presumably returns the destination end of bus \p busid.
*/
int starpu_bus_get_dst(int busid);

/**
   Presumably records the "direct" flag \p direct for bus \p busid.
*/
void starpu_bus_set_direct(int busid, int direct);

/**
   Presumably returns the "direct" flag of bus \p busid.
*/
int starpu_bus_get_direct(int busid);

/**
   Presumably records \p ngpus as the GPU count associated with bus
   \p busid.
*/
void starpu_bus_set_ngpus(int busid, int ngpus);

/**
   Presumably returns the GPU count associated with bus \p busid.
*/
int starpu_bus_get_ngpus(int busid);

/**
   Presumably fills \p bus_info with the profiling data of bus \p busid.
*/
int starpu_bus_get_profiling_info(int busid, struct starpu_profiling_bus_info *bus_info);
- /* Some helper functions to manipulate profiling API output */
- /* Reset timespec */
- static __starpu_inline void starpu_timespec_clear(struct timespec *tsp)
- {
- tsp->tv_sec = 0;
- tsp->tv_nsec = 0;
- }
/** Number of nanoseconds in one second. */
#define STARPU_NS_PER_S 1000000000
- /* Computes result = a + b */
- static __starpu_inline void starpu_timespec_add(struct timespec *a,
- struct timespec *b,
- struct timespec *result)
- {
- result->tv_sec = a->tv_sec + b->tv_sec;
- result->tv_nsec = a->tv_nsec + b->tv_nsec;
- if (result->tv_nsec >= STARPU_NS_PER_S)
- {
- ++(result)->tv_sec;
- result->tv_nsec -= STARPU_NS_PER_S;
- }
- }
- /* Computes res += b */
- static __starpu_inline void starpu_timespec_accumulate(struct timespec *result,
- struct timespec *a)
- {
- result->tv_sec += a->tv_sec;
- result->tv_nsec += a->tv_nsec;
- if (result->tv_nsec >= STARPU_NS_PER_S)
- {
- ++(result)->tv_sec;
- result->tv_nsec -= STARPU_NS_PER_S;
- }
- }
- /* Computes result = a - b */
- static __starpu_inline void starpu_timespec_sub(const struct timespec *a,
- const struct timespec *b,
- struct timespec *result)
- {
- result->tv_sec = a->tv_sec - b->tv_sec;
- result->tv_nsec = a->tv_nsec - b->tv_nsec;
- if ((result)->tv_nsec < 0)
- {
- --(result)->tv_sec;
- result->tv_nsec += STARPU_NS_PER_S;
- }
- }
/**
   Compares the timespecs pointed to by \p a and \p b with the comparison
   operator token \p CMP (e.g. <, >=, ==): the operator is applied to the
   seconds when they differ, and to the nanoseconds otherwise.

   \p a and \p b are each expanded twice, so they should be free of side
   effects.
*/
#define starpu_timespec_cmp(a, b, CMP) \
	(((a)->tv_sec != (b)->tv_sec) ? ((a)->tv_sec CMP (b)->tv_sec) : ((a)->tv_nsec CMP (b)->tv_nsec))
/*
 * NOTE(review): only the prototypes are visible in this header; the
 * summaries below are inferred from the function and parameter names and
 * should be confirmed against the implementation.
 */

/**
   Presumably returns the time elapsed between \p start and \p end, in
   microseconds.
*/
double starpu_timing_timespec_delay_us(struct timespec *start, struct timespec *end);

/**
   Presumably converts \p ts to microseconds.
*/
double starpu_timing_timespec_to_us(struct timespec *ts);

/**
   Presumably displays a summary of the bus profiling data.
*/
void starpu_profiling_bus_helper_display_summary(void);

/**
   Presumably displays a summary of the worker profiling data.
*/
void starpu_profiling_worker_helper_display_summary(void);
- #ifdef __cplusplus
- }
- #endif
- /** @} */
- #endif /* __STARPU_PROFILING_H__ */
|