starpu_profiling.h 4.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174
  /* StarPU --- Runtime system for heterogeneous multicore architectures.
   *
   * Copyright (C) 2010-2013  Université de Bordeaux 1
   * Copyright (C) 2010, 2011, 2013  Centre National de la Recherche Scientifique
   *
   * StarPU is free software; you can redistribute it and/or modify
   * it under the terms of the GNU Lesser General Public License as published by
   * the Free Software Foundation; either version 2.1 of the License, or (at
   * your option) any later version.
   *
   * StarPU is distributed in the hope that it will be useful, but
   * WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
   *
   * See the GNU Lesser General Public License in COPYING.LGPL for more details.
   */
  17. #ifndef __STARPU_PROFILING_H__
  18. #define __STARPU_PROFILING_H__
  19. #include <starpu.h>
  20. #include <errno.h>
  21. #include <time.h>
  22. #ifdef __cplusplus
  23. extern "C"
  24. {
  25. #endif
  /*
   * Integer status values for the profiling API declared in this header.
   * Presumably the values accepted by starpu_profiling_status_set() and
   * reported by starpu_profiling_status_get() -- confirm against the
   * implementation.
   */
  #define STARPU_PROFILING_DISABLE	0
  #define STARPU_PROFILING_ENABLE		1
  /*
   * Per-task profiling record.
   *
   * The timestamps come in start/end pairs, one pair per stage named by the
   * member.  The descriptions below are derived from the member names; this
   * header does not show where the values are written, nor which clock or
   * reference point they use.
   *
   * uint64_t requires <stdint.h>; it is expected to arrive through <starpu.h>.
   */
  struct starpu_profiling_task_info
  {
      /* Time at which the task was submitted. */
      struct timespec submit_time;

      /* "push" stage (presumably handing the task to the scheduler). */
      struct timespec push_start_time;
      struct timespec push_end_time;

      /* "pop" stage (presumably a worker taking the task from the scheduler). */
      struct timespec pop_start_time;
      struct timespec pop_end_time;

      /* Data acquisition stage. */
      struct timespec acquire_data_start_time;
      struct timespec acquire_data_end_time;

      /* Execution of the task itself. */
      struct timespec start_time;
      struct timespec end_time;

      /* Data release stage. */
      struct timespec release_data_start_time;
      struct timespec release_data_end_time;

      /* Callback stage. */
      struct timespec callback_start_time;
      struct timespec callback_end_time;

      /* TODO add expected length, expected start/end ? */

      /* Identifier of the worker associated with the task. */
      int workerid;

      /* Cycle counters; availability and meaning depend on the backend. */
      uint64_t used_cycles;
      uint64_t stall_cycles;

      /* Power/energy figure for the task; the unit is not stated here. */
      double power_consumed;
  };
  /*
   * Per-worker profiling record, filled in through
   * starpu_profiling_worker_get_info().
   *
   * Descriptions are derived from the member names; the exact measurement
   * interval and clock are not visible in this header.
   */
  struct starpu_profiling_worker_info
  {
      /* Start of the measurement interval. */
      struct timespec start_time;
      /* Length of the measurement interval. */
      struct timespec total_time;
      /* Portion of the interval spent executing tasks. */
      struct timespec executing_time;
      /* Portion of the interval spent sleeping. */
      struct timespec sleeping_time;

      /* Number of tasks executed by the worker. */
      int executed_tasks;

      /* Cycle counters; availability and meaning depend on the backend. */
      uint64_t used_cycles;
      uint64_t stall_cycles;

      /* Power/energy figure for the worker; the unit is not stated here. */
      double power_consumed;
  };
  /*
   * Per-bus profiling record, filled in through
   * starpu_bus_get_profiling_info().
   *
   * Descriptions are derived from the member names; the exact measurement
   * interval and clock are not visible in this header.
   */
  struct starpu_profiling_bus_info
  {
      /* Start of the measurement interval. */
      struct timespec start_time;
      /* Length of the measurement interval. */
      struct timespec total_time;

      /* Amount of data moved over the bus, in bytes (same type as the
       * original "int long long" spelling). */
      long long transferred_bytes;

      /* Number of transfers performed over the bus. */
      int transfer_count;
  };
  /*
   * Profiling control entry points.  Their definitions are not part of this
   * header, so the notes below are assumptions to confirm against the
   * implementation.
   */

  /* Sets a profiling identifier to new_id (purpose not visible here). */
  void starpu_profiling_set_id(int new_id);

  /*
   * Changes the profiling status; `status` is presumably one of
   * STARPU_PROFILING_DISABLE / STARPU_PROFILING_ENABLE.  The meaning of the
   * int return value is not visible here.
   */
  int starpu_profiling_status_set(int status);

  /* Reports the current profiling status as an int. */
  int starpu_profiling_status_get(void);
  #ifdef BUILDING_STARPU
  /*
   * Only when BUILDING_STARPU is defined: replace calls to
   * starpu_profiling_status_get() with a macro that reads the
   * _starpu_profiling variable directly.
   *
   * The read is bracketed by ANNOTATE_HAPPENS_AFTER / ANNOTATE_HAPPENS_BEFORE
   * from <common/utils.h> (presumably race-detector annotations -- confirm).
   * The ({ ... }) form is a GNU statement expression, so this path needs a
   * compiler that supports that extension.
   */
  #include <common/utils.h>
  extern int _starpu_profiling;
  #define starpu_profiling_status_get() ({ \
      int __ret; \
      ANNOTATE_HAPPENS_AFTER(&_starpu_profiling); \
      __ret = _starpu_profiling; \
      ANNOTATE_HAPPENS_BEFORE(&_starpu_profiling); \
      __ret; \
  })
  #endif
  /*
   * Worker and bus profiling queries.  Their definitions are not part of this
   * header; the meaning of the int return values (status code vs. identifier)
   * should be confirmed against the implementation.
   */

  /* Fills *worker_info with the profiling record of worker `workerid`. */
  int starpu_profiling_worker_get_info(int workerid, struct starpu_profiling_worker_info *worker_info);

  /* Number of buses known to the runtime. */
  int starpu_bus_get_count(void);

  /* Identifier of the bus going from node `src` to node `dst`. */
  int starpu_bus_get_id(int src, int dst);

  /* Source end of bus `busid`. */
  int starpu_bus_get_src(int busid);

  /* Destination end of bus `busid`. */
  int starpu_bus_get_dst(int busid);

  /* Fills *bus_info with the profiling record of bus `busid`. */
  int starpu_bus_get_profiling_info(int busid, struct starpu_profiling_bus_info *bus_info);
  /* Some helper functions to manipulate profiling API output */

  /*
   * Resets a timespec to zero.
   *
   * tsp: timespec to clear; must not be NULL (it is dereferenced
   *      unconditionally).
   */
  static __starpu_inline void starpu_timespec_clear(struct timespec *tsp)
  {
      tsp->tv_sec = 0;
      tsp->tv_nsec = 0;
  }
  /*
   * Computes result = a + b.
   *
   * a, b:   operands; only read, hence const (consistent with
   *         starpu_timespec_sub).
   * result: receives the sum; may alias a or b, because each field is read
   *         before the matching field of result is written.
   *
   * Only a single carry from tv_nsec into tv_sec is performed, so both
   * operands are expected to be normalised (0 <= tv_nsec < 1000000000).
   */
  static __starpu_inline void starpu_timespec_add(const struct timespec *a,
                                                  const struct timespec *b,
                                                  struct timespec *result)
  {
      result->tv_sec = a->tv_sec + b->tv_sec;
      result->tv_nsec = a->tv_nsec + b->tv_nsec;

      if (result->tv_nsec >= 1000000000)
      {
          /* Carry one full second out of the nanosecond field. */
          ++result->tv_sec;
          result->tv_nsec -= 1000000000;
      }
  }
  /*
   * Computes result += a.
   *
   * result: running total, updated in place.
   * a:      amount to add; only read, hence const.
   *
   * Only a single carry from tv_nsec into tv_sec is performed, so both
   * values are expected to be normalised (0 <= tv_nsec < 1000000000).
   */
  static __starpu_inline void starpu_timespec_accumulate(struct timespec *result,
                                                         const struct timespec *a)
  {
      result->tv_sec += a->tv_sec;
      result->tv_nsec += a->tv_nsec;

      if (result->tv_nsec >= 1000000000)
      {
          /* Carry one full second out of the nanosecond field. */
          ++result->tv_sec;
          result->tv_nsec -= 1000000000;
      }
  }
  /*
   * Computes result = a - b.
   *
   * a, b:   operands; only read.
   * result: receives the difference; may alias a or b, because each field is
   *         read before the matching field of result is written.
   *
   * Only a single borrow from tv_sec is performed, so both operands are
   * expected to be normalised (0 <= tv_nsec < 1000000000).  When a is
   * earlier than b the result has a negative tv_sec and a non-negative
   * tv_nsec.
   */
  static __starpu_inline void starpu_timespec_sub(const struct timespec *a,
                                                  const struct timespec *b,
                                                  struct timespec *result)
  {
      result->tv_sec = a->tv_sec - b->tv_sec;
      result->tv_nsec = a->tv_nsec - b->tv_nsec;

      if (result->tv_nsec < 0)
      {
          /* Borrow one second to bring the nanosecond field back in range. */
          --result->tv_sec;
          result->tv_nsec += 1000000000;
      }
  }
  /*
   * Compares two timespecs with the relational operator CMP
   * (e.g. <, <=, ==, >=, >): the tv_sec fields are compared first, and the
   * tv_nsec fields only when the seconds are equal.
   *
   * a, b: pointers to struct timespec.  Each argument is expanded more than
   *       once, so do not pass expressions with side effects.
   * CMP:  a bare operator token, which is why this has to be a macro.
   */
  #define starpu_timespec_cmp(a, b, CMP) \
      (((a)->tv_sec == (b)->tv_sec) ? ((a)->tv_nsec CMP (b)->tv_nsec) : ((a)->tv_sec CMP (b)->tv_sec))
  /*
   * Conversion and reporting helpers.  Their definitions are not part of this
   * header; the notes below follow the names and should be confirmed against
   * the implementation.
   */

  /* Delay between *start and *end, presumably expressed in microseconds. */
  double starpu_timing_timespec_delay_us(struct timespec *start, struct timespec *end);

  /* Value of *ts, presumably converted to microseconds. */
  double starpu_timing_timespec_to_us(struct timespec *ts);

  /* Displays a summary of the bus profiling data. */
  void starpu_profiling_bus_helper_display_summary(void);

  /* Displays a summary of the worker profiling data. */
  void starpu_profiling_worker_helper_display_summary(void);
  138. #ifdef __cplusplus
  139. }
  140. #endif
  141. #endif /* __STARPU_PROFILING_H__ */