fxt.h 44 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2009-2017 Université de Bordeaux
  4. * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2016, 2017 CNRS
  5. * Copyright (C) 2016 Inria
  6. *
  7. * StarPU is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU Lesser General Public License as published by
  9. * the Free Software Foundation; either version 2.1 of the License, or (at
  10. * your option) any later version.
  11. *
  12. * StarPU is distributed in the hope that it will be useful, but
  13. * WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  15. *
  16. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  17. */
  18. #ifndef __FXT_H__
  19. #define __FXT_H__
  20. #ifndef _GNU_SOURCE
  21. #define _GNU_SOURCE /* ou _BSD_SOURCE ou _SVID_SOURCE */
  22. #endif
  23. #include <string.h>
  24. #include <sys/types.h>
  25. #include <stdlib.h>
  26. #include <common/config.h>
  27. #ifdef HAVE_UNISTD_H
  28. #include <unistd.h>
  29. #endif
  30. #include <common/utils.h>
  31. #include <starpu.h>
/* Keys identifying the kind of a worker.  One of them is given as the
 * `workerkind` argument of the worker tracing macros of this file (for
 * instance _STARPU_FUT_CPU_KEY to _STARPU_TRACE_WORKER_INIT_START). */
#define _STARPU_FUT_APPS_KEY 0x100
#define _STARPU_FUT_CPU_KEY 0x101
#define _STARPU_FUT_CUDA_KEY 0x102
#define _STARPU_FUT_OPENCL_KEY 0x103
#define _STARPU_FUT_MIC_KEY 0x104
#define _STARPU_FUT_SCC_KEY 0x105
#define _STARPU_FUT_MPI_KEY 0x106
/* Event codes.  They are given as the CODE argument of the FUT_DO_PROBEn and
 * _STARPU_FUT_DO_PROBEnSTR probes by the _STARPU_TRACE_* macros of this file
 * (see e.g. _STARPU_TRACE_JOB_PUSH).
 *
 * The values are hexadecimal and neither contiguous nor strictly ordered:
 * 0x5109 is followed by 0x5110, and 0x5130 is defined before 0x512a.  When
 * adding a code, check for collisions by value rather than by position.
 * NOTE(review): existing values presumably have to remain stable for whatever
 * decodes the traces -- confirm before renumbering anything. */
#define _STARPU_FUT_WORKER_INIT_START 0x5100
#define _STARPU_FUT_WORKER_INIT_END 0x5101
#define _STARPU_FUT_START_CODELET_BODY 0x5102
#define _STARPU_FUT_END_CODELET_BODY 0x5103
#define _STARPU_FUT_JOB_PUSH 0x5104
#define _STARPU_FUT_JOB_POP 0x5105
#define _STARPU_FUT_UPDATE_TASK_CNT 0x5106
#define _STARPU_FUT_START_FETCH_INPUT_ON_TID 0x5107
#define _STARPU_FUT_END_FETCH_INPUT_ON_TID 0x5108
#define _STARPU_FUT_START_PUSH_OUTPUT_ON_TID 0x5109
#define _STARPU_FUT_END_PUSH_OUTPUT_ON_TID 0x5110
#define _STARPU_FUT_TAG 0x5111
#define _STARPU_FUT_TAG_DEPS 0x5112
#define _STARPU_FUT_TASK_DEPS 0x5113
#define _STARPU_FUT_DATA_COPY 0x5114
#define _STARPU_FUT_WORK_STEALING 0x5115
#define _STARPU_FUT_WORKER_DEINIT_START 0x5116
#define _STARPU_FUT_WORKER_DEINIT_END 0x5117
#define _STARPU_FUT_WORKER_SLEEP_START 0x5118
#define _STARPU_FUT_WORKER_SLEEP_END 0x5119
#define _STARPU_FUT_TASK_SUBMIT 0x511a
#define _STARPU_FUT_CODELET_DATA_HANDLE 0x511b
#define _STARPU_FUT_MODEL_NAME 0x511c
#define _STARPU_FUT_USER_DEFINED_START 0x5120
#define _STARPU_FUT_USER_DEFINED_END 0x5121
#define _STARPU_FUT_NEW_MEM_NODE 0x5122
#define _STARPU_FUT_START_CALLBACK 0x5123
#define _STARPU_FUT_END_CALLBACK 0x5124
#define _STARPU_FUT_TASK_DONE 0x5125
#define _STARPU_FUT_TAG_DONE 0x5126
#define _STARPU_FUT_START_ALLOC 0x5127
#define _STARPU_FUT_END_ALLOC 0x5128
#define _STARPU_FUT_START_ALLOC_REUSE 0x5129
#define _STARPU_FUT_END_ALLOC_REUSE 0x5130
#define _STARPU_FUT_USED_MEM 0x512a
#define _STARPU_FUT_START_MEMRECLAIM 0x5131
#define _STARPU_FUT_END_MEMRECLAIM 0x5132
#define _STARPU_FUT_START_DRIVER_COPY 0x5133
#define _STARPU_FUT_END_DRIVER_COPY 0x5134
#define _STARPU_FUT_START_DRIVER_COPY_ASYNC 0x5135
#define _STARPU_FUT_END_DRIVER_COPY_ASYNC 0x5136
#define _STARPU_FUT_START_PROGRESS_ON_TID 0x5137
#define _STARPU_FUT_END_PROGRESS_ON_TID 0x5138
#define _STARPU_FUT_USER_EVENT 0x5139
#define _STARPU_FUT_SET_PROFILING 0x513a
#define _STARPU_FUT_TASK_WAIT_FOR_ALL 0x513b
#define _STARPU_FUT_EVENT 0x513c
#define _STARPU_FUT_THREAD_EVENT 0x513d
#define _STARPU_FUT_CODELET_DETAILS 0x513e
#define _STARPU_FUT_CODELET_DATA 0x513f
#define _STARPU_FUT_LOCKING_MUTEX 0x5140
#define _STARPU_FUT_MUTEX_LOCKED 0x5141
#define _STARPU_FUT_UNLOCKING_MUTEX 0x5142
#define _STARPU_FUT_MUTEX_UNLOCKED 0x5143
#define _STARPU_FUT_TRYLOCK_MUTEX 0x5144
#define _STARPU_FUT_RDLOCKING_RWLOCK 0x5145
#define _STARPU_FUT_RWLOCK_RDLOCKED 0x5146
#define _STARPU_FUT_WRLOCKING_RWLOCK 0x5147
#define _STARPU_FUT_RWLOCK_WRLOCKED 0x5148
#define _STARPU_FUT_UNLOCKING_RWLOCK 0x5149
#define _STARPU_FUT_RWLOCK_UNLOCKED 0x514a
#define _STARPU_FUT_LOCKING_SPINLOCK 0x514b
#define _STARPU_FUT_SPINLOCK_LOCKED 0x514c
#define _STARPU_FUT_UNLOCKING_SPINLOCK 0x514d
#define _STARPU_FUT_SPINLOCK_UNLOCKED 0x514e
#define _STARPU_FUT_TRYLOCK_SPINLOCK 0x514f
#define _STARPU_FUT_COND_WAIT_BEGIN 0x5150
#define _STARPU_FUT_COND_WAIT_END 0x5151
#define _STARPU_FUT_MEMORY_FULL 0x5152
#define _STARPU_FUT_DATA_LOAD 0x5153
#define _STARPU_FUT_START_UNPARTITION_ON_TID 0x5154
#define _STARPU_FUT_END_UNPARTITION_ON_TID 0x5155
#define _STARPU_FUT_START_FREE 0x5156
#define _STARPU_FUT_END_FREE 0x5157
#define _STARPU_FUT_START_WRITEBACK 0x5158
#define _STARPU_FUT_END_WRITEBACK 0x5159
#define _STARPU_FUT_SCHED_COMPONENT_PUSH_PRIO 0x515a
#define _STARPU_FUT_SCHED_COMPONENT_POP_PRIO 0x515b
#define _STARPU_FUT_START_WRITEBACK_ASYNC 0x515c
#define _STARPU_FUT_END_WRITEBACK_ASYNC 0x515d
#define _STARPU_FUT_HYPERVISOR_BEGIN 0x5160
#define _STARPU_FUT_HYPERVISOR_END 0x5161
#define _STARPU_FUT_BARRIER_WAIT_BEGIN 0x5162
#define _STARPU_FUT_BARRIER_WAIT_END 0x5163
#define _STARPU_FUT_WORKER_SCHEDULING_START 0x5164
#define _STARPU_FUT_WORKER_SCHEDULING_END 0x5165
#define _STARPU_FUT_WORKER_SCHEDULING_PUSH 0x5166
#define _STARPU_FUT_WORKER_SCHEDULING_POP 0x5167
#define _STARPU_FUT_START_EXECUTING 0x5168
#define _STARPU_FUT_END_EXECUTING 0x5169
#define _STARPU_FUT_SCHED_COMPONENT_NEW 0x516a
#define _STARPU_FUT_SCHED_COMPONENT_CONNECT 0x516b
#define _STARPU_FUT_SCHED_COMPONENT_PUSH 0x516c
#define _STARPU_FUT_SCHED_COMPONENT_PULL 0x516d
#define _STARPU_FUT_TASK_SUBMIT_START 0x516e
#define _STARPU_FUT_TASK_SUBMIT_END 0x516f
#define _STARPU_FUT_TASK_BUILD_START 0x5170
#define _STARPU_FUT_TASK_BUILD_END 0x5171
#define _STARPU_FUT_TASK_MPI_DECODE_START 0x5172
#define _STARPU_FUT_TASK_MPI_DECODE_END 0x5173
#define _STARPU_FUT_TASK_MPI_PRE_START 0x5174
#define _STARPU_FUT_TASK_MPI_PRE_END 0x5175
#define _STARPU_FUT_TASK_MPI_POST_START 0x5176
#define _STARPU_FUT_TASK_MPI_POST_END 0x5177
#define _STARPU_FUT_TASK_WAIT_START 0x5178
#define _STARPU_FUT_TASK_WAIT_END 0x5179
#define _STARPU_FUT_TASK_WAIT_FOR_ALL_START 0x517a
#define _STARPU_FUT_TASK_WAIT_FOR_ALL_END 0x517b
#define _STARPU_FUT_HANDLE_DATA_REGISTER 0x517c
#define _STARPU_FUT_DATA_INVALIDATE 0x517d
#define _STARPU_FUT_START_FETCH_INPUT 0x517e
#define _STARPU_FUT_END_FETCH_INPUT 0x517f
  152. #ifdef STARPU_USE_FXT
  153. #include <fxt/fxt.h>
  154. #include <fxt/fut.h>
/* Some versions of FxT do not declare enable_fut_flush() in their headers:
 * declare it here when the function is available (HAVE_ENABLE_FUT_FLUSH) but
 * its declaration is not (HAVE_DECL_ENABLE_FUT_FLUSH is 0).
 * NOTE(review): both symbols presumably come from <common/config.h>. */
#ifdef HAVE_ENABLE_FUT_FLUSH
#if !HAVE_DECL_ENABLE_FUT_FLUSH
void enable_fut_flush();
#endif
#endif
/* Same fallback declaration for fut_set_filename(). */
#ifdef HAVE_FUT_SET_FILENAME
#if !HAVE_DECL_FUT_SET_FILENAME
void fut_set_filename(char *filename);
#endif
#endif
/* Start-up state: a flag together with the mutex and the condition variable
 * that _starpu_fxt_wait_initialisation() uses to wait for the flag to become
 * non-zero.  They are only declared here; their definitions live elsewhere. */
extern int _starpu_fxt_started;
extern starpu_pthread_mutex_t _starpu_fxt_started_mutex;
extern starpu_pthread_cond_t _starpu_fxt_started_cond;
  169. static inline void _starpu_fxt_wait_initialisation()
  170. {
  171. STARPU_PTHREAD_MUTEX_LOCK(&_starpu_fxt_started_mutex);
  172. while (!_starpu_fxt_started)
  173. STARPU_PTHREAD_COND_WAIT(&_starpu_fxt_started_cond, &_starpu_fxt_started_mutex);
  174. STARPU_PTHREAD_MUTEX_UNLOCK(&_starpu_fxt_started_mutex);
  175. }
/* Value recorded by most _STARPU_TRACE_* macros of this file to tell which
 * thread emitted an event.
 * NOTE(review): presumably the system identifier of the calling thread --
 * confirm against the implementation. */
long _starpu_gettid(void);
/* Initialize the FxT library.
 * NOTE(review): the unit of trace_buffer_size is not visible from this header. */
void _starpu_fxt_init_profiling(unsigned trace_buffer_size);
/* Stop the FxT library, and generate the trace file. */
void _starpu_stop_fxt_profiling(void);
/* Associate the current processing unit to the identifier of the LWP that runs
 * the worker.
 * NOTE(review): the unnamed argument is presumably the processing unit
 * identifier -- confirm and name it in the prototype. */
void _starpu_fxt_register_thread(unsigned);
/* Commit an event whose buffer was obtained with fut_getstampedbuffer().
 * When FxT defines FUT_NEEDS_COMMIT, this forwards `size` (the byte size that
 * was requested for the event) to fut_commitstampedbuffer(); otherwise it
 * expands to an empty statement and `size` is not evaluated. */
#ifdef FUT_NEEDS_COMMIT
#define _STARPU_FUT_COMMIT(size) fut_commitstampedbuffer(size)
#else
#define _STARPU_FUT_COMMIT(size) do { } while (0)
#endif
  189. #ifdef FUT_DO_PROBE1STR
  190. #define _STARPU_FUT_DO_PROBE1STR(CODE, P1, str) FUT_DO_PROBE1STR(CODE, P1, str)
  191. #else
  192. /* Sometimes we need something a little more specific than the wrappers from
  193. * FxT: these macro permit to put add an event with 3 (or 4) numbers followed
  194. * by a string. */
  195. #define _STARPU_FUT_DO_PROBE1STR(CODE, P1, str) \
  196. do { \
  197. if(fut_active) { \
  198. /* No more than FXT_MAX_PARAMS args are allowed */ \
  199. /* we add a \0 just in case ... */ \
  200. size_t len = STARPU_MIN(strlen(str)+1, (FXT_MAX_PARAMS - 1)*sizeof(unsigned long));\
  201. unsigned nbargs_str = (len + sizeof(unsigned long) - 1)/(sizeof(unsigned long));\
  202. unsigned nbargs = 1 + nbargs_str; \
  203. size_t total_len = FUT_SIZE(nbargs); \
  204. unsigned long *futargs = \
  205. fut_getstampedbuffer(FUT_CODE(CODE, nbargs), total_len);\
  206. *(futargs++) = (unsigned long)(P1); \
  207. snprintf((char *)futargs, len, "%s", str); \
  208. ((char *)futargs)[len - 1] = '\0'; \
  209. _STARPU_FUT_COMMIT(total_len); \
  210. } \
  211. } while (0);
  212. #endif
  213. #ifdef FUT_DO_PROBE2STR
  214. #define _STARPU_FUT_DO_PROBE2STR(CODE, P1, P2, str) FUT_DO_PROBE2STR(CODE, P1, P2, str)
  215. #else
  216. /* Sometimes we need something a little more specific than the wrappers from
  217. * FxT: these macro permit to put add an event with 3 (or 4) numbers followed
  218. * by a string. */
  219. #define _STARPU_FUT_DO_PROBE2STR(CODE, P1, P2, str) \
  220. do { \
  221. if(fut_active) { \
  222. /* No more than FXT_MAX_PARAMS args are allowed */ \
  223. /* we add a \0 just in case ... */ \
  224. size_t len = STARPU_MIN(strlen(str)+1, (FXT_MAX_PARAMS - 2)*sizeof(unsigned long));\
  225. unsigned nbargs_str = (len + sizeof(unsigned long) - 1)/(sizeof(unsigned long));\
  226. unsigned nbargs = 2 + nbargs_str; \
  227. size_t total_len = FUT_SIZE(nbargs); \
  228. unsigned long *futargs = \
  229. fut_getstampedbuffer(FUT_CODE(CODE, nbargs), total_len);\
  230. *(futargs++) = (unsigned long)(P1); \
  231. *(futargs++) = (unsigned long)(P2); \
  232. snprintf((char *)futargs, len, "%s", str); \
  233. ((char *)futargs)[len - 1] = '\0'; \
  234. _STARPU_FUT_COMMIT(total_len); \
  235. } \
  236. } while (0);
  237. #endif
  238. #ifdef FUT_DO_PROBE3STR
  239. #define _STARPU_FUT_DO_PROBE3STR(CODE, P1, P2, P3, str) FUT_DO_PROBE3STR(CODE, P1, P2, P3, str)
  240. #else
  241. #define _STARPU_FUT_DO_PROBE3STR(CODE, P1, P2, P3, str) \
  242. do { \
  243. if(fut_active) { \
  244. /* No more than FXT_MAX_PARAMS args are allowed */ \
  245. /* we add a \0 just in case ... */ \
  246. size_t len = STARPU_MIN(strlen(str)+1, (FXT_MAX_PARAMS - 3)*sizeof(unsigned long));\
  247. unsigned nbargs_str = (len + sizeof(unsigned long) - 1)/(sizeof(unsigned long));\
  248. unsigned nbargs = 3 + nbargs_str; \
  249. size_t total_len = FUT_SIZE(nbargs); \
  250. unsigned long *futargs = \
  251. fut_getstampedbuffer(FUT_CODE(CODE, nbargs), total_len);\
  252. *(futargs++) = (unsigned long)(P1); \
  253. *(futargs++) = (unsigned long)(P2); \
  254. *(futargs++) = (unsigned long)(P3); \
  255. snprintf((char *)futargs, len, "%s", str); \
  256. ((char *)futargs)[len - 1] = '\0'; \
  257. _STARPU_FUT_COMMIT(total_len); \
  258. } \
  259. } while (0);
  260. #endif
  261. #ifdef FUT_DO_PROBE4STR
  262. #define _STARPU_FUT_DO_PROBE4STR(CODE, P1, P2, P3, P4, str) FUT_DO_PROBE4STR(CODE, P1, P2, P3, P4, str)
  263. #else
  264. #define _STARPU_FUT_DO_PROBE4STR(CODE, P1, P2, P3, P4, str) \
  265. do { \
  266. if(fut_active) { \
  267. /* No more than FXT_MAX_PARAMS args are allowed */ \
  268. /* we add a \0 just in case ... */ \
  269. size_t len = STARPU_MIN(strlen(str)+1, (FXT_MAX_PARAMS - 4)*sizeof(unsigned long));\
  270. unsigned nbargs_str = (len + sizeof(unsigned long) - 1)/(sizeof(unsigned long));\
  271. unsigned nbargs = 4 + nbargs_str; \
  272. size_t total_len = FUT_SIZE(nbargs); \
  273. unsigned long *futargs = \
  274. fut_getstampedbuffer(FUT_CODE(CODE, nbargs), total_len);\
  275. *(futargs++) = (unsigned long)(P1); \
  276. *(futargs++) = (unsigned long)(P2); \
  277. *(futargs++) = (unsigned long)(P3); \
  278. *(futargs++) = (unsigned long)(P4); \
  279. snprintf((char *)futargs, len, "%s", str); \
  280. ((char *)futargs)[len - 1] = '\0'; \
  281. _STARPU_FUT_COMMIT(total_len); \
  282. } \
  283. } while (0);
  284. #endif
  285. #ifdef FUT_DO_PROBE5STR
  286. #define _STARPU_FUT_DO_PROBE5STR(CODE, P1, P2, P3, P4, P5, str) FUT_DO_PROBE5STR(CODE, P1, P2, P3, P4, P5, str)
  287. #else
  288. #define _STARPU_FUT_DO_PROBE5STR(CODE, P1, P2, P3, P4, P5, str) \
  289. do { \
  290. if(fut_active) { \
  291. /* No more than FXT_MAX_PARAMS args are allowed */ \
  292. /* we add a \0 just in case ... */ \
  293. size_t len = STARPU_MIN(strlen(str)+1, (FXT_MAX_PARAMS - 5)*sizeof(unsigned long));\
  294. unsigned nbargs_str = (len + sizeof(unsigned long) - 1)/(sizeof(unsigned long));\
  295. unsigned nbargs = 5 + nbargs_str; \
  296. size_t total_len = FUT_SIZE(nbargs); \
  297. unsigned long *futargs = \
  298. fut_getstampedbuffer(FUT_CODE(CODE, nbargs), total_len);\
  299. *(futargs++) = (unsigned long)(P1); \
  300. *(futargs++) = (unsigned long)(P2); \
  301. *(futargs++) = (unsigned long)(P3); \
  302. *(futargs++) = (unsigned long)(P4); \
  303. *(futargs++) = (unsigned long)(P5); \
  304. snprintf((char *)futargs, len, "%s", str); \
  305. ((char *)futargs)[len - 1] = '\0'; \
  306. _STARPU_FUT_COMMIT(total_len); \
  307. } \
  308. } while (0);
  309. #endif
  310. #ifdef FUT_DO_PROBE6STR
  311. #define _STARPU_FUT_DO_PROBE6STR(CODE, P1, P2, P3, P4, P5, P6, str) FUT_DO_PROBE6STR(CODE, P1, P2, P3, P4, P5, P6, str)
  312. #else
  313. #define _STARPU_FUT_DO_PROBE6STR(CODE, P1, P2, P3, P4, P5, P6, str) \
  314. do { \
  315. if(fut_active) { \
  316. /* No more than FXT_MAX_PARAMS args are allowed */ \
  317. /* we add a \0 just in case ... */ \
  318. size_t len = STARPU_MIN(strlen(str)+1, (FXT_MAX_PARAMS - 6)*sizeof(unsigned long));\
  319. unsigned nbargs_str = (len + sizeof(unsigned long) - 1)/(sizeof(unsigned long));\
  320. unsigned nbargs = 6 + nbargs_str; \
  321. size_t total_len = FUT_SIZE(nbargs); \
  322. unsigned long *futargs = \
  323. fut_getstampedbuffer(FUT_CODE(CODE, nbargs), total_len);\
  324. *(futargs++) = (unsigned long)(P1); \
  325. *(futargs++) = (unsigned long)(P2); \
  326. *(futargs++) = (unsigned long)(P3); \
  327. *(futargs++) = (unsigned long)(P4); \
  328. *(futargs++) = (unsigned long)(P5); \
  329. *(futargs++) = (unsigned long)(P6); \
  330. snprintf((char *)futargs, len, "%s", str); \
  331. ((char *)futargs)[len - 1] = '\0'; \
  332. _STARPU_FUT_COMMIT(total_len); \
  333. } \
  334. } while (0);
  335. #endif
  336. #ifdef FUT_DO_PROBE7STR
  337. #define _STARPU_FUT_DO_PROBE7STR(CODE, P1, P2, P3, P4, P5, P6, P7, str) FUT_DO_PROBE7STR(CODE, P1, P2, P3, P4, P5, P6, P7, str)
  338. #else
  339. #define _STARPU_FUT_DO_PROBE7STR(CODE, P1, P2, P3, P4, P5, P6, P7, str) \
  340. do { \
  341. if(fut_active) { \
  342. /* No more than FXT_MAX_PARAMS args are allowed */ \
  343. /* we add a \0 just in case ... */ \
  344. size_t len = STARPU_MIN(strlen(str)+1, (FXT_MAX_PARAMS - 7)*sizeof(unsigned long));\
  345. unsigned nbargs_str = (len + sizeof(unsigned long) - 1)/(sizeof(unsigned long));\
  346. unsigned nbargs = 7 + nbargs_str; \
  347. size_t total_len = FUT_SIZE(nbargs); \
  348. unsigned long *futargs = \
  349. fut_getstampedbuffer(FUT_CODE(CODE, nbargs), total_len);\
  350. *(futargs++) = (unsigned long)(P1); \
  351. *(futargs++) = (unsigned long)(P2); \
  352. *(futargs++) = (unsigned long)(P3); \
  353. *(futargs++) = (unsigned long)(P4); \
  354. *(futargs++) = (unsigned long)(P5); \
  355. *(futargs++) = (unsigned long)(P6); \
  356. *(futargs++) = (unsigned long)(P7); \
  357. snprintf((char *)futargs, len, "%s", str); \
  358. ((char *)futargs)[len - 1] = '\0'; \
  359. _STARPU_FUT_COMMIT(total_len); \
  360. } \
  361. } while (0);
  362. #endif
  363. #ifndef FUT_RAW_PROBE7
  364. #define FUT_RAW_PROBE7(CODE,P1,P2,P3,P4,P5,P6,P7) do { \
  365. if(fut_active) { \
  366. unsigned long *__args __attribute__((unused))= \
  367. fut_getstampedbuffer(CODE, \
  368. FUT_SIZE(7)); \
  369. *(__args++)=(unsigned long)(P1);*(__args++)=(unsigned long)(P2);*(__args++)=(unsigned long)(P3);*(__args++)=(unsigned long)(P4);*(__args++)=(unsigned long)(P5);*(__args++)=(unsigned long)(P6);*(__args++)=(unsigned long)(P7); \
  370. _STARPU_FUT_COMMIT(FUT_SIZE(7)); \
  371. } \
  372. } while (0)
  373. #endif
  374. #ifndef FUT_DO_PROBE7
  375. #define FUT_DO_PROBE7(CODE,P1,P2,P3,P4,P5,P6,P7) do { \
  376. FUT_RAW_PROBE7(FUT_CODE(CODE, 7),P1,P2,P3,P4,P5,P6,P7); \
  377. } while (0)
  378. #endif
/* Memory node creation and worker initialisation events.
 * workerkind is one of the worker kind keys, _STARPU_FUT_CPU_KEY for instance.
 * Note the parameter order: NEW_MEM_NODE and WORKER_INIT_START record
 * _starpu_gettid() last, WORKER_INIT_END records it first.
 * NOTE(review): these expansions end with ';', so a call written with its own
 * ';' yields an extra empty statement and cannot be the sole body of an
 * unbraced if/else. */
#define _STARPU_TRACE_NEW_MEM_NODE(nodeid) \
FUT_DO_PROBE2(_STARPU_FUT_NEW_MEM_NODE, nodeid, _starpu_gettid());
#define _STARPU_TRACE_WORKER_INIT_START(workerkind, workerid, devid, memnode, bindid, sync) \
FUT_DO_PROBE7(_STARPU_FUT_WORKER_INIT_START, workerkind, workerid, devid, memnode, bindid, sync, _starpu_gettid());
#define _STARPU_TRACE_WORKER_INIT_END(__workerid) \
FUT_DO_PROBE2(_STARPU_FUT_WORKER_INIT_END, _starpu_gettid(), (__workerid));
/* Record the beginning of the execution of `job` on worker `workerid`.
 *
 * Events emitted, in order:
 *  - _STARPU_FUT_START_CODELET_BODY with the job id, the scheduling context of
 *    the task, workerid and the memory node of workerid, followed either by 1
 *    and the task name, or by 0 when the job has no task name;
 *  - _STARPU_FUT_MODEL_NAME (job id, model name) when the job has a task name
 *    and a model name that differs from it;
 *  - when the task has a codelet, for each of its buffers:
 *    _STARPU_FUT_CODELET_DATA (workerid, description) if the handle's ops
 *    provide describe(), then _STARPU_FUT_CODELET_DATA_HANDLE (job id, handle,
 *    data size, access mode);
 *  - _STARPU_FUT_CODELET_DETAILS with the scheduling context, the job data
 *    size, the buffers footprint, flops / 1000, the tag id, workerid and the
 *    job id.
 *
 * `job` and `workerid` are evaluated several times: pass expressions without
 * side effects.  The locals `model_name` and `name` are not prefixed, so
 * argument expressions using these identifiers would refer to the locals.
 * NOTE(review): the expansion ends with `while(0);` -- with the caller's own
 * ';' this is two statements, which breaks an unbraced if/else. */
#define _STARPU_TRACE_START_CODELET_BODY(job, nimpl, perf_arch, workerid) \
do { \
const char *model_name = _starpu_job_get_model_name((job)), *name = _starpu_job_get_task_name((job)); \
if (name) \
{ \
/* we include the task name */ \
_STARPU_FUT_DO_PROBE5STR(_STARPU_FUT_START_CODELET_BODY, (job)->job_id, ((job)->task)->sched_ctx, workerid, starpu_worker_get_memory_node(workerid), 1, name); \
if (model_name && strcmp(model_name, name)) \
_STARPU_FUT_DO_PROBE1STR(_STARPU_FUT_MODEL_NAME, (job)->job_id, model_name); \
} \
else { \
FUT_DO_PROBE5(_STARPU_FUT_START_CODELET_BODY, (job)->job_id, ((job)->task)->sched_ctx, workerid, starpu_worker_get_memory_node(workerid), 0); \
} \
{ \
if ((job)->task->cl) \
{ \
const int __nbuffers = STARPU_TASK_GET_NBUFFERS((job)->task); \
char __buf[FXT_MAX_PARAMS*sizeof(long)]; \
int __i; \
for (__i = 0; __i < __nbuffers; __i++) \
{ \
starpu_data_handle_t __handle = STARPU_TASK_GET_HANDLE((job)->task, __i); \
void *__interface = _STARPU_TASK_GET_INTERFACES((job)->task)[__i]; \
if (__handle->ops->describe) \
{ \
__handle->ops->describe(__interface, __buf, sizeof(__buf)); \
_STARPU_FUT_DO_PROBE1STR(_STARPU_FUT_CODELET_DATA, workerid, __buf); \
} \
FUT_DO_PROBE4(_STARPU_FUT_CODELET_DATA_HANDLE, (job)->job_id, (__handle), _starpu_data_get_size(__handle), STARPU_TASK_GET_MODE((job)->task, __i)); \
} \
} \
const size_t __job_size = _starpu_job_get_data_size((job)->task->cl?(job)->task->cl->model:NULL, perf_arch, nimpl, (job)); \
const uint32_t __job_hash = _starpu_compute_buffers_footprint((job)->task->cl?(job)->task->cl->model:NULL, perf_arch, nimpl, (job));\
FUT_DO_PROBE7(_STARPU_FUT_CODELET_DETAILS, ((job)->task)->sched_ctx, __job_size, __job_hash, (job)->task->flops / 1000, (job)->task->tag_id, workerid, ((job)->job_id)); \
} \
} while(0);
/* Record the end of the execution of `job` on worker `workerid`:
 * _STARPU_FUT_END_CODELET_BODY with the job id, the job data size, the buffers
 * footprint and workerid, followed by the name of `perf_arch` as written by
 * starpu_perfmodel_get_arch_name() into a 32-byte buffer.
 *
 * The model given to the size/footprint helpers is the codelet's model, or
 * NULL when the task has no codelet.  `job` is evaluated several times.
 * NOTE(review): the expansion ends with `while(0);` -- with the caller's own
 * ';' this is two statements, which breaks an unbraced if/else. */
#define _STARPU_TRACE_END_CODELET_BODY(job, nimpl, perf_arch, workerid) \
do { \
const size_t job_size = _starpu_job_get_data_size((job)->task->cl?(job)->task->cl->model:NULL, perf_arch, nimpl, (job)); \
const uint32_t job_hash = _starpu_compute_buffers_footprint((job)->task->cl?(job)->task->cl->model:NULL, perf_arch, nimpl, (job));\
char _archname[32]=""; \
starpu_perfmodel_get_arch_name(perf_arch, _archname, 32, 0); \
_STARPU_FUT_DO_PROBE4STR(_STARPU_FUT_END_CODELET_BODY, (job)->job_id, (job_size), (job_hash), workerid, _archname); \
} while(0);
/* Execution, callback, job queue and data fetch/push events.  Unless noted,
 * each macro records its arguments followed by _starpu_gettid().
 * NOTE(review): every expansion here except _STARPU_TRACE_UPDATE_TASK_CNT ends
 * with ';'.  A call written with its own ';' then yields an extra empty
 * statement and cannot be the sole body of an unbraced if/else. */
#define _STARPU_TRACE_START_EXECUTING() \
FUT_DO_PROBE1(_STARPU_FUT_START_EXECUTING, _starpu_gettid());
#define _STARPU_TRACE_END_EXECUTING() \
FUT_DO_PROBE1(_STARPU_FUT_END_EXECUTING, _starpu_gettid());
#define _STARPU_TRACE_START_CALLBACK(job) \
FUT_DO_PROBE2(_STARPU_FUT_START_CALLBACK, job, _starpu_gettid());
#define _STARPU_TRACE_END_CALLBACK(job) \
FUT_DO_PROBE2(_STARPU_FUT_END_CALLBACK, job, _starpu_gettid());
#define _STARPU_TRACE_JOB_PUSH(task, prio) \
FUT_DO_PROBE3(_STARPU_FUT_JOB_PUSH, task, prio, _starpu_gettid());
#define _STARPU_TRACE_JOB_POP(task, prio) \
FUT_DO_PROBE3(_STARPU_FUT_JOB_POP, task, prio, _starpu_gettid());
#define _STARPU_TRACE_UPDATE_TASK_CNT(counter) \
FUT_DO_PROBE2(_STARPU_FUT_UPDATE_TASK_CNT, counter, _starpu_gettid())
/* The four macros below use the *_ON_TID event codes. */
#define _STARPU_TRACE_START_FETCH_INPUT(job) \
FUT_DO_PROBE2(_STARPU_FUT_START_FETCH_INPUT_ON_TID, job, _starpu_gettid());
#define _STARPU_TRACE_END_FETCH_INPUT(job) \
FUT_DO_PROBE2(_STARPU_FUT_END_FETCH_INPUT_ON_TID, job, _starpu_gettid());
#define _STARPU_TRACE_START_PUSH_OUTPUT(job) \
FUT_DO_PROBE2(_STARPU_FUT_START_PUSH_OUTPUT_ON_TID, job, _starpu_gettid());
#define _STARPU_TRACE_END_PUSH_OUTPUT(job) \
FUT_DO_PROBE2(_STARPU_FUT_END_PUSH_OUTPUT_ON_TID, job, _starpu_gettid());
/* The WORKER_ variants record the caller-provided `id` instead of
 * _starpu_gettid(). */
#define _STARPU_TRACE_WORKER_END_FETCH_INPUT(job, id) \
FUT_DO_PROBE2(_STARPU_FUT_END_FETCH_INPUT, job, id);
#define _STARPU_TRACE_WORKER_START_FETCH_INPUT(job, id) \
FUT_DO_PROBE2(_STARPU_FUT_START_FETCH_INPUT, job, id);
/* Tag and dependency events.  None of them records the calling thread, and
 * none of the expansions ends with ';'.
 * _STARPU_TRACE_TASK_DEPS takes two job pointers and records their job ids;
 * _STARPU_TRACE_GHOST_TASK_DEPS emits the same event code from two ids given
 * directly. */
#define _STARPU_TRACE_TAG(tag, job) \
FUT_DO_PROBE2(_STARPU_FUT_TAG, tag, (job)->job_id)
#define _STARPU_TRACE_TAG_DEPS(tag_child, tag_father) \
FUT_DO_PROBE2(_STARPU_FUT_TAG_DEPS, tag_child, tag_father)
#define _STARPU_TRACE_TASK_DEPS(job_prev, job_succ) \
FUT_DO_PROBE2(_STARPU_FUT_TASK_DEPS, (job_prev)->job_id, (job_succ)->job_id)
#define _STARPU_TRACE_GHOST_TASK_DEPS(ghost_prev_id, job_succ_id) \
FUT_DO_PROBE2(_STARPU_FUT_TASK_DEPS, (ghost_prev_id), (job_succ_id))
/* Record the termination of `job`: _STARPU_FUT_TASK_DONE with the job id,
 * _starpu_gettid() and the job's exclude_from_dag field, followed either by 1
 * and the task name, or by 0 when the job has no task name.
 *
 * Despite its name, the local `model_name` holds the result of
 * _starpu_job_get_task_name().  `job` is evaluated several times.
 * NOTE(review): the expansion ends with `while(0);` -- with the caller's own
 * ';' this is two statements, which breaks an unbraced if/else. */
#define _STARPU_TRACE_TASK_DONE(job) \
do { \
unsigned exclude_from_dag = (job)->exclude_from_dag; \
const char *model_name = _starpu_job_get_task_name((job)); \
if (model_name) \
{ \
_STARPU_FUT_DO_PROBE4STR(_STARPU_FUT_TASK_DONE, (job)->job_id, _starpu_gettid(), (long unsigned)exclude_from_dag, 1, model_name);\
} \
else { \
FUT_DO_PROBE4(_STARPU_FUT_TASK_DONE, (job)->job_id, _starpu_gettid(), (long unsigned)exclude_from_dag, 0);\
} \
} while(0);
/* Record the termination of `tag`: _STARPU_FUT_TAG_DONE with the tag id and
 * _starpu_gettid(), followed either by 1 and the task name of the tag's job,
 * or by 0 when that job has no task name.
 *
 * Despite its name, the local `model_name` holds the result of
 * _starpu_job_get_task_name().  The macro declares a local named `job`: a
 * `tag` argument expression that itself mentions `job` would refer to that
 * (not yet initialised) local.  `tag` is evaluated several times.
 * NOTE(review): the expansion ends with `while(0);` -- with the caller's own
 * ';' this is two statements, which breaks an unbraced if/else. */
#define _STARPU_TRACE_TAG_DONE(tag) \
do { \
struct _starpu_job *job = (tag)->job; \
const char *model_name = _starpu_job_get_task_name((job)); \
if (model_name) \
{ \
_STARPU_FUT_DO_PROBE3STR(_STARPU_FUT_TAG_DONE, (tag)->id, _starpu_gettid(), 1, model_name); \
} \
else { \
FUT_DO_PROBE3(_STARPU_FUT_TAG_DONE, (tag)->id, _starpu_gettid(), 0);\
} \
} while(0);
/* Data transfer and work stealing events.  They record exactly the arguments
 * they are given (no thread identifier), and none of the expansions ends
 * with ';'.
 * _STARPU_TRACE_START_DRIVER_COPY takes one more argument (handle) than
 * _STARPU_TRACE_END_DRIVER_COPY. */
#define _STARPU_TRACE_DATA_COPY(src_node, dst_node, size) \
FUT_DO_PROBE3(_STARPU_FUT_DATA_COPY, src_node, dst_node, size)
#define _STARPU_TRACE_START_DRIVER_COPY(src_node, dst_node, size, com_id, prefetch, handle) \
FUT_DO_PROBE6(_STARPU_FUT_START_DRIVER_COPY, src_node, dst_node, size, com_id, prefetch, handle)
#define _STARPU_TRACE_END_DRIVER_COPY(src_node, dst_node, size, com_id, prefetch) \
FUT_DO_PROBE5(_STARPU_FUT_END_DRIVER_COPY, src_node, dst_node, size, com_id, prefetch)
#define _STARPU_TRACE_START_DRIVER_COPY_ASYNC(src_node, dst_node) \
FUT_DO_PROBE2(_STARPU_FUT_START_DRIVER_COPY_ASYNC, src_node, dst_node)
#define _STARPU_TRACE_END_DRIVER_COPY_ASYNC(src_node, dst_node) \
FUT_DO_PROBE2(_STARPU_FUT_END_DRIVER_COPY_ASYNC, src_node, dst_node)
#define _STARPU_TRACE_WORK_STEALING(empty_q, victim_q) \
FUT_DO_PROBE2(_STARPU_FUT_WORK_STEALING, empty_q, victim_q)
/* Worker deinitialisation, scheduling and sleep events.  All of them record
 * _starpu_gettid(); _STARPU_TRACE_WORKER_DEINIT_END records workerkind first.
 * Except for _STARPU_TRACE_WORKER_DEINIT_END, these are object-like macros:
 * they are used without parentheses.
 * NOTE(review): these expansions end with ';', so a use written with its own
 * ';' yields an extra empty statement and cannot be the sole body of an
 * unbraced if/else. */
#define _STARPU_TRACE_WORKER_DEINIT_START \
FUT_DO_PROBE1(_STARPU_FUT_WORKER_DEINIT_START, _starpu_gettid());
#define _STARPU_TRACE_WORKER_DEINIT_END(workerkind) \
FUT_DO_PROBE2(_STARPU_FUT_WORKER_DEINIT_END, workerkind, _starpu_gettid());
#define _STARPU_TRACE_WORKER_SCHEDULING_START \
FUT_DO_PROBE1(_STARPU_FUT_WORKER_SCHEDULING_START, _starpu_gettid());
#define _STARPU_TRACE_WORKER_SCHEDULING_END \
FUT_DO_PROBE1(_STARPU_FUT_WORKER_SCHEDULING_END, _starpu_gettid());
#define _STARPU_TRACE_WORKER_SCHEDULING_PUSH \
FUT_DO_PROBE1(_STARPU_FUT_WORKER_SCHEDULING_PUSH, _starpu_gettid());
#define _STARPU_TRACE_WORKER_SCHEDULING_POP \
FUT_DO_PROBE1(_STARPU_FUT_WORKER_SCHEDULING_POP, _starpu_gettid());
#define _STARPU_TRACE_WORKER_SLEEP_START \
FUT_DO_PROBE1(_STARPU_FUT_WORKER_SLEEP_START, _starpu_gettid());
#define _STARPU_TRACE_WORKER_SLEEP_END \
FUT_DO_PROBE1(_STARPU_FUT_WORKER_SLEEP_END, _starpu_gettid());
/* Task submission, build, MPI and wait events.  The START/END pairs record
 * only _starpu_gettid(); _STARPU_TRACE_TASK_SUBMIT and
 * _STARPU_TRACE_TASK_WAIT_START additionally record the job id first.
 * NOTE(review): these expansions end with ';', so a call written with its own
 * ';' yields an extra empty statement and cannot be the sole body of an
 * unbraced if/else. */
#define _STARPU_TRACE_TASK_SUBMIT(job) \
FUT_DO_PROBE2(_STARPU_FUT_TASK_SUBMIT, (job)->job_id, _starpu_gettid());
#define _STARPU_TRACE_TASK_SUBMIT_START() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_SUBMIT_START, _starpu_gettid());
#define _STARPU_TRACE_TASK_SUBMIT_END() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_SUBMIT_END, _starpu_gettid());
#define _STARPU_TRACE_TASK_BUILD_START() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_BUILD_START, _starpu_gettid());
#define _STARPU_TRACE_TASK_BUILD_END() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_BUILD_END, _starpu_gettid());
#define _STARPU_TRACE_TASK_MPI_DECODE_START() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_MPI_DECODE_START, _starpu_gettid());
#define _STARPU_TRACE_TASK_MPI_DECODE_END() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_MPI_DECODE_END, _starpu_gettid());
#define _STARPU_TRACE_TASK_MPI_PRE_START() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_MPI_PRE_START, _starpu_gettid());
#define _STARPU_TRACE_TASK_MPI_PRE_END() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_MPI_PRE_END, _starpu_gettid());
#define _STARPU_TRACE_TASK_MPI_POST_START() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_MPI_POST_START, _starpu_gettid());
#define _STARPU_TRACE_TASK_MPI_POST_END() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_MPI_POST_END, _starpu_gettid());
#define _STARPU_TRACE_TASK_WAIT_START(job) \
FUT_DO_PROBE2(_STARPU_FUT_TASK_WAIT_START, (job)->job_id, _starpu_gettid());
#define _STARPU_TRACE_TASK_WAIT_END() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_WAIT_END, _starpu_gettid());
#define _STARPU_TRACE_TASK_WAIT_FOR_ALL_START() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_WAIT_FOR_ALL_START, _starpu_gettid());
#define _STARPU_TRACE_TASK_WAIT_FOR_ALL_END() \
FUT_DO_PROBE1(_STARPU_FUT_TASK_WAIT_FOR_ALL_END, _starpu_gettid());
/* User-defined section and memory management events.  All of them record
 * _starpu_gettid().
 * Mind the parameter order: the START_ALLOC, START_ALLOC_REUSE and START_FREE
 * events record (memnode, tid, size), whereas USED_MEM and the MEMRECLAIM
 * events record the thread identifier last.
 * NOTE(review): these expansions end with ';', so a call written with its own
 * ';' yields an extra empty statement and cannot be the sole body of an
 * unbraced if/else. */
#define _STARPU_TRACE_USER_DEFINED_START \
FUT_DO_PROBE1(_STARPU_FUT_USER_DEFINED_START, _starpu_gettid());
#define _STARPU_TRACE_USER_DEFINED_END \
FUT_DO_PROBE1(_STARPU_FUT_USER_DEFINED_END, _starpu_gettid());
#define _STARPU_TRACE_START_ALLOC(memnode, size) \
FUT_DO_PROBE3(_STARPU_FUT_START_ALLOC, memnode, _starpu_gettid(), size);
#define _STARPU_TRACE_END_ALLOC(memnode) \
FUT_DO_PROBE2(_STARPU_FUT_END_ALLOC, memnode, _starpu_gettid());
#define _STARPU_TRACE_START_ALLOC_REUSE(memnode, size) \
FUT_DO_PROBE3(_STARPU_FUT_START_ALLOC_REUSE, memnode, _starpu_gettid(), size);
#define _STARPU_TRACE_END_ALLOC_REUSE(memnode) \
FUT_DO_PROBE2(_STARPU_FUT_END_ALLOC_REUSE, memnode, _starpu_gettid());
#define _STARPU_TRACE_START_FREE(memnode, size) \
FUT_DO_PROBE3(_STARPU_FUT_START_FREE, memnode, _starpu_gettid(), size);
#define _STARPU_TRACE_END_FREE(memnode) \
FUT_DO_PROBE2(_STARPU_FUT_END_FREE, memnode, _starpu_gettid());
#define _STARPU_TRACE_START_WRITEBACK(memnode) \
FUT_DO_PROBE2(_STARPU_FUT_START_WRITEBACK, memnode, _starpu_gettid());
#define _STARPU_TRACE_END_WRITEBACK(memnode) \
FUT_DO_PROBE2(_STARPU_FUT_END_WRITEBACK, memnode, _starpu_gettid());
#define _STARPU_TRACE_USED_MEM(memnode,used) \
FUT_DO_PROBE3(_STARPU_FUT_USED_MEM, memnode, used, _starpu_gettid());
#define _STARPU_TRACE_START_MEMRECLAIM(memnode,is_prefetch) \
FUT_DO_PROBE3(_STARPU_FUT_START_MEMRECLAIM, memnode, is_prefetch, _starpu_gettid());
#define _STARPU_TRACE_END_MEMRECLAIM(memnode, is_prefetch) \
FUT_DO_PROBE3(_STARPU_FUT_END_MEMRECLAIM, memnode, is_prefetch, _starpu_gettid());
#define _STARPU_TRACE_START_WRITEBACK_ASYNC(memnode) \
FUT_DO_PROBE2(_STARPU_FUT_START_WRITEBACK_ASYNC, memnode, _starpu_gettid());
#define _STARPU_TRACE_END_WRITEBACK_ASYNC(memnode) \
FUT_DO_PROBE2(_STARPU_FUT_END_WRITEBACK_ASYNC, memnode, _starpu_gettid());
  576. /* We skip these events because they are called so often that they cause FxT to
  577. * fail and make the overall trace unreadable anyway. */
  /*
   * Progress, user-event, profiling, free-form string and hypervisor probes.
   *
   * NOTE(review): the comment just above says the progress events are skipped,
   * yet both PROGRESS macros below expand to live FUT_DO_PROBE2 calls with
   * (memnode, thread id) as payload. Confirm whether the comment is stale.
   */
  578. #define _STARPU_TRACE_START_PROGRESS(memnode) \
  579. FUT_DO_PROBE2(_STARPU_FUT_START_PROGRESS_ON_TID, memnode, _starpu_gettid());
  580. #define _STARPU_TRACE_END_PROGRESS(memnode) \
  581. FUT_DO_PROBE2(_STARPU_FUT_END_PROGRESS_ON_TID, memnode, _starpu_gettid());
  /* Payload: the caller-supplied value, then the thread id. */
  582. #define _STARPU_TRACE_USER_EVENT(code) \
  583. FUT_DO_PROBE2(_STARPU_FUT_USER_EVENT, code, _starpu_gettid());
  584. #define _STARPU_TRACE_SET_PROFILING(status) \
  585. FUT_DO_PROBE2(_STARPU_FUT_SET_PROFILING, status, _starpu_gettid());
  /*
   * NOTE(review): object-like here (no parameter list, no payload, no trailing
   * ';'), whereas the dummy definition of the same name in the !STARPU_USE_FXT
   * branch of this file is function-like. A call site can only compile in one
   * of the two configurations; confirm which form is intended.
   */
  586. #define _STARPU_TRACE_TASK_WAIT_FOR_ALL \
  587. FUT_DO_PROBE0(_STARPU_FUT_TASK_WAIT_FOR_ALL)
  /*
   * String probes: S is forwarded as the string argument. THREAD_EVENT also
   * passes the thread id. Neither expansion ends with ';'.
   */
  588. #define _STARPU_TRACE_EVENT(S) \
  589. FUT_DO_PROBESTR(_STARPU_FUT_EVENT,S)
  590. #define _STARPU_TRACE_THREAD_EVENT(S) \
  591. _STARPU_FUT_DO_PROBE1STR(_STARPU_FUT_THREAD_EVENT, _starpu_gettid(), S)
  /* Hypervisor begin/end markers; the payload is the thread id only. */
  592. #define _STARPU_TRACE_HYPERVISOR_BEGIN() \
  593. FUT_DO_PROBE1(_STARPU_FUT_HYPERVISOR_BEGIN, _starpu_gettid());
  594. #define _STARPU_TRACE_HYPERVISOR_END() \
  595. FUT_DO_PROBE1(_STARPU_FUT_HYPERVISOR_END, _starpu_gettid());
  /*
   * Lock-tracing probes (mutexes, rwlocks, spinlocks, condition variables and
   * barriers).
   *
   * When STARPU_FXT_LOCK_TRACES is defined, each macro emits one
   * _STARPU_FUT_DO_PROBE2STR event whose payload is a source line, the calling
   * thread id (_starpu_gettid()) and the base name of a source file.
   * Otherwise each macro expands to an empty statement that only casts its
   * arguments (if any) to void.
   */

  /*
   * Yield the part of `path` that follows its last '/', or `path` itself when
   * it contains no '/'.
   *
   * A bare strrchr(path, '/') + 1 is undefined behaviour (NULL + 1) whenever
   * the path has no directory component, e.g. when the compiler is invoked on
   * a file of the current directory and __FILE__ is just "foo.c".
   *
   * `path` is evaluated more than once: pass an expression free of side
   * effects (a string literal or a plain variable).
   */
  #define _STARPU_TRACE_BASENAME(path) \
      (strrchr((path), '/') != NULL ? strrchr((path), '/') + 1 : (path))

  #ifdef STARPU_FXT_LOCK_TRACES

  /*
   * Shared implementation of all lock probes.
   *   code: FxT event code
   *   path: source file path; read exactly once into a local
   *   line: source line number
   * The base name is stored in a local before being handed to
   * _STARPU_FUT_DO_PROBE2STR so that the probe macro receives a plain
   * identifier as its string argument.
   */
  #define _STARPU_TRACE_LOCK_PROBE(code, path, line) do { \
      const char *_starpu_trace_path = (path); \
      const char *_starpu_trace_file = _STARPU_TRACE_BASENAME(_starpu_trace_path); \
      _STARPU_FUT_DO_PROBE2STR(code, line, _starpu_gettid(), _starpu_trace_file); \
  } while (0)

  /* Mutex probes: tagged with the __FILE__ / __LINE__ of the call site. */
  #define _STARPU_TRACE_LOCKING_MUTEX() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_LOCKING_MUTEX, __FILE__, __LINE__)
  #define _STARPU_TRACE_MUTEX_LOCKED() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_MUTEX_LOCKED, __FILE__, __LINE__)
  #define _STARPU_TRACE_UNLOCKING_MUTEX() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_UNLOCKING_MUTEX, __FILE__, __LINE__)
  #define _STARPU_TRACE_MUTEX_UNLOCKED() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_MUTEX_UNLOCKED, __FILE__, __LINE__)
  #define _STARPU_TRACE_TRYLOCK_MUTEX() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_TRYLOCK_MUTEX, __FILE__, __LINE__)

  /* Read/write lock probes: tagged with the __FILE__ / __LINE__ of the call site. */
  #define _STARPU_TRACE_RDLOCKING_RWLOCK() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_RDLOCKING_RWLOCK, __FILE__, __LINE__)
  #define _STARPU_TRACE_RWLOCK_RDLOCKED() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_RWLOCK_RDLOCKED, __FILE__, __LINE__)
  #define _STARPU_TRACE_WRLOCKING_RWLOCK() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_WRLOCKING_RWLOCK, __FILE__, __LINE__)
  #define _STARPU_TRACE_RWLOCK_WRLOCKED() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_RWLOCK_WRLOCKED, __FILE__, __LINE__)
  #define _STARPU_TRACE_UNLOCKING_RWLOCK() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_UNLOCKING_RWLOCK, __FILE__, __LINE__)
  #define _STARPU_TRACE_RWLOCK_UNLOCKED() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_RWLOCK_UNLOCKED, __FILE__, __LINE__)

  /*
   * Spinlock probes are emitted only when the current worker's type is
   * STARPU_CUDA_WORKER. The file and line come from the caller instead of
   * __FILE__ / __LINE__, and are not evaluated when the condition is false.
   * The identifier spelling (sic) is kept as-is since other files may use it.
   */
  #define STARPU_TRACE_SPINLOCK_CONDITITION (starpu_worker_get_type(starpu_worker_get_id()) == STARPU_CUDA_WORKER)
  #define _STARPU_TRACE_LOCKING_SPINLOCK(file, line) do { \
      if (STARPU_TRACE_SPINLOCK_CONDITITION) { \
          _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_LOCKING_SPINLOCK, file, line); \
      } \
  } while (0)
  #define _STARPU_TRACE_SPINLOCK_LOCKED(file, line) do { \
      if (STARPU_TRACE_SPINLOCK_CONDITITION) { \
          _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_SPINLOCK_LOCKED, file, line); \
      } \
  } while (0)
  #define _STARPU_TRACE_UNLOCKING_SPINLOCK(file, line) do { \
      if (STARPU_TRACE_SPINLOCK_CONDITITION) { \
          _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_UNLOCKING_SPINLOCK, file, line); \
      } \
  } while (0)
  #define _STARPU_TRACE_SPINLOCK_UNLOCKED(file, line) do { \
      if (STARPU_TRACE_SPINLOCK_CONDITITION) { \
          _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_SPINLOCK_UNLOCKED, file, line); \
      } \
  } while (0)
  #define _STARPU_TRACE_TRYLOCK_SPINLOCK(file, line) do { \
      if (STARPU_TRACE_SPINLOCK_CONDITITION) { \
          _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_TRYLOCK_SPINLOCK, file, line); \
      } \
  } while (0)

  /* Condition-variable and barrier wait probes. */
  #define _STARPU_TRACE_COND_WAIT_BEGIN() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_COND_WAIT_BEGIN, __FILE__, __LINE__)
  #define _STARPU_TRACE_COND_WAIT_END() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_COND_WAIT_END, __FILE__, __LINE__)
  #define _STARPU_TRACE_BARRIER_WAIT_BEGIN() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_BARRIER_WAIT_BEGIN, __FILE__, __LINE__)
  #define _STARPU_TRACE_BARRIER_WAIT_END() \
      _STARPU_TRACE_LOCK_PROBE(_STARPU_FUT_BARRIER_WAIT_END, __FILE__, __LINE__)

  #else // !STARPU_FXT_LOCK_TRACES

  /* Lock tracing disabled: every probe is an empty statement. */
  #define _STARPU_TRACE_LOCKING_MUTEX() do {} while(0)
  #define _STARPU_TRACE_MUTEX_LOCKED() do {} while(0)
  #define _STARPU_TRACE_UNLOCKING_MUTEX() do {} while(0)
  #define _STARPU_TRACE_MUTEX_UNLOCKED() do {} while(0)
  #define _STARPU_TRACE_TRYLOCK_MUTEX() do {} while(0)
  #define _STARPU_TRACE_RDLOCKING_RWLOCK() do {} while(0)
  #define _STARPU_TRACE_RWLOCK_RDLOCKED() do {} while(0)
  #define _STARPU_TRACE_WRLOCKING_RWLOCK() do {} while(0)
  #define _STARPU_TRACE_RWLOCK_WRLOCKED() do {} while(0)
  #define _STARPU_TRACE_UNLOCKING_RWLOCK() do {} while(0)
  #define _STARPU_TRACE_RWLOCK_UNLOCKED() do {} while(0)
  /* Arguments are parenthesized so that any expression may be passed. */
  #define _STARPU_TRACE_LOCKING_SPINLOCK(file, line) do {(void)(file); (void)(line);} while(0)
  #define _STARPU_TRACE_SPINLOCK_LOCKED(file, line) do {(void)(file); (void)(line);} while(0)
  #define _STARPU_TRACE_UNLOCKING_SPINLOCK(file, line) do {(void)(file); (void)(line);} while(0)
  #define _STARPU_TRACE_SPINLOCK_UNLOCKED(file, line) do {(void)(file); (void)(line);} while(0)
  #define _STARPU_TRACE_TRYLOCK_SPINLOCK(file, line) do {(void)(file); (void)(line);} while(0)
  #define _STARPU_TRACE_COND_WAIT_BEGIN() do {} while(0)
  #define _STARPU_TRACE_COND_WAIT_END() do {} while(0)
  #define _STARPU_TRACE_BARRIER_WAIT_BEGIN() do {} while(0)
  #define _STARPU_TRACE_BARRIER_WAIT_END() do {} while(0)

  #endif // STARPU_FXT_LOCK_TRACES
  /*
   * Memory, data-handle and scheduler-component probes.
   *
   * As with the other probes of this file, each macro expands to a single
   * FUT_DO_PROBEn (or _STARPU_FUT_DO_PROBE1STR) call; all but the last one
   * already end with ';'.
   */
  /* Payload: size, then the calling thread id. */
  730. #define _STARPU_TRACE_MEMORY_FULL(size) \
  731. FUT_DO_PROBE2(_STARPU_FUT_MEMORY_FULL,size,_starpu_gettid());
  /* Payload: workerid and size only; no thread id is recorded here. */
  732. #define _STARPU_TRACE_DATA_LOAD(workerid,size) \
  733. FUT_DO_PROBE2(_STARPU_FUT_DATA_LOAD, workerid, size);
  /*
   * The macro parameters are (handle, memnode) but the payload order is
   * (memnode, thread id, handle).
   */
  734. #define _STARPU_TRACE_START_UNPARTITION(handle, memnode) \
  735. FUT_DO_PROBE3(_STARPU_FUT_START_UNPARTITION_ON_TID, memnode, _starpu_gettid(), handle);
  736. #define _STARPU_TRACE_END_UNPARTITION(handle, memnode) \
  737. FUT_DO_PROBE3(_STARPU_FUT_END_UNPARTITION_ON_TID, memnode, _starpu_gettid(), handle);
  /* Payload: thread id first, then workerid, ntasks, exp_len. */
  738. #define _STARPU_TRACE_SCHED_COMPONENT_PUSH_PRIO(workerid, ntasks, exp_len) \
  739. FUT_DO_PROBE4(_STARPU_FUT_SCHED_COMPONENT_PUSH_PRIO, _starpu_gettid(), workerid, ntasks, exp_len);
  740. #define _STARPU_TRACE_SCHED_COMPONENT_POP_PRIO(workerid, ntasks, exp_len) \
  741. FUT_DO_PROBE4(_STARPU_FUT_SCHED_COMPONENT_POP_PRIO, _starpu_gettid(), workerid, ntasks, exp_len);
  /*
   * Passes `component` itself and its `name` field as the string argument.
   * `component` appears twice in the expansion, so it must be free of side
   * effects.
   */
  742. #define _STARPU_TRACE_SCHED_COMPONENT_NEW(component) \
  743. _STARPU_FUT_DO_PROBE1STR(_STARPU_FUT_SCHED_COMPONENT_NEW, component, (component)->name);
  744. #define _STARPU_TRACE_SCHED_COMPONENT_CONNECT(parent, child) \
  745. FUT_DO_PROBE2(_STARPU_FUT_SCHED_COMPONENT_CONNECT, parent, child);
  /*
   * Payload: thread id, from, to, task, and the `priority` field of `task`.
   * `task` appears twice in the expansion, so it must be free of side effects.
   */
  746. #define _STARPU_TRACE_SCHED_COMPONENT_PUSH(from, to, task) \
  747. FUT_DO_PROBE5(_STARPU_FUT_SCHED_COMPONENT_PUSH, _starpu_gettid(), from, to, task, (task)->priority);
  748. #define _STARPU_TRACE_SCHED_COMPONENT_PULL(from, to, task) \
  749. FUT_DO_PROBE5(_STARPU_FUT_SCHED_COMPONENT_PULL, _starpu_gettid(), from, to, task, (task)->priority);
  /* Payload: handle only. Unlike the probes above, no trailing ';' here. */
  750. #define _STARPU_TRACE_HANDLE_DATA_REGISTER(handle) \
  751. FUT_DO_PROBE1(_STARPU_FUT_HANDLE_DATA_REGISTER, handle)
  /*
   * Data invalidation probe.
   *
   * The real probe is compiled out by the `#if 0` below; the reason is not
   * recorded in this file. The active definition is a no-op that casts both
   * arguments to void. Each argument is parenthesized so that any expression
   * (e.g. `h + 1`) can be passed; a bare `(void) h + 1` does not compile.
   */
  #if 0
  #define _STARPU_TRACE_DATA_INVALIDATE(handle, node) \
      FUT_DO_PROBE2(_STARPU_FUT_DATA_INVALIDATE, handle, node)
  #else
  #define _STARPU_TRACE_DATA_INVALIDATE(handle, node) do {(void)(handle); (void)(node);} while (0)
  #endif
  758. #else // !STARPU_USE_FXT
  759. /* Dummy macros in case FxT is disabled */
  /*
   * No-op trace macros for the !STARPU_USE_FXT branch: worker, codelet, job,
   * tag/task dependency and data-copy events.
   *
   * Each one expands to a `do { ... } while(0)` statement that casts every
   * parameter to void: the argument is still evaluated once and type-checked,
   * but nothing is recorded (presumably this also silences unused-variable
   * warnings at call sites; confirm).
   */
  760. #define _STARPU_TRACE_NEW_MEM_NODE(nodeid) do {(void)(nodeid);} while(0)
  761. #define _STARPU_TRACE_WORKER_INIT_START(a,b,c,d,e,f) do {(void)(a); (void)(b); (void)(c); (void)(d); (void)(e); (void)(f);} while(0)
  762. #define _STARPU_TRACE_WORKER_INIT_END(workerid) do {(void)(workerid);} while(0)
  763. #define _STARPU_TRACE_START_CODELET_BODY(job, nimpl, perf_arch, workerid) do {(void)(job); (void)(nimpl); (void)(perf_arch); (void)(workerid);} while(0)
  764. #define _STARPU_TRACE_END_CODELET_BODY(job, nimpl, perf_arch, workerid) do {(void)(job); (void)(nimpl); (void)(perf_arch); (void)(workerid);} while(0)
  765. #define _STARPU_TRACE_START_EXECUTING() do {} while(0)
  766. #define _STARPU_TRACE_END_EXECUTING() do {} while(0)
  767. #define _STARPU_TRACE_START_CALLBACK(job) do {(void)(job);} while(0)
  768. #define _STARPU_TRACE_END_CALLBACK(job) do {(void)(job);} while(0)
  769. #define _STARPU_TRACE_JOB_PUSH(task, prio) do {(void)(task); (void)(prio);} while(0)
  770. #define _STARPU_TRACE_JOB_POP(task, prio) do {(void)(task); (void)(prio);} while(0)
  771. #define _STARPU_TRACE_UPDATE_TASK_CNT(counter) do {(void)(counter);} while(0)
  772. #define _STARPU_TRACE_START_FETCH_INPUT(job) do {(void)(job);} while(0)
  773. #define _STARPU_TRACE_END_FETCH_INPUT(job) do {(void)(job);} while(0)
  774. #define _STARPU_TRACE_START_PUSH_OUTPUT(job) do {(void)(job);} while(0)
  775. #define _STARPU_TRACE_END_PUSH_OUTPUT(job) do {(void)(job);} while(0)
  776. #define _STARPU_TRACE_TAG(tag, job) do {(void)(tag); (void)(job);} while(0)
  777. #define _STARPU_TRACE_TAG_DEPS(a, b) do {(void)(a); (void)(b);} while(0)
  778. #define _STARPU_TRACE_TASK_DEPS(a, b) do {(void)(a); (void)(b);} while(0)
  779. #define _STARPU_TRACE_GHOST_TASK_DEPS(a, b) do {(void)(a); (void)(b);} while(0)
  780. #define _STARPU_TRACE_TASK_DONE(a) do {(void)(a);} while(0)
  781. #define _STARPU_TRACE_TAG_DONE(a) do {(void)(a);} while(0)
  782. #define _STARPU_TRACE_DATA_COPY(a, b, c) do {(void)(a); (void)(b); (void)(c);} while(0)
  783. #define _STARPU_TRACE_START_DRIVER_COPY(a,b,c,d,e,f) do {(void)(a); (void)(b); (void)(c); (void)(d); (void)(e); (void)(f);} while(0)
  784. #define _STARPU_TRACE_END_DRIVER_COPY(a,b,c,d,e) do {(void)(a); (void)(b); (void)(c); (void)(d); (void)(e);} while(0)
  785. #define _STARPU_TRACE_START_DRIVER_COPY_ASYNC(a,b) do {(void)(a); (void)(b);} while(0)
  786. #define _STARPU_TRACE_END_DRIVER_COPY_ASYNC(a,b) do {(void)(a); (void)(b);} while(0)
  787. #define _STARPU_TRACE_WORK_STEALING(a, b) do {(void)(a); (void)(b);} while(0)
  /*
   * NOTE(review): WORKER_DEINIT_START and the WORKER_SCHEDULING_* and
   * WORKER_SLEEP_* macros are object-like (no parameter list). A call site
   * written with "()" would leave a stray "()" after the expansion and fail
   * to compile, so they must be used as bare identifiers.
   */
  788. #define _STARPU_TRACE_WORKER_DEINIT_START do {} while(0)
  789. #define _STARPU_TRACE_WORKER_DEINIT_END(a) do {(void)(a);} while(0)
  790. #define _STARPU_TRACE_WORKER_SCHEDULING_START do {} while(0)
  791. #define _STARPU_TRACE_WORKER_SCHEDULING_END do {} while(0)
  792. #define _STARPU_TRACE_WORKER_SCHEDULING_PUSH do {} while(0)
  793. #define _STARPU_TRACE_WORKER_SCHEDULING_POP do {} while(0)
  794. #define _STARPU_TRACE_WORKER_SLEEP_START do {} while(0)
  795. #define _STARPU_TRACE_WORKER_SLEEP_END do {} while(0)
  /*
   * No-op trace macros for the !STARPU_USE_FXT branch: task submission/build,
   * MPI phases, task wait, memory-node operations and user events.
   *
   * Each one expands to a `do { ... } while(0)` statement that at most casts
   * its parameters to void; nothing is recorded.
   */
  796. #define _STARPU_TRACE_TASK_SUBMIT(job) do {(void)(job);} while(0)
  797. #define _STARPU_TRACE_TASK_SUBMIT_START() do {} while(0)
  798. #define _STARPU_TRACE_TASK_SUBMIT_END() do {} while(0)
  799. #define _STARPU_TRACE_TASK_BUILD_START() do {} while(0)
  800. #define _STARPU_TRACE_TASK_BUILD_END() do {} while(0)
  801. #define _STARPU_TRACE_TASK_MPI_DECODE_START() do {} while(0)
  802. #define _STARPU_TRACE_TASK_MPI_DECODE_END() do {} while(0)
  803. #define _STARPU_TRACE_TASK_MPI_PRE_START() do {} while(0)
  804. #define _STARPU_TRACE_TASK_MPI_PRE_END() do {} while(0)
  805. #define _STARPU_TRACE_TASK_MPI_POST_START() do {} while(0)
  806. #define _STARPU_TRACE_TASK_MPI_POST_END() do {} while(0)
  807. #define _STARPU_TRACE_TASK_WAIT_START(job) do {(void)(job);} while(0)
  808. #define _STARPU_TRACE_TASK_WAIT_END() do {} while(0)
  809. #define _STARPU_TRACE_TASK_WAIT_FOR_ALL_START() do {} while(0)
  810. #define _STARPU_TRACE_TASK_WAIT_FOR_ALL_END() do {} while(0)
  /*
   * NOTE(review): function-like here, but the STARPU_USE_FXT definitions of
   * these two names earlier in this file are object-like (no parameter list).
   * A call site can only compile in one of the two configurations; confirm
   * which form is intended.
   */
  811. #define _STARPU_TRACE_USER_DEFINED_START() do {} while(0)
  812. #define _STARPU_TRACE_USER_DEFINED_END() do {} while(0)
  813. #define _STARPU_TRACE_START_ALLOC(memnode, size) do {(void)(memnode); (void)(size);} while(0)
  814. #define _STARPU_TRACE_END_ALLOC(memnode) do {(void)(memnode);} while(0)
  815. #define _STARPU_TRACE_START_ALLOC_REUSE(a, size) do {(void)(a); (void)(size);} while(0)
  816. #define _STARPU_TRACE_END_ALLOC_REUSE(a) do {(void)(a);} while(0)
  817. #define _STARPU_TRACE_START_FREE(memnode, size) do {(void)(memnode); (void)(size);} while(0)
  818. #define _STARPU_TRACE_END_FREE(memnode) do {(void)(memnode);} while(0)
  819. #define _STARPU_TRACE_START_WRITEBACK(memnode) do {(void)(memnode);} while(0)
  820. #define _STARPU_TRACE_END_WRITEBACK(memnode) do {(void)(memnode);} while(0)
  821. #define _STARPU_TRACE_USED_MEM(memnode,used) do {(void)(memnode); (void)(used);} while (0)
  822. #define _STARPU_TRACE_START_MEMRECLAIM(memnode,is_prefetch) do {(void)(memnode); (void)(is_prefetch);} while(0)
  823. #define _STARPU_TRACE_END_MEMRECLAIM(memnode,is_prefetch) do {(void)(memnode); (void)(is_prefetch);} while(0)
  824. #define _STARPU_TRACE_START_WRITEBACK_ASYNC(memnode) do {(void)(memnode);} while(0)
  825. #define _STARPU_TRACE_END_WRITEBACK_ASYNC(memnode) do {(void)(memnode);} while(0)
  826. #define _STARPU_TRACE_START_PROGRESS(memnode) do {(void)( memnode);} while(0)
  827. #define _STARPU_TRACE_END_PROGRESS(memnode) do {(void)( memnode);} while(0)
  828. #define _STARPU_TRACE_USER_EVENT(code) do {(void)(code);} while(0)
  829. #define _STARPU_TRACE_SET_PROFILING(status) do {(void)(status);} while(0)
  /*
   * NOTE(review): function-like here, but the STARPU_USE_FXT definition of
   * _STARPU_TRACE_TASK_WAIT_FOR_ALL earlier in this file is object-like; the
   * same call-site incompatibility applies.
   */
  830. #define _STARPU_TRACE_TASK_WAIT_FOR_ALL() do {} while(0)
  831. #define _STARPU_TRACE_EVENT(S) do {(void)(S);} while(0)
  832. #define _STARPU_TRACE_THREAD_EVENT(S) do {(void)(S);} while(0)
  /*
   * No-op trace macros for the !STARPU_USE_FXT branch: lock, condition,
   * barrier, memory, unpartition, scheduler-component and data-handle events.
   *
   * The lock/cond/barrier entries mirror the empty fallbacks that the
   * STARPU_USE_FXT branch defines when STARPU_FXT_LOCK_TRACES is not set.
   * Each macro expands to a `do { ... } while(0)` statement that at most casts
   * its parameters to void; nothing is recorded.
   */
  833. #define _STARPU_TRACE_LOCKING_MUTEX() do {} while(0)
  834. #define _STARPU_TRACE_MUTEX_LOCKED() do {} while(0)
  835. #define _STARPU_TRACE_UNLOCKING_MUTEX() do {} while(0)
  836. #define _STARPU_TRACE_MUTEX_UNLOCKED() do {} while(0)
  837. #define _STARPU_TRACE_TRYLOCK_MUTEX() do {} while(0)
  838. #define _STARPU_TRACE_RDLOCKING_RWLOCK() do {} while(0)
  839. #define _STARPU_TRACE_RWLOCK_RDLOCKED() do {} while(0)
  840. #define _STARPU_TRACE_WRLOCKING_RWLOCK() do {} while(0)
  841. #define _STARPU_TRACE_RWLOCK_WRLOCKED() do {} while(0)
  842. #define _STARPU_TRACE_UNLOCKING_RWLOCK() do {} while(0)
  843. #define _STARPU_TRACE_RWLOCK_UNLOCKED() do {} while(0)
  /* Spinlock dummies take the caller-supplied file and line and discard them. */
  844. #define _STARPU_TRACE_LOCKING_SPINLOCK(file, line) do {(void)(file); (void)(line);} while(0)
  845. #define _STARPU_TRACE_SPINLOCK_LOCKED(file, line) do {(void)(file); (void)(line);} while(0)
  846. #define _STARPU_TRACE_UNLOCKING_SPINLOCK(file, line) do {(void)(file); (void)(line);} while(0)
  847. #define _STARPU_TRACE_SPINLOCK_UNLOCKED(file, line) do {(void)(file); (void)(line);} while(0)
  848. #define _STARPU_TRACE_TRYLOCK_SPINLOCK(file, line) do {(void)(file); (void)(line);} while(0)
  849. #define _STARPU_TRACE_COND_WAIT_BEGIN() do {} while(0)
  850. #define _STARPU_TRACE_COND_WAIT_END() do {} while(0)
  851. #define _STARPU_TRACE_BARRIER_WAIT_BEGIN() do {} while(0)
  852. #define _STARPU_TRACE_BARRIER_WAIT_END() do {} while(0)
  853. #define _STARPU_TRACE_MEMORY_FULL(size) do {(void)(size);} while(0)
  854. #define _STARPU_TRACE_DATA_LOAD(workerid,size) do {(void)(workerid); (void)(size);} while(0)
  855. #define _STARPU_TRACE_START_UNPARTITION(handle, memnode) do {(void)(handle); (void)(memnode);} while(0)
  856. #define _STARPU_TRACE_END_UNPARTITION(handle, memnode) do {(void)(handle); (void)(memnode);} while(0)
  857. #define _STARPU_TRACE_SCHED_COMPONENT_PUSH_PRIO(workerid, ntasks, exp_len) do {(void)(workerid); (void)(ntasks); (void)(exp_len);} while(0)
  858. #define _STARPU_TRACE_SCHED_COMPONENT_POP_PRIO(workerid, ntasks, exp_len) do {(void)(workerid); (void)(ntasks); (void)(exp_len);} while(0)
  859. #define _STARPU_TRACE_HYPERVISOR_BEGIN() do {} while(0)
  860. #define _STARPU_TRACE_HYPERVISOR_END() do {} while(0)
  /*
   * Unlike the STARPU_USE_FXT versions, these dummies do not dereference
   * `component` or `task`; they only cast the arguments to void.
   */
  861. #define _STARPU_TRACE_SCHED_COMPONENT_NEW(component) do {(void)(component);} while (0)
  862. #define _STARPU_TRACE_SCHED_COMPONENT_CONNECT(parent, child) do {(void)(parent); (void)(child);} while (0)
  863. #define _STARPU_TRACE_SCHED_COMPONENT_PUSH(from, to, task) do {(void)(from); (void)(to); (void)(task);} while (0)
  864. #define _STARPU_TRACE_SCHED_COMPONENT_PULL(from, to, task) do {(void)(from); (void)(to); (void)(task);} while (0)
  865. #define _STARPU_TRACE_HANDLE_DATA_REGISTER(handle) do {(void)(handle);} while (0)
  866. #define _STARPU_TRACE_DATA_INVALIDATE(handle, node) do {(void)(handle); (void)(node);} while (0)
  867. #define _STARPU_TRACE_WORKER_START_FETCH_INPUT(job, id) do {(void)(job); (void)(id);} while(0)
  868. #define _STARPU_TRACE_WORKER_END_FETCH_INPUT(job, id) do {(void)(job); (void)(id);} while(0)
  869. #endif // STARPU_USE_FXT
  870. #endif // __FXT_H__