starpu_mpi_fxt.h 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2010-2020 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
  4. * Copyright (C) 2019 Federal University of Rio Grande do Sul (UFRGS)
  5. *
  6. * StarPU is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU Lesser General Public License as published by
  8. * the Free Software Foundation; either version 2.1 of the License, or (at
  9. * your option) any later version.
  10. *
  11. * StarPU is distributed in the hope that it will be useful, but
  12. * WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  14. *
  15. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  16. */
  17. #ifndef __STARPU_MPI_FXT_H__
  18. #define __STARPU_MPI_FXT_H__
  19. #include <starpu.h>
  20. #include <common/config.h>
  21. #include <common/fxt.h>
  22. #ifdef __cplusplus
  23. extern "C"
  24. {
  25. #endif
  /*
   * FxT event codes used by the StarPU-MPI trace macros of this header.
   *
   * The list is sorted by numeric value; every name keeps exactly the value
   * it had before.  Note that 0x5219 is not assigned to any name here.
   */

  /* Start, stop and barrier */
  #define _STARPU_MPI_FUT_START                     0x5201
  #define _STARPU_MPI_FUT_STOP                      0x5202
  #define _STARPU_MPI_FUT_BARRIER                   0x5203

  /* Submission of sends and receives */
  #define _STARPU_MPI_FUT_ISEND_SUBMIT_BEGIN        0x5204
  #define _STARPU_MPI_FUT_ISEND_SUBMIT_END          0x5205
  #define _STARPU_MPI_FUT_IRECV_SUBMIT_BEGIN        0x5206
  #define _STARPU_MPI_FUT_IRECV_SUBMIT_END          0x5207

  /* Completion of sends and receives */
  #define _STARPU_MPI_FUT_ISEND_COMPLETE_BEGIN      0x5208
  #define _STARPU_MPI_FUT_ISEND_COMPLETE_END        0x5209
  #define _STARPU_MPI_FUT_IRECV_COMPLETE_BEGIN      0x520a
  #define _STARPU_MPI_FUT_IRECV_COMPLETE_END        0x520b

  /* Sleep, DTESTING, UTESTING, UWAIT, polling and driver-run intervals */
  #define _STARPU_MPI_FUT_SLEEP_BEGIN               0x520c
  #define _STARPU_MPI_FUT_SLEEP_END                 0x520d
  #define _STARPU_MPI_FUT_DTESTING_BEGIN            0x520e
  #define _STARPU_MPI_FUT_DTESTING_END              0x520f
  #define _STARPU_MPI_FUT_UTESTING_BEGIN            0x5210
  #define _STARPU_MPI_FUT_UTESTING_END              0x5211
  #define _STARPU_MPI_FUT_UWAIT_BEGIN               0x5212
  #define _STARPU_MPI_FUT_UWAIT_END                 0x5213
  #define _STARPU_MPI_FUT_POLLING_BEGIN             0x5214
  #define _STARPU_MPI_FUT_POLLING_END               0x5215
  #define _STARPU_MPI_FUT_DRIVER_RUN_BEGIN          0x5216
  #define _STARPU_MPI_FUT_DRIVER_RUN_END            0x5217

  /* Data handle attributes */
  #define _STARPU_MPI_FUT_DATA_SET_TAG              0x5218
  #define _STARPU_MPI_FUT_DATA_SET_RANK             0x521a

  /* Request termination */
  #define _STARPU_MPI_FUT_IRECV_TERMINATED          0x521b
  #define _STARPU_MPI_FUT_ISEND_TERMINATED          0x521c

  /* Detached-request testing and explicit tests */
  #define _STARPU_MPI_FUT_TESTING_DETACHED_BEGIN    0x521d
  #define _STARPU_MPI_FUT_TESTING_DETACHED_END      0x521e
  #define _STARPU_MPI_FUT_TEST_BEGIN                0x521f
  #define _STARPU_MPI_FUT_TEST_END                  0x5220
  57. #ifdef STARPU_USE_FXT
  /*
   * Emit the _STARPU_MPI_FUT_START event through FUT_DO_ALWAYS_PROBE3() with
   * the given rank, world size and the value of _starpu_gettid().  This macro
   * performs no _starpu_fxt_started check of its own.
   *
   * The expansion carries no trailing ';' -- the call site provides it, so
   * that `if (c) _STARPU_MPI_TRACE_START(r, w); else ...` stays well-formed.
   */
  #define _STARPU_MPI_TRACE_START(rank, worldsize) \
      FUT_DO_ALWAYS_PROBE3(_STARPU_MPI_FUT_START, (rank), (worldsize), _starpu_gettid())

  /*
   * Emit the _STARPU_MPI_FUT_STOP event; same arguments and same statement
   * shape as _STARPU_MPI_TRACE_START.
   */
  #define _STARPU_MPI_TRACE_STOP(rank, worldsize) \
      FUT_DO_ALWAYS_PROBE3(_STARPU_MPI_FUT_STOP, (rank), (worldsize), _starpu_gettid())

  /*
   * Emit the _STARPU_MPI_FUT_BARRIER event with rank, world size, key and the
   * value of _starpu_gettid(), but only when _starpu_fxt_started is non-zero.
   */
  #define _STARPU_MPI_TRACE_BARRIER(rank, worldsize, key) \
      do { \
          if (_starpu_fxt_started) { \
              FUT_DO_ALWAYS_PROBE4(_STARPU_MPI_FUT_BARRIER, (rank), (worldsize), (key), _starpu_gettid()); \
          } \
      } while (0)
  /*
   * Submission events for sends and receives.
   *
   * Each macro expands to exactly one FUT_FULL_PROBEn() call that uses the
   * _STARPU_FUT_KEYMASK_MPI key mask and passes the macro arguments followed
   * by the value of _starpu_gettid().
   *
   * The expansions carry no trailing ';' -- the call site provides it, so
   * that `if (c) MACRO(...); else ...` stays well-formed.
   */

  /* ISEND_SUBMIT_BEGIN: destination, data tag, size. */
  #define _STARPU_MPI_TRACE_ISEND_SUBMIT_BEGIN(dest, data_tag, size) \
      FUT_FULL_PROBE4(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_ISEND_SUBMIT_BEGIN, \
                      (dest), (data_tag), (size), _starpu_gettid())

  /* ISEND_SUBMIT_END: destination, data tag, size, job id, handle. */
  #define _STARPU_MPI_TRACE_ISEND_SUBMIT_END(dest, data_tag, size, jobid, handle) \
      FUT_FULL_PROBE6(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_ISEND_SUBMIT_END, \
                      (dest), (data_tag), (size), (jobid), (handle), _starpu_gettid())

  /* IRECV_SUBMIT_BEGIN: source, data tag. */
  #define _STARPU_MPI_TRACE_IRECV_SUBMIT_BEGIN(src, data_tag) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_IRECV_SUBMIT_BEGIN, \
                      (src), (data_tag), _starpu_gettid())

  /* IRECV_SUBMIT_END: source, data tag. */
  #define _STARPU_MPI_TRACE_IRECV_SUBMIT_END(src, data_tag) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_IRECV_SUBMIT_END, \
                      (src), (data_tag), _starpu_gettid())
  /*
   * Completion events for sends and receives.
   *
   * The four ISEND_/IRECV_ macros each expand to one FUT_FULL_PROBEn() call
   * using the _STARPU_FUT_KEYMASK_MPI key mask, with the value of
   * _starpu_gettid() as last probe argument.  None of the expansions carries
   * a trailing ';' -- the call site provides it.
   */
  #define _STARPU_MPI_TRACE_ISEND_COMPLETE_BEGIN(dest, data_tag, size) \
      FUT_FULL_PROBE4(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_ISEND_COMPLETE_BEGIN, \
                      (dest), (data_tag), (size), _starpu_gettid())

  #define _STARPU_MPI_TRACE_ISEND_COMPLETE_END(dest, data_tag, size) \
      FUT_FULL_PROBE4(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_ISEND_COMPLETE_END, \
                      (dest), (data_tag), (size), _starpu_gettid())

  #define _STARPU_MPI_TRACE_IRECV_COMPLETE_BEGIN(src, data_tag) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_IRECV_COMPLETE_BEGIN, \
                      (src), (data_tag), _starpu_gettid())

  #define _STARPU_MPI_TRACE_IRECV_COMPLETE_END(src, data_tag) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_IRECV_COMPLETE_END, \
                      (src), (data_tag), _starpu_gettid())

  /*
   * Dispatch on the request type: RECV_REQ goes to the IRECV variant,
   * SEND_REQ goes to the ISEND variant with a size of 0, any other value
   * emits nothing.
   *
   * Wrapped in do { } while (0) so that the expansion is a single statement
   * and cannot capture an `else` that follows the call site.  `type` is
   * parenthesized so that an expression argument (e.g. a conditional
   * expression) is compared as a whole; it may be evaluated twice.
   */
  #define _STARPU_MPI_TRACE_COMPLETE_BEGIN(type, rank, data_tag) \
      do { \
          if ((type) == RECV_REQ) { \
              _STARPU_MPI_TRACE_IRECV_COMPLETE_BEGIN((rank), (data_tag)); \
          } else if ((type) == SEND_REQ) { \
              _STARPU_MPI_TRACE_ISEND_COMPLETE_BEGIN((rank), (data_tag), 0); \
          } \
      } while (0)

  /* Same dispatch as _STARPU_MPI_TRACE_COMPLETE_BEGIN, for the END events. */
  #define _STARPU_MPI_TRACE_COMPLETE_END(type, rank, data_tag) \
      do { \
          if ((type) == RECV_REQ) { \
              _STARPU_MPI_TRACE_IRECV_COMPLETE_END((rank), (data_tag)); \
          } else if ((type) == SEND_REQ) { \
              _STARPU_MPI_TRACE_ISEND_COMPLETE_END((rank), (data_tag), 0); \
          } \
      } while (0)
  /*
   * Emit a termination event for the request pointed to by `req`.
   *
   *  - (req)->request_type == RECV_REQ: _STARPU_MPI_FUT_IRECV_TERMINATED with
   *    rank, data_tag, (req)->post_sync_jobid, the value of _starpu_gettid()
   *    and (req)->data_handle, in that order.
   *  - (req)->request_type == SEND_REQ: _STARPU_MPI_FUT_ISEND_TERMINATED with
   *    rank, data_tag and the value of _starpu_gettid().
   *  - any other request type: nothing is emitted.
   *
   * Wrapped in do { } while (0) so that the expansion is a single statement:
   * it cannot capture an `else` following the call site, and the call site
   * provides the terminating ';'.  `req` may be evaluated several times.
   */
  #define _STARPU_MPI_TRACE_TERMINATED(req, rank, data_tag) \
      do { \
          if ((req)->request_type == RECV_REQ) { \
              FUT_FULL_PROBE5(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_IRECV_TERMINATED, \
                              (rank), (data_tag), (req)->post_sync_jobid, _starpu_gettid(), (req)->data_handle); \
          } else if ((req)->request_type == SEND_REQ) { \
              FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_ISEND_TERMINATED, \
                              (rank), (data_tag), _starpu_gettid()); \
          } \
      } while (0)
  /*
   * SLEEP and DTESTING interval markers.
   *
   * Each macro expands to one FUT_FULL_PROBE1() call using the
   * _STARPU_FUT_KEYMASK_MPI key mask, with the value of _starpu_gettid() as
   * the only payload.  The expansions carry no trailing ';' -- the call site
   * provides it, so that `if (c) MACRO(); else ...` stays well-formed.
   */
  #define _STARPU_MPI_TRACE_SLEEP_BEGIN() \
      FUT_FULL_PROBE1(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_SLEEP_BEGIN, _starpu_gettid())

  #define _STARPU_MPI_TRACE_SLEEP_END() \
      FUT_FULL_PROBE1(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_SLEEP_END, _starpu_gettid())

  #define _STARPU_MPI_TRACE_DTESTING_BEGIN() \
      FUT_FULL_PROBE1(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_DTESTING_BEGIN, _starpu_gettid())

  #define _STARPU_MPI_TRACE_DTESTING_END() \
      FUT_FULL_PROBE1(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_DTESTING_END, _starpu_gettid())
  /*
   * UTESTING and UWAIT interval markers.
   *
   * Each macro expands to one FUT_FULL_PROBE3() call using the
   * _STARPU_FUT_KEYMASK_MPI key mask and passing src, data_tag and the value
   * of _starpu_gettid().  The expansions carry no trailing ';' -- the call
   * site provides it, so that `if (c) MACRO(...); else ...` stays well-formed.
   */
  #define _STARPU_MPI_TRACE_UTESTING_BEGIN(src, data_tag) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_UTESTING_BEGIN, \
                      (src), (data_tag), _starpu_gettid())

  #define _STARPU_MPI_TRACE_UTESTING_END(src, data_tag) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_UTESTING_END, \
                      (src), (data_tag), _starpu_gettid())

  #define _STARPU_MPI_TRACE_UWAIT_BEGIN(src, data_tag) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_UWAIT_BEGIN, \
                      (src), (data_tag), _starpu_gettid())

  #define _STARPU_MPI_TRACE_UWAIT_END(src, data_tag) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_UWAIT_END, \
                      (src), (data_tag), _starpu_gettid())
  /*
   * Data attribute events.
   *
   * Each macro expands to one FUT_FULL_PROBE3() call using the
   * _STARPU_FUT_KEYMASK_MPI key mask and passing the handle, the attribute
   * value (rank or data tag) and the value of _starpu_gettid().  The
   * expansions carry no trailing ';' -- the call site provides it, so that
   * `if (c) MACRO(...); else ...` stays well-formed.
   */
  #define _STARPU_MPI_TRACE_DATA_SET_RANK(handle, rank) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_DATA_SET_RANK, \
                      (handle), (rank), _starpu_gettid())

  #define _STARPU_MPI_TRACE_DATA_SET_TAG(handle, data_tag) \
      FUT_FULL_PROBE3(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_DATA_SET_TAG, \
                      (handle), (data_tag), _starpu_gettid())
  /*
   * TESTING_DETACHED and TEST interval markers.
   *
   * The probing variants are compiled out (`#if 0`); the active definitions
   * are empty statements.  Both branches expand to a single statement with no
   * trailing ';', so switching the `#if` does not change what call sites must
   * look like.
   */
  #if 0
  /* This is very expensive in the trace, only enable for debugging */
  /* NOTE(review): assumes FUT_DO_PROBEn() expands to a single statement that
   * takes the caller's ';', like FUT_DO_ALWAYS_PROBEn() -- confirm before
   * enabling this branch. */
  #define _STARPU_MPI_TRACE_TESTING_DETACHED_BEGIN() \
      FUT_DO_PROBE1(_STARPU_MPI_FUT_TESTING_DETACHED_BEGIN, _starpu_gettid())
  #define _STARPU_MPI_TRACE_TESTING_DETACHED_END() \
      FUT_DO_PROBE1(_STARPU_MPI_FUT_TESTING_DETACHED_END, _starpu_gettid())
  #define _STARPU_MPI_TRACE_TEST_BEGIN(peer, data_tag) \
      FUT_DO_PROBE3(_STARPU_MPI_FUT_TEST_BEGIN, (peer), (data_tag), _starpu_gettid())
  #define _STARPU_MPI_TRACE_TEST_END(peer, data_tag) \
      FUT_DO_PROBE3(_STARPU_MPI_FUT_TEST_END, (peer), (data_tag), _starpu_gettid())
  #else
  /* Tracing of these events is disabled: the arguments are not evaluated. */
  #define _STARPU_MPI_TRACE_TESTING_DETACHED_BEGIN()      do {} while (0)
  #define _STARPU_MPI_TRACE_TESTING_DETACHED_END()        do {} while (0)
  #define _STARPU_MPI_TRACE_TEST_BEGIN(peer, data_tag)    do {} while (0)
  #define _STARPU_MPI_TRACE_TEST_END(peer, data_tag)      do {} while (0)
  #endif
  /*
   * Polling interval markers, de-duplicated through the `trace_loop` flag
   * that must be visible (and assignable) at the call site.
   *
   * POLLING_BEGIN: if trace_loop is zero, set it to 1 and emit
   * _STARPU_MPI_FUT_POLLING_BEGIN; otherwise do nothing.
   * POLLING_END: if trace_loop is non-zero, reset it to 0 and emit
   * _STARPU_MPI_FUT_POLLING_END; otherwise do nothing.
   *
   * Both are wrapped in do { } while (0) so that the expansion is a single
   * statement: it cannot capture an `else` following the call site, and the
   * call site provides the terminating ';'.
   */
  #define _STARPU_MPI_TRACE_POLLING_BEGIN() \
      do { \
          if (!trace_loop) { \
              trace_loop = 1; \
              FUT_FULL_PROBE1(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_POLLING_BEGIN, _starpu_gettid()); \
          } \
      } while (0)

  #define _STARPU_MPI_TRACE_POLLING_END() \
      do { \
          if (trace_loop) { \
              trace_loop = 0; \
              FUT_FULL_PROBE1(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_POLLING_END, _starpu_gettid()); \
          } \
      } while (0)
  /*
   * DRIVER_RUN interval markers.
   *
   * Each macro expands to one FUT_FULL_PROBE1() call using the
   * _STARPU_FUT_KEYMASK_MPI key mask, with the value of _starpu_gettid() as
   * the only payload.  The expansions carry no trailing ';' -- the call site
   * provides it, so that `if (c) MACRO(); else ...` stays well-formed.
   */
  #define _STARPU_MPI_TRACE_DRIVER_RUN_BEGIN() \
      FUT_FULL_PROBE1(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_DRIVER_RUN_BEGIN, _starpu_gettid())

  #define _STARPU_MPI_TRACE_DRIVER_RUN_END() \
      FUT_FULL_PROBE1(_STARPU_FUT_KEYMASK_MPI, _STARPU_MPI_FUT_DRIVER_RUN_END, _starpu_gettid())

  /*
   * Defined (empty) only in the STARPU_USE_FXT build of this header.
   * NOTE(review): presumably tested with #ifdef by other sources -- confirm
   * against its users before renaming or removing.
   */
  #define TRACE
  140. #else
  /*
   * No-op fallbacks used when STARPU_USE_FXT is not defined.
   *
   * Every macro expands to the empty statement `do {} while (0)` and never
   * evaluates its arguments.  None of the expansions carries a trailing ';'
   * -- the call site provides it -- so that all of them can be used
   * uniformly, including in `if (c) MACRO(...); else ...`.
   *
   * Parameter names mirror those of the tracing variants of the same macros.
   */

  /* Start, stop and barrier */
  #define _STARPU_MPI_TRACE_START(rank, worldsize)                                do {} while (0)
  #define _STARPU_MPI_TRACE_STOP(rank, worldsize)                                 do {} while (0)
  #define _STARPU_MPI_TRACE_BARRIER(rank, worldsize, key)                         do {} while (0)

  /* Submission of sends and receives */
  #define _STARPU_MPI_TRACE_ISEND_SUBMIT_BEGIN(dest, data_tag, size)              do {} while (0)
  #define _STARPU_MPI_TRACE_ISEND_SUBMIT_END(dest, data_tag, size, jobid, handle) do {} while (0)
  #define _STARPU_MPI_TRACE_IRECV_SUBMIT_BEGIN(src, data_tag)                     do {} while (0)
  #define _STARPU_MPI_TRACE_IRECV_SUBMIT_END(src, data_tag)                       do {} while (0)

  /* Completion and termination of sends and receives */
  #define _STARPU_MPI_TRACE_ISEND_COMPLETE_BEGIN(dest, data_tag, size)            do {} while (0)
  #define _STARPU_MPI_TRACE_COMPLETE_BEGIN(type, rank, data_tag)                  do {} while (0)
  #define _STARPU_MPI_TRACE_COMPLETE_END(type, rank, data_tag)                    do {} while (0)
  #define _STARPU_MPI_TRACE_TERMINATED(req, rank, data_tag)                       do {} while (0)
  #define _STARPU_MPI_TRACE_ISEND_COMPLETE_END(dest, data_tag, size)              do {} while (0)
  #define _STARPU_MPI_TRACE_IRECV_COMPLETE_BEGIN(src, data_tag)                   do {} while (0)
  #define _STARPU_MPI_TRACE_IRECV_COMPLETE_END(src, data_tag)                     do {} while (0)

  /* Sleep, DTESTING, UTESTING and UWAIT intervals */
  #define _STARPU_MPI_TRACE_SLEEP_BEGIN()                                         do {} while (0)
  #define _STARPU_MPI_TRACE_SLEEP_END()                                           do {} while (0)
  #define _STARPU_MPI_TRACE_DTESTING_BEGIN()                                      do {} while (0)
  #define _STARPU_MPI_TRACE_DTESTING_END()                                        do {} while (0)
  #define _STARPU_MPI_TRACE_UTESTING_BEGIN(src, data_tag)                         do {} while (0)
  #define _STARPU_MPI_TRACE_UTESTING_END(src, data_tag)                           do {} while (0)
  #define _STARPU_MPI_TRACE_UWAIT_BEGIN(src, data_tag)                            do {} while (0)
  #define _STARPU_MPI_TRACE_UWAIT_END(src, data_tag)                              do {} while (0)

  /* Data handle attributes */
  #define _STARPU_MPI_TRACE_DATA_SET_RANK(handle, rank)                           do {} while (0)
  #define _STARPU_MPI_TRACE_DATA_SET_TAG(handle, data_tag)                        do {} while (0)

  /* Detached-request testing and explicit tests */
  #define _STARPU_MPI_TRACE_TESTING_DETACHED_BEGIN()                              do {} while (0)
  #define _STARPU_MPI_TRACE_TESTING_DETACHED_END()                                do {} while (0)
  #define _STARPU_MPI_TRACE_TEST_BEGIN(peer, data_tag)                            do {} while (0)
  #define _STARPU_MPI_TRACE_TEST_END(peer, data_tag)                              do {} while (0)

  /* Polling and driver-run intervals */
  #define _STARPU_MPI_TRACE_POLLING_BEGIN()                                       do {} while (0)
  #define _STARPU_MPI_TRACE_POLLING_END()                                         do {} while (0)
  #define _STARPU_MPI_TRACE_DRIVER_RUN_BEGIN()                                    do {} while (0)
  #define _STARPU_MPI_TRACE_DRIVER_RUN_END()                                      do {} while (0)
  173. #endif
  174. #ifdef __cplusplus
  175. }
  176. #endif
  177. #endif // __STARPU_MPI_FXT_H__