codelet_and_tasks.doxy 25 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596
  1. /*
  2. * This file is part of the StarPU Handbook.
  3. * Copyright (C) 2009--2011 Université de Bordeaux 1
  4. * Copyright (C) 2010, 2011, 2012, 2013 Centre National de la Recherche Scientifique
  5. * Copyright (C) 2011, 2012 Institut National de Recherche en Informatique et Automatique
  6. * See the file version.doxy for copying conditions.
  7. */
  8. /*! \defgroup Codelet_And_Tasks Codelet And Tasks
  9. \brief This section describes the interface to manipulate codelets and tasks.
  10. \def STARPU_CPU
  11. \ingroup Codelet_And_Tasks
  12. This macro is used when setting the field starpu_codelet::where
  13. to specify the codelet may be executed on a CPU processing unit.
  14. \def STARPU_CUDA
  15. \ingroup Codelet_And_Tasks
  16. This macro is used when setting the field starpu_codelet::where
  17. to specify the codelet may be executed on a CUDA processing unit.
  18. \def STARPU_OPENCL
  19. \ingroup Codelet_And_Tasks
  20. This macro is used when setting the field starpu_codelet::where to
  21. specify the codelet may be executed on an OpenCL processing unit.
  22. \def STARPU_MULTIPLE_CPU_IMPLEMENTATIONS
  23. \deprecated
  24. \ingroup Codelet_And_Tasks
  25. Setting the field starpu_codelet::cpu_func with this macro
  26. indicates the codelet will have several implementations. The use of
  27. this macro is deprecated. One should always only define the field
  28. starpu_codelet::cpu_funcs.
  29. \def STARPU_MULTIPLE_CUDA_IMPLEMENTATIONS
  30. \deprecated
  31. \ingroup Codelet_And_Tasks
  32. Setting the field starpu_codelet::cuda_func with this macro
  33. indicates the codelet will have several implementations. The use of
  34. this macro is deprecated. One should always only define the field
  35. starpu_codelet::cuda_funcs.
  36. \def STARPU_MULTIPLE_OPENCL_IMPLEMENTATIONS
  37. \deprecated
  38. \ingroup Codelet_And_Tasks
  39. Setting the field starpu_codelet::opencl_func with
  40. this macro indicates the codelet will have several implementations.
  41. The use of this macro is deprecated. One should always only define the
  42. field starpu_codelet::opencl_funcs.
  43. \def starpu_cpu_func_t
  44. \ingroup Codelet_And_Tasks
  45. CPU implementation of a codelet.
  46. \def starpu_cuda_func_t
  47. \ingroup Codelet_And_Tasks
  48. CUDA implementation of a codelet.
  49. \def starpu_opencl_func_t
  50. \ingroup Codelet_And_Tasks
  51. OpenCL implementation of a codelet.
  52. \def starpu_mic_func_t
  53. \ingroup Codelet_And_Tasks
  54. MIC implementation of a codelet.
  55. \def starpu_scc_func_t
  56. \ingroup Codelet_And_Tasks
  57. SCC implementation of a codelet.
  58. \struct starpu_codelet
  59. \brief The codelet structure describes a kernel that is possibly
  60. implemented on various targets. For compatibility, make sure to
  61. initialize the whole structure to zero, either by using explicit
  62. memset, or the function starpu_codelet_init(), or by letting the
  63. compiler implicitly do it in e.g. static storage case.
  64. \ingroup Codelet_And_Tasks
  65. \var starpu_codelet::where
  66. Optional field to indicate which types of processing units are able to
  67. execute the codelet. The different values ::STARPU_CPU, ::STARPU_CUDA,
  68. ::STARPU_OPENCL can be combined to specify on which types of processing
  69. units the codelet can be executed. ::STARPU_CPU|::STARPU_CUDA for instance
  70. indicates that the codelet is implemented for both CPU cores and CUDA
  71. devices while ::STARPU_OPENCL indicates that it is only available on
  72. OpenCL devices. If the field is unset, its value will be automatically
  73. set based on the availability of the XXX_funcs fields defined below.
  74. \var starpu_codelet::can_execute
  75. Define a function which should return 1 if the worker designated by
  76. workerid can execute the <c>nimpl</c>th implementation of the given
  77. task, 0 otherwise.
  78. \var starpu_codelet::type
  79. Optional field to specify the type of the codelet. The default is
  80. ::STARPU_SEQ, i.e. usual sequential implementation. Other values
  81. (::STARPU_SPMD or ::STARPU_FORKJOIN) declare that a parallel implementation
  82. is also available. See \ref Parallel_Tasks for details.
  83. \var starpu_codelet::max_parallelism
  84. Optional field. If a parallel implementation is available, this
  85. denotes the maximum combined worker size that StarPU will use to
  86. execute parallel tasks for this codelet.
  87. \var starpu_codelet::cpu_func
  88. \deprecated
  89. Optional field which has been made deprecated. One should use instead
  90. the field starpu_codelet::cpu_funcs.
  91. \var starpu_codelet::cuda_func
  92. \deprecated
  93. Optional field which has been made deprecated. One should use instead
  94. the starpu_codelet::cuda_funcs field.
  95. \var starpu_codelet::opencl_func
  96. \deprecated
  97. Optional field which has been made deprecated. One should use instead
  98. the starpu_codelet::opencl_funcs field.
  99. \var starpu_codelet::cpu_funcs
  100. Optional array of function pointers to the CPU implementations of the
  101. codelet. It must be terminated by a NULL value. The functions
  102. prototype must be:
  103. \code{.c}
  104. void cpu_func(void *buffers[], void *cl_arg)
  105. \endcode
  106. The first argument being the array of data managed by the data
  107. management library, and the second argument is a pointer to the
  108. argument passed from the field starpu_task::cl_arg. If the field
  109. starpu_codelet::where is set, then the field starpu_codelet::cpu_funcs
  110. is ignored if ::STARPU_CPU does not appear in the field
  111. starpu_codelet::where, it must be non-null otherwise.
  112. \var starpu_codelet::cuda_funcs
  113. Optional array of function pointers to the CUDA implementations of the
  114. codelet. It must be terminated by a NULL value. The functions must be
  115. host-functions written in the CUDA runtime API. Their prototype must
  116. be:
  117. \code{.c}
  118. void cuda_func(void *buffers[], void *cl_arg)
  119. \endcode
  120. If the field starpu_codelet::where is set, then the field
  121. starpu_codelet::cuda_funcs is ignored if ::STARPU_CUDA does not appear
  122. in the field starpu_codelet::where, it must be non-null otherwise.
  123. \var starpu_codelet::opencl_funcs
  124. Optional array of function pointers to the OpenCL implementations of
  125. the codelet. It must be terminated by a NULL value. The functions
  126. prototype must be:
  127. \code{.c}
  128. void opencl_func(void *buffers[], void *cl_arg)
  129. \endcode
  130. If the field starpu_codelet::where is set, then the field
  131. starpu_codelet::opencl_funcs is ignored if ::STARPU_OPENCL does not
  132. appear in the field starpu_codelet::where, it must be non-null
  133. otherwise.
  134. \var starpu_codelet::nbuffers
  135. Specify the number of arguments taken by the codelet. These arguments
  136. are managed by the DSM and are accessed from the <c>void *buffers[]</c>
  137. array. The constant argument passed with the field starpu_task::cl_arg
  138. is not counted in this number. This value should not be above
  139. STARPU_NMAXBUFS.
  140. \var starpu_codelet::modes
  141. Is an array of ::starpu_data_access_mode. It describes the required
  142. access modes to the data needed by the codelet (e.g. ::STARPU_RW). The
  143. number of entries in this array must be specified in the field
  144. starpu_codelet::nbuffers, and should not exceed STARPU_NMAXBUFS. If
  145. insufficient, this value can be set with the <c>--enable-maxbuffers</c>
  146. option when configuring StarPU.
  147. \var starpu_codelet::dyn_modes
  148. Is an array of ::starpu_data_access_mode. It describes the required
  149. access modes to the data needed by the codelet (e.g. ::STARPU_RW).
  150. The number of entries in this array must be specified in the field
  151. starpu_codelet::nbuffers. This field should be used for codelets having a
  152. number of data greater than STARPU_NMAXBUFS (see \ref
  153. Setting_the_Data_Handles_for_a_Task). When defining a codelet, one
  154. should either define this field or the field starpu_codelet::modes defined above.
  155. \var starpu_codelet::model
  156. Optional pointer to the task duration performance model associated to
  157. this codelet. This optional field is ignored when set to <c>NULL</c> or when
  158. its field starpu_perfmodel::symbol is not set.
  159. \var starpu_codelet::power_model
  160. Optional pointer to the task power consumption performance model
  161. associated to this codelet. This optional field is ignored when set to
  162. <c>NULL</c> or when its field starpu_perfmodel::symbol is not set. In
  163. the case of parallel codelets, this has to account for all processing
  164. units involved in the parallel execution.
  165. \var starpu_codelet::per_worker_stats
  166. Optional array for statistics collected at runtime: this is filled by
  167. StarPU and should not be accessed directly, but for example by calling
  168. the function starpu_codelet_display_stats() (See
  169. starpu_codelet_display_stats() for details).
  170. \var starpu_codelet::name
  171. Optional name of the codelet. This can be useful for debugging
  172. purposes.
  173. \fn void starpu_codelet_init(struct starpu_codelet *cl)
  174. \ingroup Codelet_And_Tasks
  175. Initialize \p cl with default values. Codelets should
  176. preferably be initialized statically as shown in \ref
  177. Defining_a_Codelet. However such an initialisation is not always
  178. possible, e.g. when using C++.
  179. \struct starpu_data_descr
  180. \ingroup Codelet_And_Tasks
  181. \brief This type is used to describe a data handle along with an
  182. access mode.
  183. \var starpu_data_descr::handle
  184. describes a data
  185. \var starpu_data_descr::mode
  186. describes its access mode
  187. \struct starpu_task
  188. \ingroup Codelet_And_Tasks
  189. \brief The structure describes a task that can be offloaded on the
  190. various processing units managed by StarPU. It instantiates a codelet.
  191. It can either be allocated dynamically with the function
  192. starpu_task_create(), or declared statically. In the latter case, the
  193. programmer has to zero the structure starpu_task and to fill the
  194. different fields properly. The indicated default values correspond to
  195. the configuration of a task allocated with starpu_task_create().
  196. \var starpu_task::cl
  197. Is a pointer to the corresponding structure starpu_codelet. This
  198. describes where the kernel should be executed, and supplies the
  199. appropriate implementations. When set to NULL, no code is executed
  200. during the tasks, such empty tasks can be useful for synchronization
  201. purposes.
  202. \var starpu_task::buffers
  203. \deprecated
  204. This field has been made deprecated. One should use instead the
  205. field starpu_task::handles to specify the data handles accessed
  206. by the task. The access modes are now defined in the field
  207. starpu_codelet::modes.
  208. \var starpu_task::handles
  209. Is an array of starpu_data_handle_t. It specifies the handles to the
  210. different pieces of data accessed by the task. The number of entries
  211. in this array must be specified in the field starpu_codelet::nbuffers,
  212. and should not exceed STARPU_NMAXBUFS. If insufficient, this value can
  213. be set with the option <c>--enable-maxbuffers</c> when configuring
  214. StarPU.
  215. \var starpu_task::dyn_handles
  216. Is an array of starpu_data_handle_t. It specifies the handles to the
  217. different pieces of data accessed by the task. The number of entries
  218. in this array must be specified in the field starpu_codelet::nbuffers.
  219. This field should be used for tasks having a number of data greater
  220. than STARPU_NMAXBUFS (see \ref Setting_the_Data_Handles_for_a_Task).
  221. When defining a task, one should either define this field or the field
  222. starpu_task::handles defined above.
  223. \var starpu_task::interfaces
  224. The actual data pointers to the memory node where execution will
  225. happen, managed by the DSM.
  226. \var starpu_task::dyn_interfaces
  227. The actual data pointers to the memory node where execution will
  228. happen, managed by the DSM. Is used when the field
  229. starpu_task::dyn_handles is defined.
  230. \var starpu_task::cl_arg
  231. Optional pointer which is passed to the codelet through the second
  232. argument of the codelet implementation (e.g. starpu_codelet::cpu_funcs
  233. or starpu_codelet::cuda_funcs). The default value is <c>NULL</c>.
  234. \var starpu_task::cl_arg_size
  235. Optional field. For some specific drivers, the pointer
  236. starpu_task::cl_arg cannot be directly given to the driver
  237. function. A buffer of size starpu_task::cl_arg_size needs to be
  238. allocated on the driver. This buffer is then filled with the
  239. starpu_task::cl_arg_size bytes starting at address
  240. starpu_task::cl_arg. In this case, the argument given to the codelet
  241. is therefore not the starpu_task::cl_arg pointer, but the address of
  242. the buffer in local store (LS) instead. This field is ignored for CPU,
  243. CUDA and OpenCL codelets, where the starpu_task::cl_arg pointer is
  244. given as such.
  245. \var starpu_task::callback_func
  246. Optional field, the default value is <c>NULL</c>. This is a function
  247. pointer of prototype <c>void (*f)(void *)</c> which specifies a
  248. possible callback. If this pointer is non-null, the callback function
  249. is executed on the host after the execution of the task. Tasks which
  250. depend on it might already be executing. The callback is passed the
  251. value contained in the starpu_task::callback_arg field. No callback is
  252. executed if the field is set to NULL.
  253. \var starpu_task::callback_arg
  254. Optional field, the default value is <c>NULL</c>. This is the pointer
  255. passed to the callback function. This field is ignored if the
  256. callback_func is set to <c>NULL</c>.
  257. \var starpu_task::use_tag
  258. Optional field, the default value is 0. If set, this flag indicates
  259. that the task should be associated with the tag contained in the
  260. starpu_task::tag_id field. Tags allow the application to synchronize
  261. with the task and to express task dependencies easily.
  262. \var starpu_task::tag_id
  263. This optional field contains the tag associated to the task if the
  264. field starpu_task::use_tag is set, it is ignored otherwise.
  265. \var starpu_task::sequential_consistency
  266. If this flag is set (which is the default), sequential consistency is
  267. enforced for the data parameters of this task for which sequential
  268. consistency is enabled. Clearing this flag makes it possible to disable
  269. sequential consistency for this task, even if data have it enabled.
  270. \var starpu_task::synchronous
  271. If this flag is set, the function starpu_task_submit() is blocking and
  272. returns only when the task has been executed (or if no worker is able
  273. to process the task). Otherwise, starpu_task_submit() returns
  274. immediately.
  275. \var starpu_task::priority
  276. Optional field, the default value is STARPU_DEFAULT_PRIO. This field
  277. indicates a level of priority for the task. This is an integer value
  278. that must be set between the return values of the function
  279. starpu_sched_get_min_priority() for the least important tasks, and
  280. that of the function starpu_sched_get_max_priority() for the most
  281. important tasks (included). The STARPU_MIN_PRIO and STARPU_MAX_PRIO
  282. macros are provided for convenience and respectively return the value
  283. of starpu_sched_get_min_priority() and
  284. starpu_sched_get_max_priority(). Default priority is
  285. STARPU_DEFAULT_PRIO, which is always defined as 0 in order to allow
  286. static task initialization. Scheduling strategies that take priorities
  287. into account can use this parameter to take better scheduling
  288. decisions, but the scheduling policy may also ignore it.
  289. \var starpu_task::execute_on_a_specific_worker
  290. Default value is 0. If this flag is set, StarPU will bypass the
  291. scheduler and directly assign this task to the worker specified by the
  292. field starpu_task::workerid.
  293. \var starpu_task::workerid
  294. Optional field. If the field starpu_task::execute_on_a_specific_worker
  295. is set, this field indicates the identifier of the worker that should
  296. process this task (as returned by starpu_worker_get_id()). This field
  297. is ignored if the field starpu_task::execute_on_a_specific_worker is
  298. set to 0.
  299. \var starpu_task::bundle
  300. Optional field. The bundle that includes this task. If no bundle is
  301. used, this should be NULL.
  302. \var starpu_task::detach
  303. Optional field, default value is 1. If this flag is set, it is not
  304. possible to synchronize with the task by the means of starpu_task_wait()
  305. later on. Internal data structures are only guaranteed to be freed
  306. once starpu_task_wait() is called if the flag is not set.
  307. \var starpu_task::destroy
  308. Optional value. Default value is 0 for starpu_task_init(), and 1 for
  309. starpu_task_create(). If this flag is set, the task structure will
  310. automatically be freed, either after the execution of the callback if
  311. the task is detached, or during starpu_task_wait() otherwise. If this
  312. flag is not set, dynamically allocated data structures will not be
  313. freed until starpu_task_destroy() is called explicitly. Setting this
  314. flag for a statically allocated task structure will result in
  315. undefined behaviour. The flag is set to 1 when the task is created by
  316. calling starpu_task_create(). Note that starpu_task_wait_for_all()
  317. will not free any task.
  318. \var starpu_task::regenerate
  319. Optional field. If this flag is set, the task will be re-submitted to
  320. StarPU once it has been executed. This flag must not be set if the
  321. destroy flag is set.
  322. \var starpu_task::status
  323. Optional field. Current state of the task.
  324. \var starpu_task::profiling_info
  325. Optional field. Profiling information for the task.
  326. \var starpu_task::predicted
  327. Output field. Predicted duration of the task. This field is only set
  328. if the scheduling strategy uses performance models.
  329. \var starpu_task::predicted_transfer
  330. Optional field. Predicted data transfer duration for the task in
  331. microseconds. This field is only valid if the scheduling strategy uses
  332. performance models.
  333. \var starpu_task::prev
  334. \private
  335. A pointer to the previous task. This should only be used by StarPU.
  336. \var starpu_task::next
  337. \private
  338. A pointer to the next task. This should only be used by StarPU.
  339. \var starpu_task::mf_skip
  340. \private
  341. This is only used for tasks that use multiformat handles. This should
  342. only be used by StarPU.
  343. \var starpu_task::flops
  344. This can be set to the number of floating-point operations that the
  345. task will have to achieve. This is useful for easily getting GFlops
  346. curves from starpu_perfmodel_plot(), and for the hypervisor load
  347. balancing.
  348. \var starpu_task::starpu_private
  349. \private
  350. This is private to StarPU, do not modify. If the task is allocated by
  351. hand (without starpu_task_create()), this field should be set to NULL.
  352. \var starpu_task::magic
  353. \private
  354. This field is set when initializing a task. The function
  355. starpu_task_submit() will fail if the field does not have the right
  356. value. This will hence avoid submitting tasks which have not been
  357. properly initialised.
  358. \var starpu_task::sched_ctx
  359. Scheduling context.
  360. \var starpu_task::hypervisor_tag
  361. Helps the hypervisor monitor the execution of this task.
  362. \var starpu_task::scheduled
  363. Whether the scheduler has pushed the task on some queue.
  364. \fn void starpu_task_init(struct starpu_task *task)
  365. \ingroup Codelet_And_Tasks
  366. Initialize task with default values. This function is
  367. implicitly called by starpu_task_create(). By default, tasks initialized
  368. with starpu_task_init() must be deinitialized explicitly with
  369. starpu_task_clean(). Tasks can also be initialized statically, using
  370. STARPU_TASK_INITIALIZER.
  371. \def STARPU_TASK_INITIALIZER
  372. \ingroup Codelet_And_Tasks
  373. It is possible to initialize statically allocated tasks with
  374. this value. This is equivalent to initializing a structure starpu_task
  375. with the function starpu_task_init().
  376. \def STARPU_TASK_GET_HANDLE(struct starpu_task *task, int i)
  377. \ingroup Codelet_And_Tasks
  378. Return the \p i th data handle of the given task. If the task
  379. is defined with a static or dynamic number of handles, will either
  380. return the \p i th element of the field starpu_task::handles or the \p
  381. i th element of the field starpu_task::dyn_handles (see \ref
  382. Setting_the_Data_Handles_for_a_Task)
  383. \def STARPU_TASK_SET_HANDLE(struct starpu_task *task, starpu_data_handle_t handle, int i)
  384. \ingroup Codelet_And_Tasks
  385. Set the \p i th data handle of the given task with the given
  386. data handle. If the task is defined with a static or dynamic number of
  387. handles, will either set the \p i th element of the field
  388. starpu_task::handles or the \p i th element of the field
  389. starpu_task::dyn_handles (see \ref
  390. Setting_the_Data_Handles_for_a_Task)
  391. \def STARPU_CODELET_GET_MODE(struct starpu_codelet *codelet, int i)
  392. \ingroup Codelet_And_Tasks
  393. Return the access mode of the \p i th data handle of the given
  394. codelet. If the codelet is defined with a static or dynamic number of
  395. handles, will either return the \p i th element of the field
  396. starpu_codelet::modes or the \p i th element of the field
  397. starpu_codelet::dyn_modes (see \ref
  398. Setting_the_Data_Handles_for_a_Task)
  399. \def STARPU_CODELET_SET_MODE(struct starpu_codelet *codelet, enum starpu_data_access_mode mode, int i)
  400. \ingroup Codelet_And_Tasks
  401. Set the access mode of the \p i th data handle of the given
  402. codelet. If the codelet is defined with a static or dynamic number of
  403. handles, will either set the \p i th element of the field
  404. starpu_codelet::modes or the \p i th element of the field
  405. starpu_codelet::dyn_modes (see \ref
  406. Setting_the_Data_Handles_for_a_Task)
  407. \fn struct starpu_task * starpu_task_create(void)
  408. \ingroup Codelet_And_Tasks
  409. Allocate a task structure and initialize it with default
  410. values. Tasks allocated dynamically with starpu_task_create() are
  411. automatically freed when the task is terminated. This means that the
  412. task pointer can not be used any more once the task is submitted,
  413. since it can be executed at any time (unless dependencies make it
  414. wait) and thus freed at any time. If the field starpu_task::destroy is
  415. explicitly unset, the resources used by the task have to be freed by
  416. calling starpu_task_destroy().
  417. \fn struct starpu_task * starpu_task_dup(struct starpu_task *task)
  418. \ingroup Codelet_And_Tasks
  419. Allocate a task structure which is the exact duplicate of the
  420. given task.
  421. \fn void starpu_task_clean(struct starpu_task *task)
  422. \ingroup Codelet_And_Tasks
  423. Release all the structures automatically allocated to execute
  424. task, but not the task structure itself and values set by the user
  425. remain unchanged. It is thus useful for statically allocated tasks for
  426. instance. It is also useful when users want to execute the same
  427. operation several times with as little overhead as possible. It is
  428. called automatically by starpu_task_destroy(). It has to be called
  429. only after explicitly waiting for the task or after starpu_shutdown()
  430. (waiting for the callback is not enough, since StarPU still
  431. manipulates the task after calling the callback).
  432. \fn void starpu_task_destroy(struct starpu_task *task)
  433. \ingroup Codelet_And_Tasks
  434. Free the resource allocated during starpu_task_create() and
  435. associated with task. This function is already called automatically
  436. after the execution of a task when the field starpu_task::destroy is
  437. set, which is the default for tasks created by starpu_task_create().
  438. Calling this function on a statically allocated task results in
  439. undefined behaviour.
  440. \fn int starpu_task_wait(struct starpu_task *task)
  441. \ingroup Codelet_And_Tasks
  442. This function blocks until \p task has been executed. It is not
  443. possible to synchronize with a task more than once. It is not possible
  444. to wait for synchronous or detached tasks. Upon successful completion,
  445. this function returns 0. Otherwise, <c>-EINVAL</c> indicates that the
  446. specified task was either synchronous or detached.
  447. \fn int starpu_task_submit(struct starpu_task *task)
  448. \ingroup Codelet_And_Tasks
  449. This function submits task to StarPU. Calling this function
  450. does not mean that the task will be executed immediately as there can
  451. be data or task (tag) dependencies that are not fulfilled yet: StarPU
  452. will take care of scheduling this task with respect to such
  453. dependencies. This function returns immediately if the field
  454. starpu_task::synchronous is set to 0, and blocks until the
  455. termination of the task otherwise. It is also possible to synchronize
  456. the application with asynchronous tasks by the means of tags, using
  457. the function starpu_tag_wait() for instance. In case of
  458. success, this function returns 0, a return value of <c>-ENODEV</c>
  459. means that there is no worker able to process this task (e.g. there is
  460. no GPU available and this task is only implemented for CUDA devices).
  461. starpu_task_submit() can be called from anywhere, including codelet
  462. functions and callbacks, provided that the field
  463. starpu_task::synchronous is set to 0.
  464. \fn int starpu_task_wait_for_all(void)
  465. \ingroup Codelet_And_Tasks
  466. This function blocks until all the tasks that were submitted
  467. (to the current context or the global one if there aren't any) are
  468. terminated. It does not destroy these tasks.
  469. \fn int starpu_task_wait_for_all_in_ctx(unsigned sched_ctx_id)
  470. \ingroup Codelet_And_Tasks
  471. This function waits until all the tasks that were already
  472. submitted to the context \p sched_ctx_id have been executed.
  473. \fn int starpu_task_nready(void)
  474. \ingroup Codelet_And_Tasks
  475. TODO
  476. \fn int starpu_task_nsubmitted(void)
  477. \ingroup Codelet_And_Tasks
  478. Return the number of submitted tasks which have not completed yet.
  479. \fn int starpu_task_nready(void)
  480. \ingroup Codelet_And_Tasks
  481. Return the number of submitted tasks which are ready for
  482. execution or already executing. It thus does not include tasks
  483. waiting for dependencies.
  484. \fn struct starpu_task * starpu_task_get_current(void)
  485. \ingroup Codelet_And_Tasks
  486. This function returns the task currently executed by the
  487. worker, or <c>NULL</c> if it is called either from a thread that is not a
  488. task or simply because there is no task being executed at the moment.
  489. \fn void starpu_codelet_display_stats(struct starpu_codelet *cl)
  490. \ingroup Codelet_And_Tasks
  491. Output on stderr some statistics on the codelet \p cl.
  492. \fn int starpu_task_wait_for_no_ready(void)
  493. \ingroup Codelet_And_Tasks
  494. This function waits until there is no more ready task.
  495. \fn void starpu_task_set_implementation(struct starpu_task *task, unsigned impl)
  496. \ingroup Codelet_And_Tasks
  497. This function should be called by schedulers to specify the
  498. codelet implementation to be executed when executing the task.
  499. \fn unsigned starpu_task_get_implementation(struct starpu_task *task)
  500. \ingroup Codelet_And_Tasks
  501. This function returns the codelet implementation to be executed
  502. when executing the task.
  503. \fn void starpu_create_sync_task(starpu_tag_t sync_tag, unsigned ndeps, starpu_tag_t *deps, void (*callback)(void *), void *callback_arg)
  504. \ingroup Codelet_And_Tasks
  505. This creates (and submits) an empty task that unlocks a tag once all
  506. its dependencies are fulfilled.
  507. */