advanced-api.texi 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429
  1. @c -*-texinfo-*-
  2. @c This file is part of the StarPU Handbook.
  3. @c Copyright (C) 2009--2011 Universit@'e de Bordeaux 1
  4. @c Copyright (C) 2010, 2011, 2012 Centre National de la Recherche Scientifique
  5. @c Copyright (C) 2011, 2012 Institut National de Recherche en Informatique et Automatique
  6. @c See the file starpu.texi for copying conditions.
  7. @menu
  8. * Defining a new data interface::
  9. * Multiformat Data Interface::
  10. * Task Bundles::
  11. * Task Lists::
  12. * Using Parallel Tasks::
  13. * Defining a new scheduling policy::
  14. * Expert mode::
  15. @end menu
  16. @node Defining a new data interface
  17. @section Defining a new data interface
  18. @menu
  19. * Data Interface API:: Data Interface API
  20. * An example of data interface:: An example of data interface
  21. @end menu
  22. @node Data Interface API
  23. @subsection Data Interface API
  24. @deftp {Data Type} {struct starpu_data_interface_ops}
  25. @anchor{struct starpu_data_interface_ops}
  26. Defines the per-interface methods.
  27. @table @asis
  28. @item @code{int @{ram,cuda,opencl,spu@}_to_@{ram,cuda,opencl,spu@}(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);}
  29. These sixteen functions define how to copy data from the @var{src_interface}
  30. interface on the @var{src_node} node to the @var{dst_interface} interface
  31. on the @var{dst_node} node. They return 0 on success.
  32. @item @code{int (*ram_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);}
  33. Define how to copy data from the @var{src_interface} interface on the
  34. @var{src_node} node (in RAM) to the @var{dst_interface} interface on the
  35. @var{dst_node} node (on a CUDA device), using the given @var{stream}. Return 0
  36. on success.
  37. @item @code{int (*cuda_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);}
  38. Define how to copy data from the @var{src_interface} interface on the
  39. @var{src_node} node (on a CUDA device) to the @var{dst_interface} interface on the
  40. @var{dst_node} node (in RAM), using the given @var{stream}. Return 0
  41. on success.
  42. @item @code{int (*cuda_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);}
  43. Define how to copy data from the @var{src_interface} interface on the
  44. @var{src_node} node (on a CUDA device) to the @var{dst_interface} interface on
  45. the @var{dst_node} node (on another CUDA device), using the given @var{stream}.
  46. Return 0 on success.
  47. @item @code{int (*ram_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, /* cl_event * */ void *event);}
  48. Define how to copy data from the @var{src_interface} interface on the
  49. @var{src_node} node (in RAM) to the @var{dst_interface} interface on the
  50. @var{dst_node} node (on an OpenCL device), using @var{event}, a pointer to a
  51. cl_event. Return 0 on success.
  52. @item @code{int (*opencl_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, /* cl_event * */ void *event);}
  53. Define how to copy data from the @var{src_interface} interface on the
  54. @var{src_node} node (on an OpenCL device) to the @var{dst_interface} interface
  55. on the @var{dst_node} node (in RAM), using the given @var{event}, a pointer to
  56. a cl_event. Return 0 on success.
  57. @item @code{int (*opencl_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, /* cl_event * */ void *event);}
  58. Define how to copy data from the @var{src_interface} interface on the
  59. @var{src_node} node (on an OpenCL device) to the @var{dst_interface} interface
  60. on the @var{dst_node} node (on another OpenCL device), using the given
  61. @var{event}, a pointer to a cl_event. Return 0 on success.
  62. @end table
  63. @end deftp
  64. @deftp {Data Type} {struct starpu_data_copy_methods}
  65. @table @asis
  66. Per-interface data transfer methods.
  67. @item @code{void (*register_data_handle)(starpu_data_handle_t handle, uint32_t home_node, void *data_interface);}
  68. Register an existing interface into a data handle.
  69. @item @code{starpu_ssize_t (*allocate_data_on_node)(void *data_interface, uint32_t node);}
  70. Allocate data for the interface on a given node.
  71. @item @code{ void (*free_data_on_node)(void *data_interface, uint32_t node);}
  72. Free data of the interface on a given node.
  73. @item @code{ const struct starpu_data_copy_methods *copy_methods;}
  74. ram/cuda/spu/opencl synchronous and asynchronous transfer methods.
  75. @item @code{ void * (*handle_to_pointer)(starpu_data_handle_t handle, uint32_t node);}
  76. Return the current pointer (if any) for the handle on the given node.
  77. @item @code{ size_t (*get_size)(starpu_data_handle_t handle);}
  78. Return an estimation of the size of data, for performance models.
  79. @item @code{ uint32_t (*footprint)(starpu_data_handle_t handle);}
  80. Return a 32bit footprint which characterizes the data size.
  81. @item @code{ int (*compare)(void *data_interface_a, void *data_interface_b);}
  82. Compare the data size of two interfaces.
  83. @item @code{ void (*display)(starpu_data_handle_t handle, FILE *f);}
  84. Dump the sizes of a handle to a file.
  85. @item @code{ int (*convert_to_gordon)(void *data_interface, uint64_t *ptr, gordon_strideSize_t *ss); }
  86. Convert the data size to the spu size format. If no SPUs are used, this field can be seto NULL.
  87. @item @code{enum starpu_data_interface_id interfaceid;}
  88. An identifier that is unique to each interface.
  89. @item @code{size_t interface_size;}
  90. The size of the interface data descriptor.
  91. @end table
  92. @end deftp
  93. @node An example of data interface
  94. @subsection An example of data interface
  95. TODO
  96. See @code{src/datawizard/interfaces/vector_interface.c} for now.
  97. @node Multiformat Data Interface
  98. @section Multiformat Data Interface
  99. @deftp {Data Type} {struct starpu_multiformat_data_interface_ops}
  100. todo. The different fields are:
  101. @table @asis
  102. @item @code{cpu_elemsize}
  103. the size of each element on CPUs,
  104. @item @code{opencl_elemsize}
  105. the size of each element on OpenCL devices,
  106. @item @code{cuda_elemsize}
  107. the size of each element on CUDA devices,
  108. @item @code{cpu_to_opencl_cl}
  109. pointer to a codelet which converts from CPU to OpenCL
  110. @item @code{opencl_to_cpu_cl}
  111. pointer to a codelet which converts from OpenCL to CPU
  112. @item @code{cpu_to_cuda_cl}
  113. pointer to a codelet which converts from CPU to CUDA
  114. @item @code{cuda_to_cpu_cl}
  115. pointer to a codelet which converts from CUDA to CPU
  116. @end table
  117. @end deftp
  118. @deftypefun void starpu_multiformat_data_register (starpu_data_handle_t *@var{handle}, uint32_t @var{home_node}, void *@var{ptr}, uint32_t @var{nobjects}, struct starpu_multiformat_data_interface_ops *@var{format_ops})
  119. Register a piece of data that can be represented in different ways, depending upon
  120. the processing unit that manipulates it. It allows the programmer, for instance, to
  121. use an array of structures when working on a CPU, and a structure of arrays when
  122. working on a GPU.
  123. @var{nobjects} is the number of elements in the data. @var{format_ops} describes
  124. the format.
  125. @end deftypefun
  126. @node Task Bundles
  127. @section Task Bundles
  128. @deftp {Data Type} {starpu_task_bundle_t}
  129. Opaque structure describing a list of tasks that should be scheduled
  130. on the same worker whenever it's possible. It must be considered as a
  131. hint given to the scheduler as there is no guarantee that they will be
  132. executed on the same worker.
  133. @end deftp
  134. @deftypefun void starpu_task_bundle_create ({starpu_task_bundle_t *}@var{bundle})
  135. Factory function creating and initializing @var{bundle}, when the call returns, memory needed is allocated and @var{bundle} is ready to use.
  136. @end deftypefun
  137. @deftypefun int starpu_task_bundle_insert (starpu_task_bundle_t @var{bundle}, {struct starpu_task *}@var{task})
  138. Insert @var{task} in @var{bundle}. Until @var{task} is removed from @var{bundle} its expected length and data transfer time will be considered along those of the other tasks of @var{bundle}.
  139. This function mustn't be called if @var{bundle} is already closed and/or @var{task} is already submitted.
  140. @end deftypefun
  141. @deftypefun int starpu_task_bundle_remove (starpu_task_bundle_t @var{bundle}, {struct starpu_task *}@var{task})
  142. Remove @var{task} from @var{bundle}.
  143. Of course @var{task} must have been previously inserted @var{bundle}.
  144. This function mustn't be called if @var{bundle} is already closed and/or @var{task} is already submitted. Doing so would result in undefined behaviour.
  145. @end deftypefun
  146. @deftypefun void starpu_task_bundle_close (starpu_task_bundle_t @var{bundle})
  147. Inform the runtime that the user won't modify @var{bundle} anymore, it means no more inserting or removing task. Thus the runtime can destroy it when possible.
  148. @end deftypefun
  149. @node Task Lists
  150. @section Task Lists
  151. @deftp {Data Type} {struct starpu_task_list}
  152. Stores a double-chained list of tasks
  153. @end deftp
  154. @deftypefun void starpu_task_list_init ({struct starpu_task_list *}@var{list})
  155. Initialize a list structure
  156. @end deftypefun
  157. @deftypefun void starpu_task_list_push_front ({struct starpu_task_list *}@var{list}, {struct starpu_task *}@var{task})
  158. Push a task at the front of a list
  159. @end deftypefun
  160. @deftypefun void starpu_task_list_push_back ({struct starpu_task_list *}@var{list}, {struct starpu_task *}@var{task})
  161. Push a task at the back of a list
  162. @end deftypefun
  163. @deftypefun {struct starpu_task *} starpu_task_list_front ({struct starpu_task_list *}@var{list})
  164. Get the front of the list (without removing it)
  165. @end deftypefun
  166. @deftypefun {struct starpu_task *} starpu_task_list_back ({struct starpu_task_list *}@var{list})
  167. Get the back of the list (without removing it)
  168. @end deftypefun
  169. @deftypefun int starpu_task_list_empty ({struct starpu_task_list *}@var{list})
  170. Test if a list is empty
  171. @end deftypefun
  172. @deftypefun void starpu_task_list_erase ({struct starpu_task_list *}@var{list}, {struct starpu_task *}@var{task})
  173. Remove an element from the list
  174. @end deftypefun
  175. @deftypefun {struct starpu_task *} starpu_task_list_pop_front ({struct starpu_task_list *}@var{list})
  176. Remove the element at the front of the list
  177. @end deftypefun
  178. @deftypefun {struct starpu_task *} starpu_task_list_pop_back ({struct starpu_task_list *}@var{list})
  179. Remove the element at the back of the list
  180. @end deftypefun
  181. @deftypefun {struct starpu_task *} starpu_task_list_begin ({struct starpu_task_list *}@var{list})
  182. Get the first task of the list.
  183. @end deftypefun
  184. @deftypefun {struct starpu_task *} starpu_task_list_end ({struct starpu_task_list *}@var{list})
  185. Get the end of the list.
  186. @end deftypefun
  187. @deftypefun {struct starpu_task *} starpu_task_list_next ({struct starpu_task *}@var{task})
  188. Get the next task of the list. This is not erase-safe.
  189. @end deftypefun
  190. @node Using Parallel Tasks
  191. @section Using Parallel Tasks
  192. @deftypefun unsigned starpu_combined_worker_get_count (void)
  193. todo
  194. @end deftypefun
  195. @deftypefun int starpu_combined_worker_get_id (void)
  196. todo
  197. @end deftypefun
  198. @deftypefun int starpu_combined_worker_get_size (void)
  199. todo
  200. @end deftypefun
  201. @deftypefun int starpu_combined_worker_get_rank (void)
  202. todo
  203. @end deftypefun
  204. @deftypefun int starpu_combined_worker_assign_workerid (int nworkers, int workerid_array[])
  205. Register a new combined worker and get its identifier
  206. @end deftypefun
  207. @deftypefun int starpu_combined_worker_get_description (int workerid, {int *}worker_size, {int **}combined_workerid)
  208. Get the description of a combined worker
  209. @end deftypefun
  210. @deftypefun int starpu_combined_worker_can_execute_task (unsigned workerid, {struct starpu_task *}task, unsigned nimpl)
  211. Variant of starpu_worker_can_execute_task compatible with combined workers
  212. @end deftypefun
  213. @node Defining a new scheduling policy
  214. @section Defining a new scheduling policy
  215. TODO
  216. A full example showing how to define a new scheduling policy is available in
  217. the StarPU sources in the directory @code{examples/scheduler/}.
  218. @menu
  219. * Scheduling Policy API:: Scheduling Policy API
  220. * Source code::
  221. @end menu
  222. @node Scheduling Policy API
  223. @subsection Scheduling Policy API
  224. @deftp {Data Type} {struct starpu_machine_topology}
  225. TODO
  226. @end deftp
  227. @deftp {Data Type} {struct starpu_sched_policy}
  228. This structure contains all the methods that implement a scheduling policy. An
  229. application may specify which scheduling strategy in the @code{sched_policy}
  230. field of the @code{starpu_conf} structure passed to the @code{starpu_init}
  231. function. The different fields are:
  232. @table @asis
  233. @item @code{init_sched}
  234. Initialize the scheduling policy.
  235. @item @code{deinit_sched}
  236. Cleanup the scheduling policy.
  237. @item @code{push_task}
  238. Insert a task into the scheduler.
  239. @item @code{push_task_notify}
  240. Notify the scheduler that a task was pushed on a given worker. This method is
  241. called when a task that was explicitely assigned to a worker becomes ready and
  242. is about to be executed by the worker. This method therefore permits to keep
  243. the state of of the scheduler coherent even when StarPU bypasses the scheduling
  244. strategy.
  245. @item @code{pop_task} (optional)
  246. Get a task from the scheduler. The mutex associated to the worker is already
  247. taken when this method is called. If this method is defined as @code{NULL}, the
  248. worker will only execute tasks from its local queue. In this case, the
  249. @code{push_task} method should use the @code{starpu_push_local_task} method to
  250. assign tasks to the different workers.
  251. @item @code{pop_every_task}
  252. Remove all available tasks from the scheduler (tasks are chained by the means
  253. of the prev and next fields of the starpu_task structure). The mutex associated
  254. to the worker is already taken when this method is called. This is currently
  255. only used by the Gordon driver.
  256. @item @code{post_exec_hook} (optional)
  257. This method is called every time a task has been executed.
  258. @item @code{policy_name}
  259. Name of the policy (optional).
  260. @item @code{policy_description}
  261. Description of the policy (optional).
  262. @end table
  263. @end deftp
  264. @deftypefun void starpu_worker_set_sched_condition (int @var{workerid}, pthread_cond_t *@var{sched_cond}, pthread_mutex_t *@var{sched_mutex})
  265. This function specifies the condition variable associated to a worker
  266. When there is no available task for a worker, StarPU blocks this worker on a
  267. condition variable. This function specifies which condition variable (and the
  268. associated mutex) should be used to block (and to wake up) a worker. Note that
  269. multiple workers may use the same condition variable. For instance, in the case
  270. of a scheduling strategy with a single task queue, the same condition variable
  271. would be used to block and wake up all workers.
  272. The initialization method of a scheduling strategy (@code{init_sched}) must
  273. call this function once per worker.
  274. @end deftypefun
  275. @deftypefun void starpu_sched_set_min_priority (int @var{min_prio})
  276. Defines the minimum priority level supported by the scheduling policy. The
  277. default minimum priority level is the same as the default priority level which
  278. is 0 by convention. The application may access that value by calling the
  279. @code{starpu_sched_get_min_priority} function. This function should only be
  280. called from the initialization method of the scheduling policy, and should not
  281. be used directly from the application.
  282. @end deftypefun
  283. @deftypefun void starpu_sched_set_max_priority (int @var{max_prio})
  284. Defines the maximum priority level supported by the scheduling policy. The
  285. default maximum priority level is 1. The application may access that value by
  286. calling the @code{starpu_sched_get_max_priority} function. This function should
  287. only be called from the initialization method of the scheduling policy, and
  288. should not be used directly from the application.
  289. @end deftypefun
  290. @deftypefun int starpu_sched_get_min_priority (void)
  291. Returns the current minimum priority level supported by the
  292. scheduling policy
  293. @end deftypefun
  294. @deftypefun int starpu_sched_get_max_priority (void)
  295. Returns the current maximum priority level supported by the
  296. scheduling policy
  297. @end deftypefun
  298. @deftypefun int starpu_push_local_task (int @var{workerid}, {struct starpu_task} *@var{task}, int @var{back})
  299. The scheduling policy may put tasks directly into a worker's local queue so
  300. that it is not always necessary to create its own queue when the local queue
  301. is sufficient. If @var{back} not null, @var{task} is put at the back of the queue
  302. where the worker will pop tasks first. Setting @var{back} to 0 therefore ensures
  303. a FIFO ordering.
  304. @end deftypefun
  305. @deftypefun int starpu_worker_can_execute_task (unsigned @var{workerid}, {struct starpu_task *}@var{task}, unsigned {nimpl})
  306. Check if the worker specified by workerid can execute the codelet. Schedulers need to call it before assigning a task to a worker, otherwise the task may fail to execute.
  307. @end deftypefun
  308. @deftypefun double starpu_timing_now (void)
  309. Return the current date in µs
  310. @end deftypefun
  311. @deftypefun double starpu_task_expected_length ({struct starpu_task *}@var{task}, {enum starpu_perf_archtype} @var{arch}, unsigned @var{nimpl})
  312. Returns expected task duration in µs
  313. @end deftypefun
  314. @deftypefun double starpu_worker_get_relative_speedup ({enum starpu_perf_archtype} @var{perf_archtype})
  315. Returns an estimated speedup factor relative to CPU speed
  316. @end deftypefun
  317. @deftypefun double starpu_task_expected_data_transfer_time (uint32_t @var{memory_node}, {struct starpu_task *}@var{task})
  318. Returns expected data transfer time in µs
  319. @end deftypefun
  320. @deftypefun double starpu_data_expected_transfer_time (starpu_data_handle_t @var{handle}, unsigned @var{memory_node}, {enum starpu_access_mode} @var{mode})
  321. Predict the transfer time (in µs) to move a handle to a memory node
  322. @end deftypefun
  323. @deftypefun double starpu_task_expected_power ({struct starpu_task *}@var{task}, {enum starpu_perf_archtype} @var{arch}, unsigned @var{nimpl})
  324. Returns expected power consumption in J
  325. @end deftypefun
  326. @deftypefun double starpu_task_expected_conversion_time ({struct starpu_task *}@var{task}, {enum starpu_perf_archtype} @var{arch}, unsigned {nimpl})
  327. Returns expected conversion time in ms (multiformat interface only)
  328. @end deftypefun
  329. @node Source code
  330. @subsection Source code
  331. @cartouche
  332. @smallexample
  333. static struct starpu_sched_policy dummy_sched_policy = @{
  334. .init_sched = init_dummy_sched,
  335. .deinit_sched = deinit_dummy_sched,
  336. .push_task = push_task_dummy,
  337. .push_prio_task = NULL,
  338. .pop_task = pop_task_dummy,
  339. .post_exec_hook = NULL,
  340. .pop_every_task = NULL,
  341. .policy_name = "dummy",
  342. .policy_description = "dummy scheduling strategy"
  343. @};
  344. @end smallexample
  345. @end cartouche
  346. @node Expert mode
  347. @section Expert mode
  348. @deftypefun void starpu_wake_all_blocked_workers (void)
  349. todo
  350. @end deftypefun
  351. @deftypefun int starpu_progression_hook_register (unsigned (*@var{func})(void *arg), void *@var{arg})
  352. todo
  353. @end deftypefun
  354. @deftypefun void starpu_progression_hook_deregister (int @var{hook_id})
  355. todo
  356. @end deftypefun