advanced-api.texi 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396
  1. @c -*-texinfo-*-
  2. @c This file is part of the StarPU Handbook.
  3. @c Copyright (C) 2009--2011 Universit@'e de Bordeaux 1
  4. @c Copyright (C) 2010, 2011, 2012 Centre National de la Recherche Scientifique
  5. @c Copyright (C) 2011, 2012 Institut National de Recherche en Informatique et Automatique
  6. @c See the file starpu.texi for copying conditions.
  7. @menu
  8. * Defining a new data interface::
  9. * Multiformat Data Interface::
  10. * Task Bundles::
  11. * Task Lists::
  12. * Defining a new scheduling policy::
  13. * Expert mode::
  14. @end menu
  15. @node Defining a new data interface
  16. @section Defining a new data interface
  17. @menu
  18. * Data Interface API:: Data Interface API
  19. * An example of data interface:: An example of data interface
  20. @end menu
  21. @node Data Interface API
  22. @subsection Data Interface API
  23. @deftp {Data Type} {struct starpu_data_interface_ops}
  24. @anchor{struct starpu_data_interface_ops}
  25. Defines the per-interface methods.
  26. @table @asis
  27. @item @code{int @{ram,cuda,opencl,spu@}_to_@{ram,cuda,opencl,spu@}(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);}
  28. These sixteen functions define how to copy data from the @var{src_interface}
  29. interface on the @var{src_node} node to the @var{dst_interface} interface
  30. on the @var{dst_node} node. They return 0 on success.
  31. @item @code{int (*ram_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);}
  32. Define how to copy data from the @var{src_interface} interface on the
  33. @var{src_node} node (in RAM) to the @var{dst_interface} interface on the
  34. @var{dst_node} node (on a CUDA device), using the given @var{stream}. Return 0
  35. on success.
  36. @item @code{int (*cuda_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);}
  37. Define how to copy data from the @var{src_interface} interface on the
  38. @var{src_node} node (on a CUDA device) to the @var{dst_interface} interface on the
  39. @var{dst_node} node (in RAM), using the given @var{stream}. Return 0
  40. on success.
  41. @item @code{int (*cuda_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);}
  42. Define how to copy data from the @var{src_interface} interface on the
  43. @var{src_node} node (on a CUDA device) to the @var{dst_interface} interface on
  44. the @var{dst_node} node (on another CUDA device), using the given @var{stream}.
  45. Return 0 on success.
  46. @item @code{int (*ram_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, /* cl_event * */ void *event);}
  47. Define how to copy data from the @var{src_interface} interface on the
  48. @var{src_node} node (in RAM) to the @var{dst_interface} interface on the
  49. @var{dst_node} node (on an OpenCL device), using @var{event}, a pointer to a
  50. cl_event. Return 0 on success.
  51. @item @code{int (*opencl_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, /* cl_event * */ void *event);}
  52. Define how to copy data from the @var{src_interface} interface on the
  53. @var{src_node} node (on an OpenCL device) to the @var{dst_interface} interface
  54. on the @var{dst_node} node (in RAM), using the given @var{event}, a pointer to
  55. a cl_event. Return 0 on success.
  56. @item @code{int (*opencl_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, /* cl_event * */ void *event);}
  57. Define how to copy data from the @var{src_interface} interface on the
  58. @var{src_node} node (on an OpenCL device) to the @var{dst_interface} interface
  59. on the @var{dst_node} node (on another OpenCL device), using the given
  60. @var{event}, a pointer to a cl_event. Return 0 on success.
  61. @end table
  62. @end deftp
  63. @deftp {Data Type} {struct starpu_data_copy_methods}
  64. @table @asis
  65. Per-interface data transfer methods.
  66. @item @code{void (*register_data_handle)(starpu_data_handle_t handle, uint32_t home_node, void *data_interface);}
  67. Register an existing interface into a data handle.
  68. @item @code{starpu_ssize_t (*allocate_data_on_node)(void *data_interface, uint32_t node);}
  69. Allocate data for the interface on a given node.
  70. @item @code{ void (*free_data_on_node)(void *data_interface, uint32_t node);}
  71. Free data of the interface on a given node.
  72. @item @code{ const struct starpu_data_copy_methods *copy_methods;}
  73. ram/cuda/spu/opencl synchronous and asynchronous transfer methods.
  74. @item @code{ void * (*handle_to_pointer)(starpu_data_handle_t handle, uint32_t node);}
  75. Return the current pointer (if any) for the handle on the given node.
  76. @item @code{ size_t (*get_size)(starpu_data_handle_t handle);}
  77. Return an estimation of the size of data, for performance models.
  78. @item @code{ uint32_t (*footprint)(starpu_data_handle_t handle);}
  79. Return a 32bit footprint which characterizes the data size.
  80. @item @code{ int (*compare)(void *data_interface_a, void *data_interface_b);}
  81. Compare the data size of two interfaces.
  82. @item @code{ void (*display)(starpu_data_handle_t handle, FILE *f);}
  83. Dump the sizes of a handle to a file.
  84. @item @code{ int (*convert_to_gordon)(void *data_interface, uint64_t *ptr, gordon_strideSize_t *ss); }
  85. Convert the data size to the spu size format. If no SPUs are used, this field can be seto NULL.
  86. @item @code{enum starpu_data_interface_id interfaceid;}
  87. An identifier that is unique to each interface.
  88. @item @code{size_t interface_size;}
  89. The size of the interface data descriptor.
  90. @end table
  91. @end deftp
  92. @node An example of data interface
  93. @subsection An example of data interface
  94. TODO
  95. See @code{src/datawizard/interfaces/vector_interface.c} for now.
  96. @node Multiformat Data Interface
  97. @section Multiformat Data Interface
  98. @deftp {Data Type} {struct starpu_multiformat_data_interface_ops}
  99. todo. The different fields are:
  100. @table @asis
  101. @item @code{cpu_elemsize}
  102. the size of each element on CPUs,
  103. @item @code{opencl_elemsize}
  104. the size of each element on OpenCL devices,
  105. @item @code{cuda_elemsize}
  106. the size of each element on CUDA devices,
  107. @item @code{cpu_to_opencl_cl}
  108. pointer to a codelet which converts from CPU to OpenCL
  109. @item @code{opencl_to_cpu_cl}
  110. pointer to a codelet which converts from OpenCL to CPU
  111. @item @code{cpu_to_cuda_cl}
  112. pointer to a codelet which converts from CPU to CUDA
  113. @item @code{cuda_to_cpu_cl}
  114. pointer to a codelet which converts from CUDA to CPU
  115. @end table
  116. @end deftp
  117. @deftypefun void starpu_multiformat_data_register (starpu_data_handle_t *@var{handle}, uint32_t @var{home_node}, void *@var{ptr}, uint32_t @var{nobjects}, struct starpu_multiformat_data_interface_ops *@var{format_ops});
  118. Register a piece of data that can be represented in different ways, depending upon
  119. the processing unit that manipulates it. It allows the programmer, for instance, to
  120. use an array of structures when working on a CPU, and a structure of arrays when
  121. working on a GPU.
  122. @var{nobjects} is the number of elements in the data. @var{format_ops} describes
  123. the format.
  124. @end deftypefun
  125. @node Task Bundles
  126. @section Task Bundles
  127. @deftp {Data Type} starpu_task_bundle_t
  128. Opaque structure describing a list of tasks that should be scheduled
  129. on the same worker whenever it's possible. It must be considered as a
  130. hint given to the scheduler as there is no guarantee that they will be
  131. executed on the same worker.
  132. @end deftp
  133. @deftypefun void starpu_task_bundle_create ({starpu_task_bundle_t *}@var{bundle})
  134. Factory function creating and initializing @var{bundle}, when the call returns, memory needed is allocated and @var{bundle} is ready to use.
  135. @end deftypefun
  136. @deftypefun int starpu_task_bundle_insert (starpu_task_bundle_t @var{bundle}, {struct starpu_task *}@var{task})
  137. Insert @var{task} in @var{bundle}. Until @var{task} is removed from @var{bundle} its expected length and data transfer time will be considered along those of the other tasks of @var{bundle}.
  138. This function mustn't be called if @var{bundle} is already closed and/or @var{task} is already submitted.
  139. @end deftypefun
  140. @deftypefun int starpu_task_bundle_remove (starpu_task_bundle_t @var{bundle}, {struct starpu_task *}@var{task})
  141. Remove @var{task} from @var{bundle}.
  142. Of course @var{task} must have been previously inserted @var{bundle}.
  143. This function mustn't be called if @var{bundle} is already closed and/or @var{task} is already submitted. Doing so would result in undefined behaviour.
  144. @end deftypefun
  145. @deftypefun void starpu_task_bundle_close (starpu_task_bundle_t @var{bundle});
  146. Inform the runtime that the user won't modify @var{bundle} anymore, it means no more inserting or removing task. Thus the runtime can destroy it when possible.
  147. @end deftypefun
  148. @node Task Lists
  149. @section Task Lists
  150. @deftp {Data Type} {struct starpu_task_list}
  151. Stores a double-chained list of tasks
  152. @end deftp
  153. @deftypefun void starpu_task_list_init ({struct starpu_task_list *}@var{list})
  154. Initialize a list structure
  155. @end deftypefun
  156. @deftypefun void starpu_task_list_push_front ({struct starpu_task_list *}@var{list}, {struct starpu_task *}@var{task})
  157. Push a task at the front of a list
  158. @end deftypefun
  159. @deftypefun void starpu_task_list_push_back ({struct starpu_task_list *}@var{list}, {struct starpu_task *}@var{task})
  160. Push a task at the back of a list
  161. @end deftypefun
  162. @deftypefun {struct starpu_task *} starpu_task_list_front ({struct starpu_task_list *}@var{list})
  163. Get the front of the list (without removing it)
  164. @end deftypefun
  165. @deftypefun {struct starpu_task *} starpu_task_list_back ({struct starpu_task_list *}@var{list})
  166. Get the back of the list (without removing it)
  167. @end deftypefun
  168. @deftypefun int starpu_task_list_empty ({struct starpu_task_list *}@var{list})
  169. Test if a list is empty
  170. @end deftypefun
  171. @deftypefun void starpu_task_list_erase ({struct starpu_task_list *}@var{list}, {struct starpu_task *}@var{task})
  172. Remove an element from the list
  173. @end deftypefun
  174. @deftypefun {struct starpu_task *} starpu_task_list_pop_front ({struct starpu_task_list *}@var{list})
  175. Remove the element at the front of the list
  176. @end deftypefun
  177. @deftypefun {struct starpu_task *} starpu_task_list_pop_back ({struct starpu_task_list *}@var{list})
  178. Remove the element at the back of the list
  179. @end deftypefun
  180. @deftypefun {struct starpu_task *} starpu_task_list_begin ({struct starpu_task_list *}@var{list})
  181. Get the first task of the list.
  182. @end deftypefun
  183. @deftypefun {struct starpu_task *} starpu_task_list_end ({struct starpu_task_list *}@var{list})
  184. Get the end of the list.
  185. @end deftypefun
  186. @deftypefun {struct starpu_task *} starpu_task_list_next ({struct starpu_task *}@var{task})
  187. Get the next task of the list. This is not erase-safe.
  188. @end deftypefun
  189. @node Defining a new scheduling policy
  190. @section Defining a new scheduling policy
  191. TODO
  192. A full example showing how to define a new scheduling policy is available in
  193. the StarPU sources in the directory @code{examples/scheduler/}.
  194. @menu
  195. * Scheduling Policy API:: Scheduling Policy API
  196. * Source code::
  197. @end menu
  198. @node Scheduling Policy API
  199. @subsection Scheduling Policy API
  200. @deftp {Data Type} {struct starpu_machine_topology}
  201. TODO
  202. @end deftp
  203. @deftp {Data Type} {struct starpu_sched_policy}
  204. This structure contains all the methods that implement a scheduling policy. An
  205. application may specify which scheduling strategy in the @code{sched_policy}
  206. field of the @code{starpu_conf} structure passed to the @code{starpu_init}
  207. function. The different fields are:
  208. @table @asis
  209. @item @code{init_sched}
  210. Initialize the scheduling policy.
  211. @item @code{deinit_sched}
  212. Cleanup the scheduling policy.
  213. @item @code{push_task}
  214. Insert a task into the scheduler.
  215. @item @code{push_task_notify}
  216. Notify the scheduler that a task was pushed on a given worker. This method is
  217. called when a task that was explicitely assigned to a worker becomes ready and
  218. is about to be executed by the worker. This method therefore permits to keep
  219. the state of of the scheduler coherent even when StarPU bypasses the scheduling
  220. strategy.
  221. @item @code{pop_task} (optional)
  222. Get a task from the scheduler. The mutex associated to the worker is already
  223. taken when this method is called. If this method is defined as @code{NULL}, the
  224. worker will only execute tasks from its local queue. In this case, the
  225. @code{push_task} method should use the @code{starpu_push_local_task} method to
  226. assign tasks to the different workers.
  227. @item @code{pop_every_task}
  228. Remove all available tasks from the scheduler (tasks are chained by the means
  229. of the prev and next fields of the starpu_task structure). The mutex associated
  230. to the worker is already taken when this method is called. This is currently
  231. only used by the Gordon driver.
  232. @item @code{post_exec_hook} (optional)
  233. This method is called every time a task has been executed.
  234. @item @code{policy_name}
  235. Name of the policy (optional).
  236. @item @code{policy_description}
  237. Description of the policy (optional).
  238. @end table
  239. @end deftp
  240. @deftypefun void starpu_worker_set_sched_condition (int @var{workerid}, pthread_cond_t *@var{sched_cond}, pthread_mutex_t *@var{sched_mutex})
  241. This function specifies the condition variable associated to a worker
  242. When there is no available task for a worker, StarPU blocks this worker on a
  243. condition variable. This function specifies which condition variable (and the
  244. associated mutex) should be used to block (and to wake up) a worker. Note that
  245. multiple workers may use the same condition variable. For instance, in the case
  246. of a scheduling strategy with a single task queue, the same condition variable
  247. would be used to block and wake up all workers.
  248. The initialization method of a scheduling strategy (@code{init_sched}) must
  249. call this function once per worker.
  250. @end deftypefun
  251. @deftypefun void starpu_sched_set_min_priority (int @var{min_prio})
  252. Defines the minimum priority level supported by the scheduling policy. The
  253. default minimum priority level is the same as the default priority level which
  254. is 0 by convention. The application may access that value by calling the
  255. @code{starpu_sched_get_min_priority} function. This function should only be
  256. called from the initialization method of the scheduling policy, and should not
  257. be used directly from the application.
  258. @end deftypefun
  259. @deftypefun void starpu_sched_set_max_priority (int @var{max_prio})
  260. Defines the maximum priority level supported by the scheduling policy. The
  261. default maximum priority level is 1. The application may access that value by
  262. calling the @code{starpu_sched_get_max_priority} function. This function should
  263. only be called from the initialization method of the scheduling policy, and
  264. should not be used directly from the application.
  265. @end deftypefun
  266. @deftypefun int starpu_sched_get_min_priority (void)
  267. Returns the current minimum priority level supported by the
  268. scheduling policy
  269. @end deftypefun
  270. @deftypefun int starpu_sched_get_max_priority (void)
  271. Returns the current maximum priority level supported by the
  272. scheduling policy
  273. @end deftypefun
  274. @deftypefun int starpu_push_local_task (int @var{workerid}, {struct starpu_task} *@var{task}, int @var{back})
  275. The scheduling policy may put tasks directly into a worker's local queue so
  276. that it is not always necessary to create its own queue when the local queue
  277. is sufficient. If @var{back} not null, @var{task} is put at the back of the queue
  278. where the worker will pop tasks first. Setting @var{back} to 0 therefore ensures
  279. a FIFO ordering.
  280. @end deftypefun
  281. @deftypefun int starpu_worker_can_execute_task (unsigned @var{workerid}, {struct starpu_task *}@var{task}, unsigned {nimpl})
  282. Check if the worker specified by workerid can execute the codelet. Schedulers need to call it before assigning a task to a worker, otherwise the task may fail to execute.
  283. @end deftypefun
  284. @deftypefun double starpu_timing_now (void)
  285. Return the current date in µs
  286. @end deftypefun
  287. @deftypefun double starpu_task_expected_length ({struct starpu_task *}@var{task}, {enum starpu_perf_archtype} @var{arch}, unsigned @var{nimpl})
  288. Returns expected task duration in µs
  289. @end deftypefun
  290. @deftypefun double starpu_worker_get_relative_speedup ({enum starpu_perf_archtype} @var{perf_archtype})
  291. Returns an estimated speedup factor relative to CPU speed
  292. @end deftypefun
  293. @deftypefun double starpu_task_expected_data_transfer_time (uint32_t @var{memory_node}, {struct starpu_task *}@var{task})
  294. Returns expected data transfer time in µs
  295. @end deftypefun
  296. @deftypefun double starpu_data_expected_transfer_time (starpu_data_handle_t @var{handle}, unsigned @var{memory_node}, {enum starpu_access_mode} @var{mode})
  297. Predict the transfer time (in µs) to move a handle to a memory node
  298. @end deftypefun
  299. @deftypefun double starpu_task_expected_power ({struct starpu_task *}@var{task}, {enum starpu_perf_archtype} @var{arch}, unsigned @var{nimpl})
  300. Returns expected power consumption in J
  301. @end deftypefun
  302. @deftypefun double starpu_task_expected_conversion_time ({struct starpu_task *}@var{task}, {enum starpu_perf_archtype} @var{arch}, unsigned {nimpl})
  303. Returns expected conversion time in ms (multiformat interface only)
  304. @end deftypefun
  305. @node Source code
  306. @subsection Source code
  307. @cartouche
  308. @smallexample
  309. static struct starpu_sched_policy dummy_sched_policy = @{
  310. .init_sched = init_dummy_sched,
  311. .deinit_sched = deinit_dummy_sched,
  312. .push_task = push_task_dummy,
  313. .push_prio_task = NULL,
  314. .pop_task = pop_task_dummy,
  315. .post_exec_hook = NULL,
  316. .pop_every_task = NULL,
  317. .policy_name = "dummy",
  318. .policy_description = "dummy scheduling strategy"
  319. @};
  320. @end smallexample
  321. @end cartouche
  322. @node Expert mode
  323. @section Expert mode
  324. @deftypefun void starpu_wake_all_blocked_workers (void)
  325. todo
  326. @end deftypefun
  327. @deftypefun int starpu_progression_hook_register (unsigned (*@var{func})(void *arg), void *@var{arg})
  328. todo
  329. @end deftypefun
  330. @deftypefun void starpu_progression_hook_deregister (int @var{hook_id})
  331. todo
  332. @end deftypefun