starpu_data_interfaces.h 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2010-2012 Université de Bordeaux 1
  4. * Copyright (C) 2010, 2011, 2012 Centre National de la Recherche Scientifique
  5. * Copyright (C) 2011-2012 Institut National de Recherche en Informatique et Automatique
  6. *
  7. * StarPU is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU Lesser General Public License as published by
  9. * the Free Software Foundation; either version 2.1 of the License, or (at
  10. * your option) any later version.
  11. *
  12. * StarPU is distributed in the hope that it will be useful, but
  13. * WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  15. *
  16. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  17. */
  18. #ifndef __STARPU_DATA_INTERFACES_H__
  19. #define __STARPU_DATA_INTERFACES_H__
  20. #include <starpu.h>
  21. #ifdef STARPU_USE_GORDON
  22. /* to get the gordon_strideSize_t data structure from gordon */
  23. #include <gordon.h>
  24. #endif
  25. #ifdef STARPU_USE_CUDA
  26. /* to use CUDA streams */
  27. # ifdef STARPU_DONT_INCLUDE_CUDA_HEADERS
  28. typedef void *cudaStream_t;
  29. # else
  30. # include <cuda_runtime.h>
  31. # endif
  32. #endif
  33. #ifdef __cplusplus
  34. extern "C"
  35. {
  36. #endif
  37. /* The following structures are used to describe data interfaces */
  /*
   * Transfer callbacks of a data interface, one per (source, destination)
   * pair of memory-node kinds: ram, cuda, opencl and spu.
   *
   * Each callback takes the source interface and its memory node, then the
   * destination interface and its memory node. The *_async variants take one
   * extra argument: a cudaStream_t for CUDA, a cl_event pointer for OpenCL.
   *
   * The async members only exist when the matching STARPU_USE_* macro is
   * defined, so the layout of this structure depends on the build
   * configuration.
   *
   * NOTE(review): the meaning of the int return value is not stated in this
   * header -- confirm against the implementations.
   */
  struct starpu_data_copy_methods
  {
      /* source is ram */
      int (*ram_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*ram_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*ram_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*ram_to_spu)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

      /* source is cuda */
      int (*cuda_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*cuda_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*cuda_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*cuda_to_spu)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

      /* source is spu */
      int (*spu_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*spu_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*spu_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*spu_to_spu)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

      /* source is opencl */
      int (*opencl_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*opencl_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*opencl_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*opencl_to_spu)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

  #ifdef STARPU_USE_CUDA
      /* asynchronous CUDA transfers */
      int (*ram_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);
      int (*cuda_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);
      int (*cuda_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);
  #endif

  #if defined(STARPU_USE_OPENCL) && !defined(__CUDACC__)
      /* asynchronous OpenCL transfers; left out when __CUDACC__ is defined */
      int (*ram_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cl_event *event);
      int (*opencl_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cl_event *event);
      int (*opencl_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cl_event *event);
  #endif
  };
  /*
   * Identifiers of the data interfaces declared in this header. Values are
   * explicit and contiguous, starting at 0; STARPU_MAX_INTERFACE_ID is the
   * number of identifiers listed here.
   */
  enum starpu_data_interface_id
  {
      STARPU_MATRIX_INTERFACE_ID      = 0,
      STARPU_BLOCK_INTERFACE_ID       = 1,
      STARPU_VECTOR_INTERFACE_ID      = 2,
      STARPU_CSR_INTERFACE_ID         = 3,
      STARPU_BCSR_INTERFACE_ID        = 4,
      STARPU_VARIABLE_INTERFACE_ID    = 5,
      STARPU_VOID_INTERFACE_ID        = 6,
      STARPU_MULTIFORMAT_INTERFACE_ID = 7,
      STARPU_MAX_INTERFACE_ID         = 8 /* maximum number of data interfaces */
  };
  87. struct starpu_data_interface_ops
  88. {
  89. /* Register an existing interface into a data handle. */
  90. void (*register_data_handle)(starpu_data_handle_t handle,
  91. uint32_t home_node, void *data_interface);
  92. /* Allocate data for the interface on a given node. */
  93. starpu_ssize_t (*allocate_data_on_node)(void *data_interface, uint32_t node);
  94. /* Free data of the interface on a given node. */
  95. void (*free_data_on_node)(void *data_interface, uint32_t node);
  96. /* ram/cuda/spu/opencl synchronous and asynchronous transfer methods */
  97. struct starpu_data_copy_methods *copy_methods;
  98. /* Return the current pointer (if any) for the handle on the given node. */
  99. void * (*handle_to_pointer)(starpu_data_handle_t handle, uint32_t node);
  100. /* Return an estimation of the size of data, for performance models */
  101. size_t (*get_size)(starpu_data_handle_t handle);
  102. /* Return a 32bit footprint which characterizes the data size */
  103. uint32_t (*footprint)(starpu_data_handle_t handle);
  104. /* Compare the data size of two interfaces */
  105. int (*compare)(void *data_interface_a, void *data_interface_b);
  106. /* Dump the sizes of a handle to a file */
  107. void (*display)(starpu_data_handle_t handle, FILE *f);
  108. #ifdef STARPU_USE_GORDON
  109. /* Convert the data size to the spu size format */
  110. int (*convert_to_gordon)(void *data_interface, uint64_t *ptr, gordon_strideSize_t *ss);
  111. #endif
  112. /* an identifier that is unique to each interface */
  113. enum starpu_data_interface_id interfaceid;
  114. /* The size of the interface data descriptor */
  115. size_t interface_size;
  116. int is_multiformat;
  117. struct starpu_multiformat_data_interface_ops* (*get_mf_ops)(void *data_interface);
  118. /* Pack the data handle into a contiguous buffer at the address ptr */
  119. int (*pack_data)(starpu_data_handle_t handle, uint32_t node, void **ptr);
  120. /* Unpack the data handle from the contiguous buffer at the address ptr */
  121. int (*unpack_data)(starpu_data_handle_t handle, uint32_t node, void *ptr);
  122. };
  123. /* Return the next available id for a data interface */
  124. int starpu_data_interface_get_next_id(void);
  125. void starpu_data_register(starpu_data_handle_t *handleptr, uint32_t home_node, void *data_interface, struct starpu_data_interface_ops *ops);
  126. void starpu_data_register_same(starpu_data_handle_t *handledst, starpu_data_handle_t handlesrc);
  127. /* Return the pointer associated with HANDLE on node NODE or NULL if HANDLE's
  128. * interface does not support this operation or data for this handle is not
  129. * allocated on that node. */
  130. void *starpu_handle_to_pointer(starpu_data_handle_t handle, uint32_t node);
  131. /* Return the local pointer associated with HANDLE or NULL if HANDLE's
  132. * interface does not have data allocated locally */
  133. void *starpu_handle_get_local_ptr(starpu_data_handle_t handle);
  134. /* "node" means memory node: 0 for main RAM, then 1, 2, etc. for various GPUs,
  135. * etc.
  136. *
  137. * On registration, the source of data is usually a pointer in RAM, in which
  138. * case 0 should be passed.
  139. */
  140. void *starpu_data_get_interface_on_node(starpu_data_handle_t handle, unsigned memory_node);
  /*
   * Operations of the matrix interface. This is a private object (leading
   * underscore) that is nevertheless declared here; the warning below,
   * emitted in STARPU_DEVEL builds, explains why.
   */
  #ifdef STARPU_DEVEL
  # warning the declaration below is needed for the spvm example (dw_block_spmv.c:110) which filters a data in sub-data with a different interface. However exposing a private object is certainly not something to do. Either turn the object public or find another way to specify interfaces when filtering
  #endif /* STARPU_DEVEL */
  extern struct starpu_data_interface_ops _starpu_interface_matrix_ops;
  /*
   * Matrix interface for dense matrices.
   *
   * NOTE(review): the per-field notes are inferred from the member names --
   * confirm against the implementation.
   */
  struct starpu_matrix_interface
  {
      uintptr_t ptr;        /* presumably the address of the matrix data */
      uintptr_t dev_handle; /* presumably a device-side handle for the buffer */
      size_t offset;        /* presumably an offset relative to dev_handle */
      uint32_t nx;          /* size along x */
      uint32_t ny;          /* size along y */
      uint32_t ld;          /* presumably the leading dimension, in elements */
      size_t elemsize;      /* size of one element */
  };
  156. void starpu_matrix_data_register(starpu_data_handle_t *handle, uint32_t home_node, uintptr_t ptr, uint32_t ld, uint32_t nx, uint32_t ny, size_t elemsize);
  157. uint32_t starpu_matrix_get_nx(starpu_data_handle_t handle);
  158. uint32_t starpu_matrix_get_ny(starpu_data_handle_t handle);
  159. uint32_t starpu_matrix_get_local_ld(starpu_data_handle_t handle);
  160. uintptr_t starpu_matrix_get_local_ptr(starpu_data_handle_t handle);
  161. size_t starpu_matrix_get_elemsize(starpu_data_handle_t handle);
  /*
   * Field accessors for the matrix interface. Each macro casts its argument
   * to (struct starpu_matrix_interface *) and expands to the named member,
   * so the result can be read or assigned. The argument is evaluated once.
   */
  #define STARPU_MATRIX_GET_PTR(interface)        (((struct starpu_matrix_interface *)(interface))->ptr)
  #define STARPU_MATRIX_GET_DEV_HANDLE(interface) (((struct starpu_matrix_interface *)(interface))->dev_handle)
  #define STARPU_MATRIX_GET_OFFSET(interface)     (((struct starpu_matrix_interface *)(interface))->offset)
  #define STARPU_MATRIX_GET_NX(interface)         (((struct starpu_matrix_interface *)(interface))->nx)
  #define STARPU_MATRIX_GET_NY(interface)         (((struct starpu_matrix_interface *)(interface))->ny)
  #define STARPU_MATRIX_GET_LD(interface)         (((struct starpu_matrix_interface *)(interface))->ld)
  #define STARPU_MATRIX_GET_ELEMSIZE(interface)   (((struct starpu_matrix_interface *)(interface))->elemsize)
  /*
   * BLOCK interface for 3D dense blocks.
   * TODO: rename to 3dmatrix?
   *
   * NOTE(review): notes on ptr, dev_handle and offset are inferred from the
   * member names -- confirm against the implementation.
   */
  struct starpu_block_interface
  {
      uintptr_t ptr;        /* presumably the address of the block data */
      uintptr_t dev_handle; /* presumably a device-side handle for the buffer */
      size_t offset;        /* presumably an offset relative to dev_handle */
      uint32_t nx;          /* size along x */
      uint32_t ny;          /* size along y */
      uint32_t nz;          /* size along z */
      uint32_t ldy;         /* number of elements between two lines */
      uint32_t ldz;         /* number of elements between two planes */
      size_t elemsize;      /* size of one element */
  };
  184. void starpu_block_data_register(starpu_data_handle_t *handle, uint32_t home_node, uintptr_t ptr, uint32_t ldy, uint32_t ldz, uint32_t nx, uint32_t ny, uint32_t nz, size_t elemsize);
  185. uint32_t starpu_block_get_nx(starpu_data_handle_t handle);
  186. uint32_t starpu_block_get_ny(starpu_data_handle_t handle);
  187. uint32_t starpu_block_get_nz(starpu_data_handle_t handle);
  188. uint32_t starpu_block_get_local_ldy(starpu_data_handle_t handle);
  189. uint32_t starpu_block_get_local_ldz(starpu_data_handle_t handle);
  190. uintptr_t starpu_block_get_local_ptr(starpu_data_handle_t handle);
  191. size_t starpu_block_get_elemsize(starpu_data_handle_t handle);
  /*
   * Field accessors for the block interface. Each macro casts its argument to
   * (struct starpu_block_interface *) and expands to the named member, so the
   * result can be read or assigned. The argument is evaluated once.
   */
  #define STARPU_BLOCK_GET_PTR(interface)        (((struct starpu_block_interface *)(interface))->ptr)
  #define STARPU_BLOCK_GET_DEV_HANDLE(interface) (((struct starpu_block_interface *)(interface))->dev_handle)
  #define STARPU_BLOCK_GET_OFFSET(interface)     (((struct starpu_block_interface *)(interface))->offset)
  #define STARPU_BLOCK_GET_NX(interface)         (((struct starpu_block_interface *)(interface))->nx)
  #define STARPU_BLOCK_GET_NY(interface)         (((struct starpu_block_interface *)(interface))->ny)
  #define STARPU_BLOCK_GET_NZ(interface)         (((struct starpu_block_interface *)(interface))->nz)
  #define STARPU_BLOCK_GET_LDY(interface)        (((struct starpu_block_interface *)(interface))->ldy)
  #define STARPU_BLOCK_GET_LDZ(interface)        (((struct starpu_block_interface *)(interface))->ldz)
  #define STARPU_BLOCK_GET_ELEMSIZE(interface)   (((struct starpu_block_interface *)(interface))->elemsize)
  /*
   * Vector interface for contiguous (non-strided) buffers.
   *
   * NOTE(review): notes on ptr, dev_handle and offset are inferred from the
   * member names -- confirm against the implementation.
   */
  struct starpu_vector_interface
  {
      uintptr_t ptr;        /* presumably the address of the buffer */
      uintptr_t dev_handle; /* presumably a device-side handle for the buffer */
      size_t offset;        /* presumably an offset relative to dev_handle */
      uint32_t nx;          /* number of elements */
      size_t elemsize;      /* size of one element */
  };
  211. void starpu_vector_data_register(starpu_data_handle_t *handle, uint32_t home_node, uintptr_t ptr, uint32_t nx, size_t elemsize);
  212. uint32_t starpu_vector_get_nx(starpu_data_handle_t handle);
  213. size_t starpu_vector_get_elemsize(starpu_data_handle_t handle);
  214. uintptr_t starpu_vector_get_local_ptr(starpu_data_handle_t handle);
  /*
   * Field accessors for the vector interface. Each macro casts its argument
   * to (struct starpu_vector_interface *) and expands to the named member, so
   * the result can be read or assigned. The argument is evaluated once.
   */
  #define STARPU_VECTOR_GET_PTR(interface)        (((struct starpu_vector_interface *)(interface))->ptr)
  #define STARPU_VECTOR_GET_DEV_HANDLE(interface) (((struct starpu_vector_interface *)(interface))->dev_handle)
  #define STARPU_VECTOR_GET_OFFSET(interface)     (((struct starpu_vector_interface *)(interface))->offset)
  #define STARPU_VECTOR_GET_NX(interface)         (((struct starpu_vector_interface *)(interface))->nx)
  #define STARPU_VECTOR_GET_ELEMSIZE(interface)   (((struct starpu_vector_interface *)(interface))->elemsize)
  /*
   * Variable interface for a single piece of data (not a vector, a matrix, a
   * list, ...).
   *
   * There is no dev_handle member: a variable cannot be filtered, so its
   * offset would always be zero.
   */
  struct starpu_variable_interface
  {
      uintptr_t ptr;   /* presumably the address of the variable -- confirm */
      size_t elemsize; /* size of the variable */
  };
  228. void starpu_variable_data_register(starpu_data_handle_t *handle, uint32_t home_node, uintptr_t ptr, size_t size);
  229. size_t starpu_variable_get_elemsize(starpu_data_handle_t handle);
  230. uintptr_t starpu_variable_get_local_ptr(starpu_data_handle_t handle);
  /*
   * Field accessors for the variable interface. Each macro casts its argument
   * to (struct starpu_variable_interface *) and expands to the named member,
   * so the result can be read or assigned. The argument is evaluated once.
   */
  #define STARPU_VARIABLE_GET_PTR(interface)      (((struct starpu_variable_interface *)(interface))->ptr)
  #define STARPU_VARIABLE_GET_ELEMSIZE(interface) (((struct starpu_variable_interface *)(interface))->elemsize)
  234. /* void interface. There is no data really associated to that interface, but it
  235. * may be used as a synchronization mechanism. It also permits to express an
  236. * abstract piece of data that is managed by the application internally: this
  237. * makes it possible to forbid the concurrent execution of different tasks
  238. * accessing the same "void" data in read-write concurrently. */
  239. void starpu_void_data_register(starpu_data_handle_t *handle);
  /* CSR interface for sparse matrices (compressed sparse row representation) */
  struct starpu_csr_interface
  {
      uint32_t nnz;        /* number of non-zero entries */
      uint32_t nrow;       /* number of rows */
      uintptr_t nzval;     /* non-zero values */
      uint32_t *colind;    /* position of non-zero entries on the row */
      uint32_t *rowptr;    /* index (in nzval) of the first entry of the row */

      /* k for k-based indexing (0 or 1 usually);
       * also useful when partitioning the matrix ... */
      uint32_t firstentry;

      size_t elemsize;     /* size of one value */
  };
  253. void starpu_csr_data_register(starpu_data_handle_t *handle, uint32_t home_node, uint32_t nnz, uint32_t nrow, uintptr_t nzval, uint32_t *colind, uint32_t *rowptr, uint32_t firstentry, size_t elemsize);
  254. uint32_t starpu_csr_get_nnz(starpu_data_handle_t handle);
  255. uint32_t starpu_csr_get_nrow(starpu_data_handle_t handle);
  256. uint32_t starpu_csr_get_firstentry(starpu_data_handle_t handle);
  257. uintptr_t starpu_csr_get_local_nzval(starpu_data_handle_t handle);
  258. uint32_t *starpu_csr_get_local_colind(starpu_data_handle_t handle);
  259. uint32_t *starpu_csr_get_local_rowptr(starpu_data_handle_t handle);
  260. size_t starpu_csr_get_elemsize(starpu_data_handle_t handle);
  /*
   * Field accessors for the CSR interface. Each macro casts its argument to
   * (struct starpu_csr_interface *) and expands to the named member, so the
   * result can be read or assigned. The argument is evaluated once.
   */
  #define STARPU_CSR_GET_NNZ(interface)        (((struct starpu_csr_interface *)(interface))->nnz)
  #define STARPU_CSR_GET_NROW(interface)       (((struct starpu_csr_interface *)(interface))->nrow)
  #define STARPU_CSR_GET_NZVAL(interface)      (((struct starpu_csr_interface *)(interface))->nzval)
  #define STARPU_CSR_GET_COLIND(interface)     (((struct starpu_csr_interface *)(interface))->colind)
  #define STARPU_CSR_GET_ROWPTR(interface)     (((struct starpu_csr_interface *)(interface))->rowptr)
  #define STARPU_CSR_GET_FIRSTENTRY(interface) (((struct starpu_csr_interface *)(interface))->firstentry)
  #define STARPU_CSR_GET_ELEMSIZE(interface)   (((struct starpu_csr_interface *)(interface))->elemsize)
  /* BCSR interface for sparse matrices (blocked compressed sparse row
   * representation) */
  struct starpu_bcsr_interface
  {
      uint32_t nnz;        /* number of non-zero BLOCKS */
      uint32_t nrow;       /* number of rows (in terms of BLOCKS) */
      uintptr_t nzval;     /* non-zero values */
      uint32_t *colind;    /* position of non-zero entries on the row */
      uint32_t *rowptr;    /* index (in nzval) of the first entry of the row */

      /* k for k-based indexing (0 or 1 usually);
       * also useful when partitioning the matrix ... */
      uint32_t firstentry;

      /* size of the blocks */
      uint32_t r;
      uint32_t c;

      size_t elemsize;     /* size of one value */
  };
  286. void starpu_bcsr_data_register(starpu_data_handle_t *handle, uint32_t home_node, uint32_t nnz, uint32_t nrow, uintptr_t nzval, uint32_t *colind, uint32_t *rowptr, uint32_t firstentry, uint32_t r, uint32_t c, size_t elemsize);
  /*
   * Field accessors for the BCSR interface. Each macro casts its argument to
   * (struct starpu_bcsr_interface *) and expands to the named member, so the
   * result can be read or assigned. The argument is evaluated once.
   *
   * NROW, FIRSTENTRY, R, C and ELEMSIZE are provided so that every member has
   * an accessor, as is the case for the CSR interface.
   */
  #define STARPU_BCSR_GET_NNZ(interface)        (((struct starpu_bcsr_interface *)(interface))->nnz)
  #define STARPU_BCSR_GET_NROW(interface)       (((struct starpu_bcsr_interface *)(interface))->nrow)
  #define STARPU_BCSR_GET_NZVAL(interface)      (((struct starpu_bcsr_interface *)(interface))->nzval)
  #define STARPU_BCSR_GET_COLIND(interface)     (((struct starpu_bcsr_interface *)(interface))->colind)
  #define STARPU_BCSR_GET_ROWPTR(interface)     (((struct starpu_bcsr_interface *)(interface))->rowptr)
  #define STARPU_BCSR_GET_FIRSTENTRY(interface) (((struct starpu_bcsr_interface *)(interface))->firstentry)
  #define STARPU_BCSR_GET_R(interface)          (((struct starpu_bcsr_interface *)(interface))->r)
  #define STARPU_BCSR_GET_C(interface)          (((struct starpu_bcsr_interface *)(interface))->c)
  #define STARPU_BCSR_GET_ELEMSIZE(interface)   (((struct starpu_bcsr_interface *)(interface))->elemsize)
  291. uint32_t starpu_bcsr_get_nnz(starpu_data_handle_t handle);
  292. uint32_t starpu_bcsr_get_nrow(starpu_data_handle_t handle);
  293. uint32_t starpu_bcsr_get_firstentry(starpu_data_handle_t handle);
  294. uintptr_t starpu_bcsr_get_local_nzval(starpu_data_handle_t handle);
  295. uint32_t *starpu_bcsr_get_local_colind(starpu_data_handle_t handle);
  296. uint32_t *starpu_bcsr_get_local_rowptr(starpu_data_handle_t handle);
  297. uint32_t starpu_bcsr_get_r(starpu_data_handle_t handle);
  298. uint32_t starpu_bcsr_get_c(starpu_data_handle_t handle);
  299. size_t starpu_bcsr_get_elemsize(starpu_data_handle_t handle);
  /*
   * Multiformat interface
   *
   * Per-format description attached to a multiformat handle: an element size
   * for each of cpu, opencl and cuda, plus codelets between the cpu format
   * and each device format.
   * NOTE(review): the codelets presumably perform the format conversion their
   * names suggest -- confirm against the implementation.
   */
  struct starpu_multiformat_data_interface_ops
  {
      size_t cpu_elemsize;

      size_t opencl_elemsize;
      struct starpu_codelet *cpu_to_opencl_cl;
      struct starpu_codelet *opencl_to_cpu_cl;

      size_t cuda_elemsize;
      struct starpu_codelet *cpu_to_cuda_cl;
      struct starpu_codelet *cuda_to_cpu_cl;
  };
  /*
   * Multiformat interface descriptor: one pointer per format (cpu, cuda,
   * opencl), an element count and the format operations.
   * NOTE(review): nx is presumably the number of objects passed to
   * starpu_multiformat_data_register() -- confirm.
   */
  struct starpu_multiformat_interface
  {
      void *cpu_ptr;
      void *cuda_ptr;
      void *opencl_ptr;
      uint32_t nx;
      struct starpu_multiformat_data_interface_ops *ops;
  };
  321. void starpu_multiformat_data_register(starpu_data_handle_t *handle, uint32_t home_node, void *ptr, uint32_t nobjects, struct starpu_multiformat_data_interface_ops *format_ops);
  /*
   * Field accessors for the multiformat interface. Each macro casts its
   * argument to (struct starpu_multiformat_interface *) and expands to the
   * named member, so the result can be read or assigned. The argument is
   * evaluated once.
   */
  #define STARPU_MULTIFORMAT_GET_CPU_PTR(interface)    (((struct starpu_multiformat_interface *)(interface))->cpu_ptr)
  #define STARPU_MULTIFORMAT_GET_CUDA_PTR(interface)   (((struct starpu_multiformat_interface *)(interface))->cuda_ptr)
  #define STARPU_MULTIFORMAT_GET_OPENCL_PTR(interface) (((struct starpu_multiformat_interface *)(interface))->opencl_ptr)
  #define STARPU_MULTIFORMAT_GET_NX(interface)         (((struct starpu_multiformat_interface *)(interface))->nx)
  326. enum starpu_data_interface_id starpu_handle_get_interface_id(starpu_data_handle_t handle);
  327. int starpu_handle_pack_data(starpu_data_handle_t handle, void **ptr);
  328. int starpu_handle_unpack_data(starpu_data_handle_t handle, void *ptr);
  329. size_t starpu_handle_get_size(starpu_data_handle_t handle);
  330. /* Lookup a ram pointer into a StarPU handle */
  331. extern starpu_data_handle_t starpu_data_lookup(const void *ptr);
  332. #ifdef __cplusplus
  333. }
  334. #endif
  335. #endif /* __STARPU_DATA_INTERFACES_H__ */