starpu_data_interfaces.h 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332
  /* StarPU --- Runtime system for heterogeneous multicore architectures.
   *
   * Copyright (C) 2010-2011 Université de Bordeaux 1
   * Copyright (C) 2010, 2011 Centre National de la Recherche Scientifique
   * Copyright (C) 2011 Institut National de Recherche en Informatique et Automatique
   *
   * StarPU is free software; you can redistribute it and/or modify
   * it under the terms of the GNU Lesser General Public License as published by
   * the Free Software Foundation; either version 2.1 of the License, or (at
   * your option) any later version.
   *
   * StarPU is distributed in the hope that it will be useful, but
   * WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
   *
   * See the GNU Lesser General Public License in COPYING.LGPL for more details.
   */
  18. #ifndef __STARPU_DATA_INTERFACES_H__
  19. #define __STARPU_DATA_INTERFACES_H__
  20. #include <starpu.h>
  21. #include <starpu_data.h>
  22. #include <starpu_util.h>
  23. #ifdef STARPU_USE_GORDON
  24. /* to get the gordon_strideSize_t data structure from gordon */
  25. #include <gordon.h>
  26. #endif
  27. #ifdef STARPU_USE_CUDA
  28. /* to use CUDA streams */
  29. #include <cuda_runtime.h>
  30. #endif
  31. #ifdef __cplusplus
  32. extern "C" {
  33. #endif
  /* The following structures are used to describe data interfaces. */

  /* Table of the methods used to transfer data between the different types of
   * memory nodes.  There is one synchronous entry per (source type,
   * destination type) pair, the types being ram, cuda, opencl and spu.  Every
   * method receives the source interface and node, then the destination
   * interface and node.
   *
   * NOTE: the asynchronous entries are only declared when STARPU_USE_CUDA
   * (resp. STARPU_USE_OPENCL) is defined, so the layout of this structure
   * depends on the build configuration. */
  struct starpu_data_copy_methods {
      /* src type is ram */
      int (*ram_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*ram_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*ram_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*ram_to_spu)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

      /* src type is cuda */
      int (*cuda_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*cuda_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*cuda_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*cuda_to_spu)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

      /* src type is spu */
      int (*spu_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*spu_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*spu_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*spu_to_spu)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

      /* src type is opencl */
      int (*opencl_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*opencl_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*opencl_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);
      int (*opencl_to_spu)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

  #ifdef STARPU_USE_CUDA
      /* for asynchronous CUDA transfers */
      int (*ram_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);
      int (*cuda_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);
      int (*cuda_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cudaStream_t stream);
  #endif

  #ifdef STARPU_USE_OPENCL
      /* for asynchronous OpenCL transfers */
      /* XXX we do not use a cl_event *event type for the last argument
       * because nvcc does not like when we have to include OpenCL headers */
      int (*ram_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, /* cl_event * */ void *event);
      int (*opencl_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, /* cl_event * */ void *event);
      int (*opencl_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, /* cl_event * */ void *event);
  #endif
  };
  73. struct starpu_data_interface_ops_t {
  74. /* Register an existing interface into a data handle. */
  75. void (*register_data_handle)(starpu_data_handle handle,
  76. uint32_t home_node, void *data_interface);
  77. /* Allocate data for the interface on a given node. */
  78. starpu_ssize_t (*allocate_data_on_node)(void *data_interface, uint32_t node);
  79. /* Free data of the interface on a given node. */
  80. void (*free_data_on_node)(void *data_interface, uint32_t node);
  81. /* ram/cuda/spu/opencl synchronous and asynchronous transfer methods */
  82. const struct starpu_data_copy_methods *copy_methods;
  83. /* Return the current pointer (if any) for the handle on the given node. */
  84. void * (*handle_to_pointer)(starpu_data_handle handle, uint32_t node);
  85. /* Return an estimation of the size of data, for performance models */
  86. size_t (*get_size)(starpu_data_handle handle);
  87. /* Return a 32bit footprint which characterizes the data size */
  88. uint32_t (*footprint)(starpu_data_handle handle);
  89. /* Compare the data size of two interfaces */
  90. int (*compare)(void *data_interface_a, void *data_interface_b);
  91. /* Dump the sizes of a handle to a file */
  92. void (*display)(starpu_data_handle handle, FILE *f);
  93. #ifdef STARPU_USE_GORDON
  94. /* Convert the data size to the spu size format */
  95. int (*convert_to_gordon)(void *data_interface, uint64_t *ptr, gordon_strideSize_t *ss);
  96. #endif
  97. /* an identifier that is unique to each interface */
  98. unsigned interfaceid;
  99. /* The size of the interface data descriptor */
  100. size_t interface_size;
  101. };
  102. void starpu_data_register(starpu_data_handle *handleptr, uint32_t home_node,
  103. void *data_interface,
  104. struct starpu_data_interface_ops_t *ops);
  105. /* Return the pointer associated with HANDLE on node NODE or NULL if HANDLE's
  106. * interface does not support this operation or data for this handle is not
  107. * allocated on that node. */
  108. void *starpu_handle_to_pointer(starpu_data_handle handle, uint32_t node);
  109. /* Return the local pointer associated with HANDLE or NULL if HANDLE's
  110. * interface does not have data allocated locally */
  111. void *starpu_handle_get_local_ptr(starpu_data_handle handle);
  /* Operations table of the matrix interface; only declared here, the
   * definition lives in another translation unit.
   * NOTE(review): the leading underscore suggests an internal symbol --
   * confirm whether applications are expected to use it directly. */
  extern struct starpu_data_interface_ops_t _starpu_interface_matrix_ops;
  113. /* "node" means memory node: 0 for main RAM, then 1, 2, etc. for various GPUs,
  114. * etc.
  115. *
  116. * On registration, the source of data is usually a pointer in RAM, in which
  117. * case 0 should be passed.
  118. */
  119. void *starpu_data_get_interface_on_node(starpu_data_handle handle, unsigned memory_node);
  /* Matrix interface for dense matrices */
  typedef struct starpu_matrix_interface_s {
      uintptr_t ptr;        /* address of the matrix data, stored as an integer */
      uintptr_t dev_handle; /* NOTE(review): presumably a device-side handle for
                             * devices that cannot use raw pointers -- confirm */
      size_t offset;        /* NOTE(review): presumably an offset relative to
                             * dev_handle -- confirm */
      uint32_t nx;          /* matrix dimension along x */
      uint32_t ny;          /* matrix dimension along y */
      uint32_t ld;          /* leading dimension; presumably the number of
                             * elements between two lines, like ldy in the
                             * block interface -- confirm */
      size_t elemsize;      /* size of one element */
  } starpu_matrix_interface_t;
  130. void starpu_matrix_data_register(starpu_data_handle *handle, uint32_t home_node,
  131. uintptr_t ptr, uint32_t ld, uint32_t nx,
  132. uint32_t ny, size_t elemsize);
  133. uint32_t starpu_matrix_get_nx(starpu_data_handle handle);
  134. uint32_t starpu_matrix_get_ny(starpu_data_handle handle);
  135. uint32_t starpu_matrix_get_local_ld(starpu_data_handle handle);
  136. uintptr_t starpu_matrix_get_local_ptr(starpu_data_handle handle);
  137. size_t starpu_matrix_get_elemsize(starpu_data_handle handle);
  138. /* helper methods */
  139. #define STARPU_MATRIX_GET_PTR(interface) (((starpu_matrix_interface_t *)(interface))->ptr)
  140. #define STARPU_MATRIX_GET_NX(interface) (((starpu_matrix_interface_t *)(interface))->nx)
  141. #define STARPU_MATRIX_GET_NY(interface) (((starpu_matrix_interface_t *)(interface))->ny)
  142. #define STARPU_MATRIX_GET_LD(interface) (((starpu_matrix_interface_t *)(interface))->ld)
  143. #define STARPU_MATRIX_GET_ELEMSIZE(interface) (((starpu_matrix_interface_t *)(interface))->elemsize)
  /* BLOCK interface for 3D dense blocks */
  /* TODO: rename to 3dmatrix? */
  typedef struct starpu_block_interface_s {
      uintptr_t ptr;        /* address of the block data, stored as an integer */
      uintptr_t dev_handle; /* NOTE(review): presumably a device-side handle for
                             * devices that cannot use raw pointers -- confirm */
      size_t offset;        /* NOTE(review): presumably an offset relative to
                             * dev_handle -- confirm */
      uint32_t nx;          /* block dimension along x */
      uint32_t ny;          /* block dimension along y */
      uint32_t nz;          /* block dimension along z */
      uint32_t ldy;         /* number of elements between two lines */
      uint32_t ldz;         /* number of elements between two planes */
      size_t elemsize;      /* size of one element */
  } starpu_block_interface_t;
  157. void starpu_block_data_register(starpu_data_handle *handle, uint32_t home_node,
  158. uintptr_t ptr, uint32_t ldy, uint32_t ldz, uint32_t nx,
  159. uint32_t ny, uint32_t nz, size_t elemsize);
  160. uint32_t starpu_block_get_nx(starpu_data_handle handle);
  161. uint32_t starpu_block_get_ny(starpu_data_handle handle);
  162. uint32_t starpu_block_get_nz(starpu_data_handle handle);
  163. uint32_t starpu_block_get_local_ldy(starpu_data_handle handle);
  164. uint32_t starpu_block_get_local_ldz(starpu_data_handle handle);
  165. uintptr_t starpu_block_get_local_ptr(starpu_data_handle handle);
  166. size_t starpu_block_get_elemsize(starpu_data_handle handle);
  167. /* helper methods */
  168. #define STARPU_BLOCK_GET_PTR(interface) (((starpu_block_interface_t *)(interface))->ptr)
  169. #define STARPU_BLOCK_GET_NX(interface) (((starpu_block_interface_t *)(interface))->nx)
  170. #define STARPU_BLOCK_GET_NY(interface) (((starpu_block_interface_t *)(interface))->ny)
  171. #define STARPU_BLOCK_GET_NZ(interface) (((starpu_block_interface_t *)(interface))->nz)
  172. #define STARPU_BLOCK_GET_LDY(interface) (((starpu_block_interface_t *)(interface))->ldy)
  173. #define STARPU_BLOCK_GET_LDZ(interface) (((starpu_block_interface_t *)(interface))->ldz)
  174. #define STARPU_BLOCK_GET_ELEMSIZE(interface) (((starpu_block_interface_t *)(interface))->elemsize)
  /* vector interface for contiguous (non-strided) buffers */
  typedef struct starpu_vector_interface_s {
      uintptr_t ptr;        /* address of the buffer, stored as an integer */
      uintptr_t dev_handle; /* NOTE(review): presumably a device-side handle for
                             * devices that cannot use raw pointers -- confirm */
      size_t offset;        /* NOTE(review): presumably an offset relative to
                             * dev_handle -- confirm */
      uint32_t nx;          /* number of elements */
      size_t elemsize;      /* size of one element */
  } starpu_vector_interface_t;
  183. void starpu_vector_data_register(starpu_data_handle *handle, uint32_t home_node,
  184. uintptr_t ptr, uint32_t nx, size_t elemsize);
  185. uint32_t starpu_vector_get_nx(starpu_data_handle handle);
  186. size_t starpu_vector_get_elemsize(starpu_data_handle handle);
  187. uintptr_t starpu_vector_get_local_ptr(starpu_data_handle handle);
  188. /* helper methods */
  189. #define STARPU_VECTOR_GET_PTR(interface) (((starpu_vector_interface_t *)(interface))->ptr)
  190. #define STARPU_VECTOR_GET_NX(interface) (((starpu_vector_interface_t *)(interface))->nx)
  191. #define STARPU_VECTOR_GET_ELEMSIZE(interface) (((starpu_vector_interface_t *)(interface))->elemsize)
  /* variable interface for a single data (not a vector, a matrix, a list, ...) */
  typedef struct starpu_variable_interface_s {
      uintptr_t ptr;   /* address of the variable, stored as an integer */
      size_t elemsize; /* size of the variable */
  } starpu_variable_interface_t;
  197. void starpu_variable_data_register(starpu_data_handle *handle, uint32_t home_node,
  198. uintptr_t ptr, size_t elemsize);
  199. size_t starpu_variable_get_elemsize(starpu_data_handle handle);
  200. uintptr_t starpu_variable_get_local_ptr(starpu_data_handle handle);
  201. /* helper methods */
  202. #define STARPU_VARIABLE_GET_PTR(interface) (((starpu_variable_interface_t *)(interface))->ptr)
  203. #define STARPU_VARIABLE_GET_ELEMSIZE(interface) (((starpu_variable_interface_t *)(interface))->elemsize)
  204. /* void interface. There is no data really associated to that interface, but it
  205. * may be used as a synchronization mechanism. It also permits to express an
  206. * abstract piece of data that is managed by the application internally: this
  207. * makes it possible to forbid the concurrent execution of different tasks
  208. * accessing the same "void" data in read-write concurrently. */
  209. void starpu_void_data_register(starpu_data_handle *handleptr);
  /* CSR interface for sparse matrices (compressed sparse row representation) */
  typedef struct starpu_csr_interface_s {
      uint32_t nnz;     /* number of non-zero entries */
      uint32_t nrow;    /* number of rows */
      uintptr_t nzval;  /* non-zero values */
      uint32_t *colind; /* position of non-zero entries on the row */
      uint32_t *rowptr; /* index (in nzval) of the first entry of the row */

      /* k for k-based indexing (0 or 1 usually) */
      /* also useful when partitioning the matrix ... */
      uint32_t firstentry;

      size_t elemsize;  /* size of one element of nzval */
  } starpu_csr_interface_t;
  222. void starpu_csr_data_register(starpu_data_handle *handle, uint32_t home_node, uint32_t nnz, uint32_t nrow,
  223. uintptr_t nzval, uint32_t *colind, uint32_t *rowptr, uint32_t firstentry, size_t elemsize);
  224. uint32_t starpu_csr_get_nnz(starpu_data_handle handle);
  225. uint32_t starpu_csr_get_nrow(starpu_data_handle handle);
  226. uint32_t starpu_csr_get_firstentry(starpu_data_handle handle);
  227. uintptr_t starpu_csr_get_local_nzval(starpu_data_handle handle);
  228. uint32_t *starpu_csr_get_local_colind(starpu_data_handle handle);
  229. uint32_t *starpu_csr_get_local_rowptr(starpu_data_handle handle);
  230. size_t starpu_csr_get_elemsize(starpu_data_handle handle);
  231. #define STARPU_CSR_GET_NNZ(interface) (((starpu_csr_interface_t *)(interface))->nnz)
  232. #define STARPU_CSR_GET_NROW(interface) (((starpu_csr_interface_t *)(interface))->nrow)
  233. #define STARPU_CSR_GET_NZVAL(interface) (((starpu_csr_interface_t *)(interface))->nzval)
  234. #define STARPU_CSR_GET_COLIND(interface) (((starpu_csr_interface_t *)(interface))->colind)
  235. #define STARPU_CSR_GET_ROWPTR(interface) (((starpu_csr_interface_t *)(interface))->rowptr)
  236. #define STARPU_CSR_GET_FIRSTENTRY(interface) (((starpu_csr_interface_t *)(interface))->firstentry)
  237. #define STARPU_CSR_GET_ELEMSIZE(interface) (((starpu_csr_interface_t *)(interface))->elemsize)
  /* BCSR interface for sparse matrices (blocked compressed sparse row
   * representation) */
  typedef struct starpu_bcsr_interface_s {
      uint32_t nnz;     /* number of non-zero BLOCKS */
      uint32_t nrow;    /* number of rows (in terms of BLOCKS) */
      uintptr_t nzval;  /* non-zero values */
      uint32_t *colind; /* position of non-zero entries on the row */
      /* uint32_t *rowind; */ /* position of non-zero entries on the col */
      uint32_t *rowptr; /* index (in nzval) of the first entry of the row */

      /* k for k-based indexing (0 or 1 usually) */
      /* also useful when partitioning the matrix ... */
      uint32_t firstentry;

      /* size of the blocks */
      uint32_t r;
      uint32_t c;

      size_t elemsize;  /* size of one element of nzval */
  } starpu_bcsr_interface_t;
  255. void starpu_bcsr_data_register(starpu_data_handle *handle, uint32_t home_node, uint32_t nnz, uint32_t nrow,
  256. uintptr_t nzval, uint32_t *colind, uint32_t *rowptr, uint32_t firstentry, uint32_t r, uint32_t c, size_t elemsize);
  257. uint32_t starpu_bcsr_get_nnz(starpu_data_handle);
  258. uint32_t starpu_bcsr_get_nrow(starpu_data_handle);
  259. uint32_t starpu_bcsr_get_firstentry(starpu_data_handle);
  260. uintptr_t starpu_bcsr_get_local_nzval(starpu_data_handle);
  261. uint32_t *starpu_bcsr_get_local_colind(starpu_data_handle);
  262. uint32_t *starpu_bcsr_get_local_rowptr(starpu_data_handle);
  263. uint32_t starpu_bcsr_get_r(starpu_data_handle);
  264. uint32_t starpu_bcsr_get_c(starpu_data_handle);
  265. size_t starpu_bcsr_get_elemsize(starpu_data_handle);
  /* Identifiers of the data interfaces declared in this header.
   * NOTE(review): presumably the values found in the interfaceid field of
   * struct starpu_data_interface_ops_t -- confirm.
   * Kept as preprocessor constants so that they remain usable in #if tests. */
  #define STARPU_MATRIX_INTERFACE_ID 0
  #define STARPU_BLOCK_INTERFACE_ID 1
  #define STARPU_VECTOR_INTERFACE_ID 2
  #define STARPU_CSR_INTERFACE_ID 3
  #define STARPU_BCSR_INTERFACE_ID 4
  #define STARPU_VARIABLE_INTERFACE_ID 5
  #define STARPU_VOID_INTERFACE_ID 6
  #define STARPU_NINTERFACES_ID 7 /* number of data interfaces */
  274. unsigned starpu_get_handle_interface_id(starpu_data_handle);
  275. /* Lookup a ram pointer into a StarPU handle */
  276. extern starpu_data_handle starpu_data_lookup(const void *ptr);
  277. #ifdef __cplusplus
  278. }
  279. #endif
  280. #endif /* __STARPU_DATA_INTERFACES_H__ */