command.c 8.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2010,2011 University of Bordeaux
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include "socl.h"
  17. #include <string.h>
  18. /* Forward extern declaration */
  19. extern void soclEnqueueNDRangeKernel_task(void *descr[], void *args);
  20. void command_init_ex(cl_command cmd, cl_command_type typ, void (*cb)(void*)) {
  21. gc_entity_init(&cmd->_entity, cb);
  22. cmd->typ = typ;
  23. cmd->num_events = 0;
  24. cmd->events = NULL;
  25. cmd->event = event_create();
  26. cmd->event->command = cmd;
  27. cmd->cq = NULL;
  28. cmd->task = NULL;
  29. cmd->submitted = 0;
  30. }
  31. void command_submit_ex(cl_command cmd) {
  32. #define SUBMIT(typ,name) case typ:\
  33. name##_submit((name)cmd);\
  34. break;
  35. assert(cmd->submitted == 0);
  36. switch(cmd->typ) {
  37. SUBMIT(CL_COMMAND_NDRANGE_KERNEL, command_ndrange_kernel)
  38. SUBMIT(CL_COMMAND_TASK, command_ndrange_kernel)
  39. SUBMIT(CL_COMMAND_READ_BUFFER, command_read_buffer)
  40. SUBMIT(CL_COMMAND_WRITE_BUFFER, command_write_buffer)
  41. SUBMIT(CL_COMMAND_COPY_BUFFER, command_copy_buffer)
  42. SUBMIT(CL_COMMAND_MAP_BUFFER, command_map_buffer)
  43. SUBMIT(CL_COMMAND_UNMAP_MEM_OBJECT, command_unmap_mem_object)
  44. SUBMIT(CL_COMMAND_MARKER, command_marker)
  45. SUBMIT(CL_COMMAND_BARRIER, command_barrier)
  46. default:
  47. ERROR_STOP("Trying to submit unknown command (type %x)", cmd->typ);
  48. }
  49. cmd->submitted = 1;
  50. #undef SUBMIT
  51. }
  52. cl_int command_submit_deep_ex(cl_command cmd) {
  53. if (cmd->submitted == 1)
  54. return CL_SUCCESS;
  55. /* We set this in order to avoid cyclic dependencies */
  56. cmd->submitted = 1;
  57. unsigned int i;
  58. for (i=0; i<cmd->num_events; i++)
  59. command_submit_deep(cmd->events[i]->command);
  60. cmd->submitted = 0;
  61. command_submit_ex(cmd);
  62. return CL_SUCCESS;
  63. }
  64. void command_graph_dump_ex(cl_command cmd) {
  65. unsigned int i;
  66. for (i=0; i<cmd->num_events; i++)
  67. command_graph_dump_ex(cmd->events[i]->command);
  68. const char * typ_str = (cmd->typ == CL_COMMAND_NDRANGE_KERNEL ? "ndrange_kernel" :
  69. cmd->typ == CL_COMMAND_TASK ? "task" :
  70. cmd->typ == CL_COMMAND_READ_BUFFER ? "read_buffer" :
  71. cmd->typ == CL_COMMAND_WRITE_BUFFER ? "write_buffer" :
  72. cmd->typ == CL_COMMAND_COPY_BUFFER ? "copy_buffer" :
  73. cmd->typ == CL_COMMAND_MAP_BUFFER ? "map_buffer" :
  74. cmd->typ == CL_COMMAND_UNMAP_MEM_OBJECT ? "unmap_mem_object" :
  75. cmd->typ == CL_COMMAND_MARKER ? "marker" :
  76. cmd->typ == CL_COMMAND_BARRIER ? "barrier" : "unknown");
  77. printf("CMD %p TYPE %s DEPS", cmd, typ_str);
  78. for (i=0; i<cmd->num_events; i++)
  79. printf(" %p", cmd->events[i]->command);
  80. printf("\n");
  81. }
  /*
   * Field helpers for the create/release functions below. Each one expects a
   * local variable named `cmd` that has a field with the same name as the
   * macro argument.
   *
   *   nullOrDup(name,size)  cmd->name = memdup_safe(name, size)
   *   nullOrFree(name)      free(cmd->name); free(NULL) is a no-op, so no
   *                         NULL test is needed
   *   dup(name)             cmd->name = name
   *
   * Every helper expands to a single expression, so it can be used as the
   * body of an unbraced if/else without capturing a following `else`.
   */
  #define nullOrDup(name,size) (cmd->name = memdup_safe(name,(size)))
  #define nullOrFree(name) free((void*)cmd->name)
  #define dup(name) (cmd->name = name)
  85. void command_ndrange_kernel_release(void * arg) {
  86. command_ndrange_kernel cmd = (command_ndrange_kernel)arg;
  87. gc_entity_unstore(&cmd->kernel);
  88. nullOrFree(global_work_offset);
  89. nullOrFree(global_work_size);
  90. nullOrFree(local_work_size);
  91. free(cmd->arg_sizes);
  92. free(cmd->arg_types);
  93. unsigned int i;
  94. for (i=0; i<cmd->num_args; i++)
  95. free(cmd->args[i]);
  96. free(cmd->args);
  97. }
  98. command_ndrange_kernel command_ndrange_kernel_create (
  99. cl_kernel kernel,
  100. cl_uint work_dim,
  101. const size_t * global_work_offset,
  102. const size_t * global_work_size,
  103. const size_t * local_work_size)
  104. {
  105. command_ndrange_kernel cmd = calloc(1, sizeof(struct command_ndrange_kernel_t));
  106. command_init(cmd, CL_COMMAND_NDRANGE_KERNEL, command_ndrange_kernel_release);
  107. gc_entity_store(&cmd->kernel, kernel);
  108. dup(work_dim);
  109. nullOrDup(global_work_offset, work_dim*sizeof(size_t));
  110. nullOrDup(global_work_size, work_dim*sizeof(size_t));
  111. nullOrDup(local_work_size, work_dim*sizeof(size_t));
  112. starpu_codelet_init(&cmd->codelet);
  113. cmd->codelet.where = STARPU_OPENCL;
  114. cmd->codelet.power_model = NULL;
  115. cmd->codelet.opencl_funcs[0] = &soclEnqueueNDRangeKernel_task;
  116. cmd->codelet.opencl_funcs[1] = NULL;
  117. /* Kernel is mutable, so we duplicate its parameters... */
  118. cmd->num_args = kernel->num_args;
  119. cmd->arg_sizes = memdup(kernel->arg_size, sizeof(size_t) * kernel->num_args);
  120. cmd->arg_types = memdup(kernel->arg_type, sizeof(enum kernel_arg_type) * kernel->num_args);
  121. cmd->args = memdup_deep_varsize_safe(kernel->arg_value, kernel->num_args, kernel->arg_size);
  122. return cmd;
  123. }
  124. command_ndrange_kernel command_task_create (cl_kernel kernel) {
  125. static cl_uint task_work_dim = 3;
  126. static const size_t task_global_work_offset[3] = {0,0,0};
  127. static const size_t task_global_work_size[3] = {1,1,1};
  128. static const size_t * task_local_work_size = NULL;
  129. command_ndrange_kernel cmd = command_ndrange_kernel_create(
  130. kernel, task_work_dim, task_global_work_offset,
  131. task_global_work_size, task_local_work_size);
  132. /* This is the only difference with command_ndrange_kernel_create */
  133. cmd->_command.typ = CL_COMMAND_TASK;
  134. return cmd;
  135. }
  136. command_barrier command_barrier_create () {
  137. command_barrier cmd = malloc(sizeof(struct command_barrier_t));
  138. command_init(cmd, CL_COMMAND_BARRIER, NULL);
  139. return cmd;
  140. }
  141. command_marker command_marker_create () {
  142. command_marker cmd = malloc(sizeof(struct command_marker_t));
  143. command_init(cmd, CL_COMMAND_MARKER, NULL);
  144. return cmd;
  145. }
  146. void command_map_buffer_release(void * arg) {
  147. command_map_buffer cmd = (command_map_buffer)arg;
  148. /* We DO NOT unstore (release) the buffer as unmap will do it
  149. gc_entity_unstore(&cmd->buffer); */
  150. gc_entity_unstore(&cmd->event);
  151. }
  152. command_map_buffer command_map_buffer_create(
  153. cl_mem buffer,
  154. cl_map_flags map_flags,
  155. size_t offset,
  156. size_t cb,
  157. cl_event event
  158. ) {
  159. command_map_buffer cmd = malloc(sizeof(struct command_map_buffer_t));
  160. command_init(cmd, CL_COMMAND_MAP_BUFFER, command_map_buffer_release);
  161. gc_entity_store(&cmd->buffer, buffer);
  162. dup(map_flags);
  163. dup(offset);
  164. dup(cb);
  165. gc_entity_store(&cmd->event, event);
  166. return cmd;
  167. }
  168. void command_unmap_mem_object_release(void * arg) {
  169. command_unmap_mem_object cmd = (command_unmap_mem_object)arg;
  170. /* We release the buffer twice because map buffer command did not */
  171. gc_entity_release(cmd->buffer);
  172. gc_entity_unstore(&cmd->buffer);
  173. }
  174. command_unmap_mem_object command_unmap_mem_object_create(cl_mem buffer, void * ptr) {
  175. command_unmap_mem_object cmd = malloc(sizeof(struct command_unmap_mem_object_t));
  176. command_init(cmd, CL_COMMAND_UNMAP_MEM_OBJECT, command_unmap_mem_object_release);
  177. gc_entity_store(&cmd->buffer, buffer);
  178. dup(ptr);
  179. return cmd;
  180. }
  181. void command_read_buffer_release(void *arg) {
  182. command_read_buffer cmd = (command_read_buffer)arg;
  183. gc_entity_unstore(&cmd->buffer);
  184. }
  185. command_read_buffer command_read_buffer_create(cl_mem buffer, size_t offset, size_t cb, void * ptr) {
  186. command_read_buffer cmd = malloc(sizeof(struct command_read_buffer_t));
  187. command_init(cmd, CL_COMMAND_READ_BUFFER, command_read_buffer_release);
  188. gc_entity_store(&cmd->buffer, buffer);
  189. dup(offset);
  190. dup(cb);
  191. dup(ptr);
  192. return cmd;
  193. }
  194. void command_write_buffer_release(void *arg) {
  195. command_write_buffer cmd = (command_write_buffer)arg;
  196. gc_entity_unstore(&cmd->buffer);
  197. }
  198. command_write_buffer command_write_buffer_create(cl_mem buffer, size_t offset, size_t cb, const void * ptr) {
  199. command_write_buffer cmd = malloc(sizeof(struct command_write_buffer_t));
  200. command_init(cmd, CL_COMMAND_WRITE_BUFFER, command_write_buffer_release);
  201. gc_entity_store(&cmd->buffer, buffer);
  202. dup(offset);
  203. dup(cb);
  204. dup(ptr);
  205. return cmd;
  206. }
  207. void command_copy_buffer_release(void *arg) {
  208. command_copy_buffer cmd = (command_copy_buffer)arg;
  209. gc_entity_unstore(&cmd->src_buffer);
  210. gc_entity_unstore(&cmd->dst_buffer);
  211. }
  212. command_copy_buffer command_copy_buffer_create( cl_mem src_buffer, cl_mem dst_buffer,
  213. size_t src_offset, size_t dst_offset, size_t cb)
  214. {
  215. command_copy_buffer cmd = malloc(sizeof(struct command_copy_buffer_t));
  216. command_init(cmd, CL_COMMAND_COPY_BUFFER, command_copy_buffer_release);
  217. gc_entity_store(&cmd->src_buffer, src_buffer);
  218. gc_entity_store(&cmd->dst_buffer, dst_buffer);
  219. dup(src_offset);
  220. dup(dst_offset);
  221. dup(cb);
  222. return cmd;
  223. }
  /*
   * Drop the helper macros now that the create/release functions are done.
   * nullOrFree is defined next to nullOrDup and dup, so it is removed too.
   *
   * nodeNullOrDup and nodeDup are not defined anywhere in this file, and
   * memdup is used above without being defined here (presumably it comes from
   * socl.h -- confirm). Undefining a name that is not a macro has no effect,
   * so those three lines are kept as they were.
   */
  #undef nullOrDup
  #undef nullOrFree
  #undef nodeNullOrDup
  #undef dup
  #undef nodeDup
  #undef memdup