command.c 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2011,2012,2014,2017 CNRS
  4. * Copyright (C) 2010-2014,2016 Université de Bordeaux
  5. * Copyright (C) 2011,2012 Inria
  6. *
  7. * StarPU is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU Lesser General Public License as published by
  9. * the Free Software Foundation; either version 2.1 of the License, or (at
  10. * your option) any later version.
  11. *
  12. * StarPU is distributed in the hope that it will be useful, but
  13. * WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  15. *
  16. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  17. */
  18. #include "socl.h"
  19. #include <string.h>
  20. /* Forward extern declaration */
  21. extern void soclEnqueueNDRangeKernel_task(void *descr[], void *args);
  22. cl_event command_event_get_ex(cl_command cmd)
  23. {
  24. cl_event ev = cmd->event;
  25. gc_entity_retain(ev);
  26. return ev;
  27. }
  28. static void command_release_callback(void *a)
  29. {
  30. cl_command cmd = (cl_command)a;
  31. // Call command specific release callback
  32. if (cmd->release_callback != NULL)
  33. cmd->release_callback(cmd);
  34. // Generic command destructor
  35. cl_uint i;
  36. for (i=0; i<cmd->num_events; i++)
  37. {
  38. gc_entity_unstore(&cmd->events[i]);
  39. }
  40. cmd->num_events = 0;
  41. free(cmd->events);
  42. /* Remove from command queue */
  43. cl_command_queue cq = cmd->event->cq;
  44. if (cq != NULL)
  45. {
  46. /* Lock command queue */
  47. STARPU_PTHREAD_MUTEX_LOCK(&cq->mutex);
  48. /* Remove barrier if applicable */
  49. if (cq->barrier == cmd)
  50. cq->barrier = NULL;
  51. /* Remove from the list of out-of-order commands */
  52. cq->commands = command_list_remove(cq->commands, cmd);
  53. /* Unlock command queue */
  54. STARPU_PTHREAD_MUTEX_UNLOCK(&cq->mutex);
  55. }
  56. // Events may survive to commands that created them
  57. cmd->event->command = NULL;
  58. gc_entity_unstore(&cmd->event);
  59. }
  60. void command_init_ex(cl_command cmd, cl_command_type typ, void (*cb)(void*))
  61. {
  62. gc_entity_init(&cmd->_entity, command_release_callback, "command");
  63. cmd->release_callback = cb;
  64. cmd->typ = typ;
  65. cmd->num_events = 0;
  66. cmd->events = NULL;
  67. cmd->event = event_create(); // we do not use gc_entity_store here because if nobody requires the event, it should be destroyed with the command
  68. cmd->event->command = cmd;
  69. cmd->task = NULL;
  70. cmd->submitted = 0;
  71. }
  72. void command_submit_ex(cl_command cmd)
  73. {
  74. #define SUBMIT(typ,name) case typ: \
  75. name##_submit((name)cmd); \
  76. break;
  77. assert(cmd->submitted == 0);
  78. switch(cmd->typ)
  79. {
  80. SUBMIT(CL_COMMAND_NDRANGE_KERNEL, command_ndrange_kernel);
  81. SUBMIT(CL_COMMAND_TASK, command_ndrange_kernel);
  82. SUBMIT(CL_COMMAND_READ_BUFFER, command_read_buffer);
  83. SUBMIT(CL_COMMAND_WRITE_BUFFER, command_write_buffer);
  84. SUBMIT(CL_COMMAND_COPY_BUFFER, command_copy_buffer);
  85. SUBMIT(CL_COMMAND_MAP_BUFFER, command_map_buffer);
  86. SUBMIT(CL_COMMAND_UNMAP_MEM_OBJECT, command_unmap_mem_object);
  87. SUBMIT(CL_COMMAND_MARKER, command_marker);
  88. SUBMIT(CL_COMMAND_BARRIER, command_barrier);
  89. default:
  90. ERROR_STOP("Trying to submit unknown command (type %x)", cmd->typ);
  91. }
  92. cmd->submitted = 1;
  93. #undef SUBMIT
  94. }
  95. cl_int command_submit_deep_ex(cl_command cmd)
  96. {
  97. if (cmd->submitted == 1)
  98. return CL_SUCCESS;
  99. /* We set this in order to avoid cyclic dependencies */
  100. cmd->submitted = 1;
  101. unsigned int i;
  102. for (i=0; i<cmd->num_events; i++)
  103. command_submit_deep(cmd->events[i]->command);
  104. cmd->submitted = 0;
  105. command_submit_ex(cmd);
  106. return CL_SUCCESS;
  107. }
  108. void command_graph_dump_ex(cl_command cmd)
  109. {
  110. unsigned int i;
  111. for (i=0; i<cmd->num_events; i++)
  112. command_graph_dump_ex(cmd->events[i]->command);
  113. const char * typ_str = (cmd->typ == CL_COMMAND_NDRANGE_KERNEL ? "ndrange_kernel" :
  114. cmd->typ == CL_COMMAND_TASK ? "task" :
  115. cmd->typ == CL_COMMAND_READ_BUFFER ? "read_buffer" :
  116. cmd->typ == CL_COMMAND_WRITE_BUFFER ? "write_buffer" :
  117. cmd->typ == CL_COMMAND_COPY_BUFFER ? "copy_buffer" :
  118. cmd->typ == CL_COMMAND_MAP_BUFFER ? "map_buffer" :
  119. cmd->typ == CL_COMMAND_UNMAP_MEM_OBJECT ? "unmap_mem_object" :
  120. cmd->typ == CL_COMMAND_MARKER ? "marker" :
  121. cmd->typ == CL_COMMAND_BARRIER ? "barrier" : "unknown");
  122. printf("CMD %p TYPE %s DEPS", cmd, typ_str);
  123. for (i=0; i<cmd->num_events; i++)
  124. printf(" %p", cmd->events[i]->command);
  125. printf("\n");
  126. }
  127. #define nullOrDup(name,size) cmd->name = memdup_safe(name,size)
  128. #define nullOrFree(name) if (cmd->name != NULL) free((void*)cmd->name)
  129. #define dup(name) cmd->name = name
  130. void command_ndrange_kernel_release(void * arg)
  131. {
  132. command_ndrange_kernel cmd = (command_ndrange_kernel)arg;
  133. gc_entity_unstore(&cmd->kernel);
  134. nullOrFree(global_work_offset);
  135. nullOrFree(global_work_size);
  136. nullOrFree(local_work_size);
  137. free(cmd->arg_sizes);
  138. free(cmd->arg_types);
  139. unsigned int i;
  140. for (i=0; i<cmd->num_args; i++)
  141. {
  142. free(cmd->args[i]);
  143. cmd->args[i] = NULL;
  144. }
  145. free(cmd->args);
  146. for (i=0; i<cmd->num_buffers; i++)
  147. gc_entity_unstore(&cmd->buffers[i]);
  148. free(cmd->buffers);
  149. }
  150. command_ndrange_kernel command_ndrange_kernel_create(cl_kernel kernel,
  151. cl_uint work_dim,
  152. const size_t * global_work_offset,
  153. const size_t * global_work_size,
  154. const size_t * local_work_size)
  155. {
  156. command_ndrange_kernel cmd = calloc(1, sizeof(struct command_ndrange_kernel_t));
  157. command_init(cmd, CL_COMMAND_NDRANGE_KERNEL, command_ndrange_kernel_release);
  158. gc_entity_store(&cmd->kernel, kernel);
  159. dup(work_dim);
  160. nullOrDup(global_work_offset, work_dim*sizeof(size_t));
  161. nullOrDup(global_work_size, work_dim*sizeof(size_t));
  162. nullOrDup(local_work_size, work_dim*sizeof(size_t));
  163. starpu_codelet_init(&cmd->codelet);
  164. cmd->codelet.where = STARPU_OPENCL;
  165. cmd->codelet.energy_model = NULL;
  166. cmd->codelet.opencl_funcs[0] = &soclEnqueueNDRangeKernel_task;
  167. /* Kernel is mutable, so we duplicate its parameters... */
  168. cmd->num_args = kernel->num_args;
  169. cmd->arg_sizes = memdup(kernel->arg_size, sizeof(size_t) * kernel->num_args);
  170. cmd->arg_types = memdup(kernel->arg_type, sizeof(enum kernel_arg_type) * kernel->num_args);
  171. cmd->args = memdup_deep_varsize_safe(kernel->arg_value, kernel->num_args, kernel->arg_size);
  172. return cmd;
  173. }
  174. command_ndrange_kernel command_task_create (cl_kernel kernel)
  175. {
  176. static cl_uint task_work_dim = 3;
  177. static const size_t task_global_work_offset[3] = {0,0,0};
  178. static const size_t task_global_work_size[3] = {1,1,1};
  179. static const size_t * task_local_work_size = NULL;
  180. command_ndrange_kernel cmd = command_ndrange_kernel_create(kernel, task_work_dim, task_global_work_offset,
  181. task_global_work_size, task_local_work_size);
  182. /* This is the only difference with command_ndrange_kernel_create */
  183. cmd->_command.typ = CL_COMMAND_TASK;
  184. return cmd;
  185. }
  186. command_barrier command_barrier_create ()
  187. {
  188. command_barrier cmd = malloc(sizeof(struct command_barrier_t));
  189. command_init(cmd, CL_COMMAND_BARRIER, NULL);
  190. return cmd;
  191. }
  192. command_marker command_marker_create ()
  193. {
  194. command_marker cmd = malloc(sizeof(struct command_marker_t));
  195. command_init(cmd, CL_COMMAND_MARKER, NULL);
  196. return cmd;
  197. }
  198. void command_map_buffer_release(void * UNUSED(arg))
  199. {
  200. /* We DO NOT unstore (release) the buffer as unmap will do it
  201. gc_entity_unstore(&cmd->buffer); */
  202. }
  203. command_map_buffer command_map_buffer_create(cl_mem buffer,
  204. cl_map_flags map_flags,
  205. size_t offset,
  206. size_t cb
  207. )
  208. {
  209. command_map_buffer cmd = malloc(sizeof(struct command_map_buffer_t));
  210. command_init(cmd, CL_COMMAND_MAP_BUFFER, command_map_buffer_release);
  211. gc_entity_store(&cmd->buffer, buffer);
  212. dup(map_flags);
  213. dup(offset);
  214. dup(cb);
  215. return cmd;
  216. }
  217. void command_unmap_mem_object_release(void * arg)
  218. {
  219. command_unmap_mem_object cmd = (command_unmap_mem_object)arg;
  220. /* We release the buffer twice because map buffer command did not */
  221. gc_entity_release(cmd->buffer);
  222. gc_entity_unstore(&cmd->buffer);
  223. }
  224. command_unmap_mem_object command_unmap_mem_object_create(cl_mem buffer, void * ptr)
  225. {
  226. command_unmap_mem_object cmd = malloc(sizeof(struct command_unmap_mem_object_t));
  227. command_init(cmd, CL_COMMAND_UNMAP_MEM_OBJECT, command_unmap_mem_object_release);
  228. gc_entity_store(&cmd->buffer, buffer);
  229. dup(ptr);
  230. return cmd;
  231. }
  232. void command_read_buffer_release(void *arg)
  233. {
  234. command_read_buffer cmd = (command_read_buffer)arg;
  235. gc_entity_unstore(&cmd->buffer);
  236. }
  237. command_read_buffer command_read_buffer_create(cl_mem buffer, size_t offset, size_t cb, void * ptr)
  238. {
  239. command_read_buffer cmd = malloc(sizeof(struct command_read_buffer_t));
  240. command_init(cmd, CL_COMMAND_READ_BUFFER, command_read_buffer_release);
  241. gc_entity_store(&cmd->buffer, buffer);
  242. dup(offset);
  243. dup(cb);
  244. dup(ptr);
  245. return cmd;
  246. }
  247. void command_write_buffer_release(void *arg)
  248. {
  249. command_write_buffer cmd = (command_write_buffer)arg;
  250. gc_entity_unstore(&cmd->buffer);
  251. }
  252. command_write_buffer command_write_buffer_create(cl_mem buffer, size_t offset, size_t cb, const void * ptr)
  253. {
  254. command_write_buffer cmd = malloc(sizeof(struct command_write_buffer_t));
  255. command_init(cmd, CL_COMMAND_WRITE_BUFFER, command_write_buffer_release);
  256. gc_entity_store(&cmd->buffer, buffer);
  257. dup(offset);
  258. dup(cb);
  259. dup(ptr);
  260. return cmd;
  261. }
  262. void command_copy_buffer_release(void *arg)
  263. {
  264. command_copy_buffer cmd = (command_copy_buffer)arg;
  265. gc_entity_unstore(&cmd->src_buffer);
  266. gc_entity_unstore(&cmd->dst_buffer);
  267. }
  268. command_copy_buffer command_copy_buffer_create( cl_mem src_buffer, cl_mem dst_buffer,
  269. size_t src_offset, size_t dst_offset, size_t cb)
  270. {
  271. command_copy_buffer cmd = malloc(sizeof(struct command_copy_buffer_t));
  272. command_init(cmd, CL_COMMAND_COPY_BUFFER, command_copy_buffer_release);
  273. gc_entity_store(&cmd->src_buffer, src_buffer);
  274. gc_entity_store(&cmd->dst_buffer, dst_buffer);
  275. dup(src_offset);
  276. dup(dst_offset);
  277. dup(cb);
  278. return cmd;
  279. }
  280. #undef nullOrDup
  281. #undef nodeNullOrDup
  282. #undef dup
  283. #undef nodeDup
  284. #undef memdup