starpu_data_cpy.c 5.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2011,2012 Inria
  4. * Copyright (C) 2010-2018 Université de Bordeaux
  5. * Copyright (C) 2011-2013,2016,2017,2019 CNRS
  6. * Copyright (C) 2013 Thibaut Lambert
  7. *
  8. * StarPU is free software; you can redistribute it and/or modify
  9. * it under the terms of the GNU Lesser General Public License as published by
  10. * the Free Software Foundation; either version 2.1 of the License, or (at
  11. * your option) any later version.
  12. *
  13. * StarPU is distributed in the hope that it will be useful, but
  14. * WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  16. *
  17. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  18. */
  19. #include <starpu.h>
  20. #include <common/config.h>
  21. #include <core/task.h>
  22. #include <core/workers.h>
  23. #include <datawizard/datawizard.h>
  24. #include <util/starpu_data_cpy.h>
  25. #include <starpu_mic.h>
  26. static void common_data_cpy_func(void *descr[], void *cl_arg)
  27. {
  28. unsigned interface_id = *(unsigned *)cl_arg;
  29. const struct starpu_data_interface_ops *interface_ops = _starpu_data_interface_get_ops(interface_id);
  30. const struct starpu_data_copy_methods *copy_methods = interface_ops->copy_methods;
  31. int workerid = starpu_worker_get_id_check();
  32. enum starpu_worker_archtype type = starpu_worker_get_type(workerid);
  33. unsigned memory_node = starpu_worker_get_memory_node(workerid);
  34. void *dst_interface = descr[0];
  35. void *src_interface = descr[1];
  36. switch (type)
  37. {
  38. case STARPU_CPU_WORKER:
  39. if (copy_methods->ram_to_ram)
  40. {
  41. copy_methods->ram_to_ram(src_interface, memory_node, dst_interface, memory_node);
  42. return;
  43. }
  44. break;
  45. #ifdef STARPU_USE_CUDA
  46. case STARPU_CUDA_WORKER:
  47. {
  48. cudaStream_t stream = starpu_cuda_get_local_stream();
  49. if (copy_methods->cuda_to_cuda_async)
  50. {
  51. copy_methods->cuda_to_cuda_async(src_interface, memory_node, dst_interface, memory_node, stream);
  52. return;
  53. }
  54. else if (copy_methods->cuda_to_cuda)
  55. {
  56. copy_methods->cuda_to_cuda(src_interface, memory_node, dst_interface, memory_node);
  57. return;
  58. }
  59. break;
  60. }
  61. #endif
  62. case STARPU_OPENCL_WORKER:
  63. if (copy_methods->opencl_to_opencl)
  64. {
  65. copy_methods->opencl_to_opencl(src_interface, memory_node, dst_interface, memory_node);
  66. return;
  67. }
  68. break;
  69. default:
  70. /* unknown architecture */
  71. STARPU_ABORT();
  72. }
  73. STARPU_ASSERT(copy_methods->any_to_any);
  74. copy_methods->any_to_any(src_interface, memory_node, dst_interface, memory_node, NULL);
  75. }
  76. void mp_cpy_kernel(void *descr[], void *cl_arg)
  77. {
  78. unsigned interface_id = *(unsigned *)cl_arg;
  79. const struct starpu_data_interface_ops *interface_ops = _starpu_data_interface_get_ops(interface_id);
  80. const struct starpu_data_copy_methods *copy_methods = interface_ops->copy_methods;
  81. void *dst_interface = descr[0];
  82. void *src_interface = descr[1];
  83. if(copy_methods->ram_to_ram)
  84. copy_methods->ram_to_ram(src_interface, STARPU_MAIN_RAM, dst_interface, STARPU_MAIN_RAM);
  85. else if(copy_methods->any_to_any)
  86. copy_methods->any_to_any(src_interface, STARPU_MAIN_RAM, dst_interface, STARPU_MAIN_RAM, NULL);
  87. else
  88. STARPU_ABORT();
  89. }
  90. static starpu_mic_kernel_t mic_cpy_func()
  91. {
  92. #ifdef STARPU_USE_MIC
  93. starpu_mic_func_symbol_t mic_symbol = NULL;
  94. starpu_mic_register_kernel(&mic_symbol, "mp_cpy_kernel");
  95. return starpu_mic_get_kernel(mic_symbol);
  96. #else
  97. STARPU_ABORT();
  98. return NULL;
  99. #endif
  100. }
  101. struct starpu_perfmodel copy_model =
  102. {
  103. .type = STARPU_HISTORY_BASED,
  104. .symbol = "starpu_data_cpy"
  105. };
  106. static struct starpu_codelet copy_cl =
  107. {
  108. .where = STARPU_CPU|STARPU_CUDA|STARPU_OPENCL|STARPU_MIC,
  109. .cpu_funcs = {common_data_cpy_func},
  110. .cuda_funcs = {common_data_cpy_func},
  111. .opencl_funcs = {common_data_cpy_func},
  112. .mic_funcs = {mic_cpy_func},
  113. .nbuffers = 2,
  114. .modes = {STARPU_W, STARPU_R},
  115. .model = &copy_model
  116. };
  117. int _starpu_data_cpy(starpu_data_handle_t dst_handle, starpu_data_handle_t src_handle,
  118. int asynchronous, void (*callback_func)(void*), void *callback_arg,
  119. int reduction, struct starpu_task *reduction_dep_task)
  120. {
  121. struct starpu_task *task = starpu_task_create();
  122. STARPU_ASSERT(task);
  123. task->name = "data_cpy";
  124. struct _starpu_job *j = _starpu_get_job_associated_to_task(task);
  125. if (reduction)
  126. {
  127. j->reduction_task = reduction;
  128. if (reduction_dep_task)
  129. starpu_task_declare_deps_array(task, 1, &reduction_dep_task);
  130. }
  131. task->cl = &copy_cl;
  132. unsigned *interface_id;
  133. _STARPU_MALLOC(interface_id, sizeof(*interface_id));
  134. *interface_id = dst_handle->ops->interfaceid;
  135. task->cl_arg = interface_id;
  136. task->cl_arg_size = sizeof(*interface_id);
  137. task->cl_arg_free = 1;
  138. task->callback_func = callback_func;
  139. task->callback_arg = callback_arg;
  140. STARPU_TASK_SET_HANDLE(task, dst_handle, 0);
  141. STARPU_TASK_SET_HANDLE(task, src_handle, 1);
  142. task->synchronous = !asynchronous;
  143. int ret = _starpu_task_submit_internally(task);
  144. STARPU_ASSERT(!ret);
  145. return 0;
  146. }
  147. int starpu_data_cpy(starpu_data_handle_t dst_handle, starpu_data_handle_t src_handle,
  148. int asynchronous, void (*callback_func)(void*), void *callback_arg)
  149. {
  150. return _starpu_data_cpy(dst_handle, src_handle, asynchronous, callback_func, callback_arg, 0, NULL);
  151. }