/* StarPU --- Runtime system for heterogeneous multicore architectures.
 *
 * Copyright (C) 2010, 2012-2013  Université de Bordeaux 1
 *
 * StarPU is free software; you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published by
 * the Free Software Foundation; either version 2.1 of the License, or (at
 * your option) any later version.
 *
 * StarPU is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 *
 * See the GNU Lesser General Public License in COPYING.LGPL for more details.
 */
- #include <starpu.h>
- #include <common/config.h>
- #include <core/task.h>
- #include <datawizard/datawizard.h>
- #include <util/starpu_data_cpy.h>
- static void data_cpy_func(void *descr[], void *cl_arg)
- {
- const struct starpu_data_copy_methods *copy_methods = (const struct starpu_data_copy_methods *) cl_arg;
- int workerid = starpu_worker_get_id();
- enum starpu_worker_archtype type = starpu_worker_get_type(workerid);
- unsigned memory_node = starpu_worker_get_memory_node(workerid);
- void *dst_interface = descr[0];
- void *src_interface = descr[1];
- switch (type)
- {
- case STARPU_CPU_WORKER:
- if (copy_methods->ram_to_ram)
- {
- copy_methods->ram_to_ram(src_interface, memory_node, dst_interface, memory_node);
- return;
- }
- break;
- case STARPU_CUDA_WORKER:
- if (copy_methods->cuda_to_cuda)
- {
- copy_methods->cuda_to_cuda(src_interface, memory_node, dst_interface, memory_node);
- return;
- }
- break;
- case STARPU_OPENCL_WORKER:
- if (copy_methods->opencl_to_opencl)
- {
- copy_methods->opencl_to_opencl(src_interface, memory_node, dst_interface, memory_node);
- return;
- }
- break;
- default:
- /* unknown architecture */
- STARPU_ABORT();
- }
- STARPU_ASSERT(copy_methods->any_to_any);
- copy_methods->any_to_any(src_interface, memory_node, dst_interface, memory_node, NULL);
- }
- struct starpu_perfmodel copy_model =
- {
- .type = STARPU_HISTORY_BASED,
- .symbol = "starpu_data_cpy"
- };
- static struct starpu_codelet copy_cl =
- {
- .where = STARPU_CPU|STARPU_CUDA|STARPU_OPENCL,
- .cpu_funcs = {data_cpy_func, NULL},
- .cuda_funcs = {data_cpy_func, NULL},
- .opencl_funcs = {data_cpy_func, NULL},
- .nbuffers = 2,
- .modes = {STARPU_W, STARPU_R},
- .model = ©_model
- };
- int _starpu_data_cpy(starpu_data_handle_t dst_handle, starpu_data_handle_t src_handle,
- int asynchronous, void (*callback_func)(void*), void *callback_arg,
- int reduction, struct starpu_task *reduction_dep_task)
- {
- const struct starpu_data_copy_methods *copy_methods = dst_handle->ops->copy_methods;
- struct starpu_task *task = starpu_task_create();
- STARPU_ASSERT(task);
- struct _starpu_job *j = _starpu_get_job_associated_to_task(task);
- if (reduction)
- {
- j->reduction_task = reduction;
- if (reduction_dep_task)
- starpu_task_declare_deps_array(task, 1, &reduction_dep_task);
- }
- task->cl = ©_cl;
- task->cl_arg = (void *)copy_methods;
- task->callback_func = callback_func;
- task->callback_arg = callback_arg;
- STARPU_TASK_SET_HANDLE(task, dst_handle, 0);
- STARPU_TASK_SET_HANDLE(task, src_handle, 1);
- task->synchronous = !asynchronous;
- int ret = _starpu_task_submit_internally(task);
- STARPU_ASSERT(!ret);
- return 0;
- }
- int starpu_data_cpy(starpu_data_handle_t dst_handle, starpu_data_handle_t src_handle,
- int asynchronous, void (*callback_func)(void*), void *callback_arg)
- {
- return _starpu_data_cpy(dst_handle, src_handle, asynchronous, callback_func, callback_arg, 0, NULL);
- }
|