driver_fpga.c 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2009-2020 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
  4. * Copyright (C) 2010 Mehdi Juhoor <mjuhoor@gmail.com>
  5. * Copyright (C) 2011 Télécom-SudParis
  6. *
  7. * StarPU is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU Lesser General Public License as published by
  9. * the Free Software Foundation; either version 2.1 of the License, or (at
  10. * your option) any later version.
  11. *
  12. * StarPU is distributed in the hope that it will be useful, but
  13. * WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  15. *
  16. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  17. */
  18. #include <starpu.h>
  19. #include <starpu_fpga.h>
  20. #include <starpu_profiling.h>
  21. #include <common/utils.h>
  22. #include <common/config.h>
  23. #include <core/debug.h>
  24. #include <drivers/driver_common/driver_common.h>
  25. #include "driver_fpga.h"
  26. #include <core/sched_policy.h>
  27. #include <datawizard/memory_manager.h>
  28. #include <datawizard/memory_nodes.h>
  29. #include <datawizard/malloc.h>
  30. //#include <MaxSLiCInterface.h>
  31. #define KNRM "\x1B[0m"
  32. #define KRED "\x1B[31m"
  33. #define KGRN "\x1B[32m"
  34. #define KYEL "\x1B[33m"
  35. #define KBLU "\x1B[34m"
  36. #define KMAG "\x1B[35m"
  37. #define KCYN "\x1B[36m"
  38. #define KWHT "\x1B[37m"
  39. #define FPGA_OK KGRN
  40. #define FPGA_ERROR KRED
  41. #define NORMAL KNRM
  42. #define FPGA_OK KGRN
  43. //#define STARPU_MAXFPGADEVS 4
  44. /* the number of FPGA devices */
  45. static unsigned nfpgafpgas = -1;
  46. static struct starpu_fpga_device_properties props[STARPU_MAXFPGADEVS];
  47. static size_t global_mem[STARPU_MAXFPGADEVS] = { 128ULL*1024*1024*1024 };
  48. static void _starpu_fpga_limit_global_mem(unsigned );
  49. static size_t _starpu_fpga_get_global_mem_size(unsigned devid);
  50. void fpga_msg(char *msg)
  51. {
  52. printf(FPGA_OK "%s\n" NORMAL, msg);
  53. }
  54. void _starpu_init_fpga()
  55. {
  56. nfpgafpgas = starpu_get_env_number("STARPU_NUM_FPGA_FPGA");
  57. if(nfpgafpgas == -1)
  58. nfpgafpgas =1;
  59. STARPU_ASSERT( nfpgafpgas <= STARPU_MAXFPGADEVS);
  60. //LMemInterface addLMemInterface()
  61. //// pour récupérer l'accès à la LMem
  62. }
  63. #if 0
  64. int fpga_allocate_memory(fpga_mem *ptr, size_t size)
  65. {
  66. //This allocates BYTES
  67. char *msg1="You asked to allocate ";
  68. //printf(KCYN "%s%d*%d\n" KBLU, msg1,size,sizeof(unsigned));
  69. printf(FPGA_OK "%s%lu bytes\n" NORMAL, msg1,size);
  70. *ptr =(fpga_mem) malloc(size);
  71. if (*ptr == NULL)
  72. return 0;
  73. else
  74. return 1;
  75. }
  76. #endif
  77. int starpu_fpga_get_device_properties(struct starpu_fpga_device_properties *props, unsigned devid)
  78. {
  79. //TODO
  80. props->totalGlobalMem=1*1024*1024;
  81. props->concurrentKernels=4;
  82. props->name="Fpga_Props_Name";
  83. return 0;
  84. }
  85. void _starpu_fpga_discover_devices (struct _starpu_machine_config *config)
  86. {
  87. //TODO: This is statically assigned, in the next round of integration
  88. // I will have to read from the struct fpga in fpga
  89. config->topology.nhwfpgafpgas = nfpgafpgas;
  90. }
  91. unsigned _starpu_fpga_get_device_count(void)
  92. {
  93. return nfpgafpgas;
  94. }
  95. static void _starpu_fpga_limit_global_mem(unsigned devid)
  96. {
  97. starpu_ssize_t limit=-1;
  98. //TODO
  99. limit = starpu_get_env_number("STARPU_LIMIT_FPGA_MEM");
  100. if(limit != -1)
  101. global_mem[devid] = limit*1024*1024;
  102. }
  103. static size_t _starpu_fpga_get_global_mem_size(unsigned devid)
  104. {
  105. return global_mem[devid];
  106. }
  107. static void init_fpga_worker_context(unsigned workerid)
  108. {
  109. //starpu_fpgaStreamCreate(&streams[devid][i]);
  110. }
  111. static void init_device_context(unsigned devid)
  112. {
  113. unsigned i;
  114. //TODO: starpu_fpga_set_device
  115. starpu_fpga_set_device(devid);
  116. starpu_fpga_get_device_properties(&props[devid], devid);
  117. //TODO: Do we need the streams? I think no
  118. //cures = starpu_fpgaStreamCreate(&in_transfer_streams[devid]);
  119. //cures = starpu_fpgaStreamCreate(&out_transfer_streams[devid]);
  120. for (i = 0; i < nfpgafpgas; i++)
  121. {
  122. //starpu_fpgaStreamCreate(&in_peer_transfer_streams[i][devid]);
  123. //starpu_fpgaStreamCreate(&out_peer_transfer_streams[devid][i]);
  124. }
  125. }
  126. int _starpu_fpga_driver_init(struct _starpu_worker *worker)
  127. {
  128. int devid = worker->devid;
  129. //fpga_msg("successful till here");
  130. _starpu_driver_start(worker, _STARPU_FUT_CPU_KEY, 1);
  131. /* FIXME: when we have NUMA support, properly turn node number into NUMA node number */
  132. // TODO: drop test when we allocated a memory node for fpga
  133. if (worker->memory_node != STARPU_MAIN_RAM)
  134. _starpu_memory_manager_set_global_memory_size(worker->memory_node, _starpu_fpga_get_global_mem_size(worker->devid));
  135. snprintf(worker->name, sizeof(worker->name), "FPGA %d", devid);
  136. snprintf(worker->short_name, sizeof(worker->short_name), "FPGA %d", devid);
  137. starpu_pthread_setname(worker->short_name);
  138. _STARPU_TRACE_WORKER_INIT_END(worker->workerid);
  139. /* tell the main thread that we are ready */
  140. STARPU_PTHREAD_MUTEX_LOCK(&worker->mutex);
  141. worker->status = STATUS_UNKNOWN;
  142. worker->worker_is_initialized = 1;
  143. STARPU_PTHREAD_COND_SIGNAL(&worker->ready_cond);
  144. STARPU_PTHREAD_MUTEX_UNLOCK(&worker->mutex);
  145. return 0;
  146. }
  147. static int execute_job_on_fpga(struct _starpu_job *j, struct starpu_task *worker_task, struct _starpu_worker *fpga_args, int rank, struct starpu_perfmodel_arch* perf_arch)
  148. {
  149. int ret;
  150. int profiling = starpu_profiling_status_get();
  151. struct starpu_task *task = j->task;
  152. struct starpu_codelet *cl = task->cl;
  153. STARPU_ASSERT(cl);
  154. /* TODO: use asynchronous */
  155. ret = _starpu_fetch_task_input(task, j, 0);
  156. if (ret != 0)
  157. {
  158. /* there was not enough memory so the codelet cannot be executed right now ... */
  159. /* push the codelet back and try another one ... */
  160. return -EAGAIN;
  161. }
  162. /* Give profiling variable */
  163. _starpu_driver_start_job(fpga_args, j, perf_arch, rank, profiling);
  164. /* In case this is a Fork-join parallel task, the worker does not
  165. * execute the kernel at all. */
  166. if ((rank == 0) || (cl->type != STARPU_FORKJOIN))
  167. {
  168. _starpu_cl_func_t func = _starpu_task_get_fpga_nth_implementation(cl, j->nimpl);
  169. //char *kernel_type = _starpu_task_get_fpga_kernel_type_nth_implementation(cl, j->nimpl);
  170. //printf("chanel reserved: %d \n",chnl);
  171. STARPU_ASSERT_MSG(func, "when STARPU_FPGA is defined in 'where', fpga_func or fpga_funcs has to be defined");
  172. if (_starpu_get_disable_kernels() <= 0)
  173. {
  174. _STARPU_TRACE_START_EXECUTING();
  175. //int chnl = fpga_reserve_chanel_of_kernel_type(kernel_type);
  176. //_starpu_fpga_transfer_data(_STARPU_TASK_GET_INTERFACES(task), j, chnl);
  177. //fpga_release_chanel(chnl);
  178. func(_STARPU_TASK_GET_INTERFACES(task), task->cl_arg);
  179. _STARPU_TRACE_END_EXECUTING();
  180. }
  181. }
  182. _starpu_driver_end_job(fpga_args, j, perf_arch, rank, profiling);
  183. _starpu_driver_update_job_feedback(j, fpga_args, perf_arch, profiling);
  184. _starpu_push_task_output(j);
  185. return 0;
  186. }
  187. int _starpu_fpga_driver_run_once(struct _starpu_worker *fpga_worker)
  188. {
  189. unsigned memnode = fpga_worker->memory_node;
  190. int workerid = fpga_worker->workerid;
  191. _STARPU_TRACE_START_PROGRESS(memnode);
  192. _starpu_datawizard_progress(1);
  193. if (memnode != STARPU_MAIN_RAM)
  194. {
  195. _starpu_datawizard_progress(1);
  196. }
  197. _STARPU_TRACE_END_PROGRESS(memnode);
  198. struct _starpu_job *j;
  199. struct starpu_task *task;
  200. int res;
  201. task = _starpu_get_worker_task(fpga_worker, workerid, memnode);
  202. if (!task)
  203. return 0;
  204. j = _starpu_get_job_associated_to_task(task);
  205. /* can a cpu perform that task ? */
  206. if (!_STARPU_FPGA_MAY_PERFORM(j))
  207. {
  208. /* put it and the end of the queue ... XXX */
  209. _starpu_push_task_to_workers(task);
  210. return 0;
  211. }
  212. int rank = 0;
  213. int is_parallel_task = (j->task_size > 1);
  214. struct starpu_perfmodel_arch* perf_arch;
  215. if (is_parallel_task)
  216. {
  217. STARPU_PTHREAD_MUTEX_LOCK(&j->sync_mutex);
  218. rank = j->active_task_alias_count++;
  219. STARPU_PTHREAD_MUTEX_UNLOCK(&j->sync_mutex);
  220. if(j->combined_workerid != -1)
  221. {
  222. struct _starpu_combined_worker *combined_worker;
  223. combined_worker = _starpu_get_combined_worker_struct(j->combined_workerid);
  224. fpga_worker->combined_workerid = j->combined_workerid;
  225. fpga_worker->worker_size = combined_worker->worker_size;
  226. fpga_worker->current_rank = rank;
  227. perf_arch = &combined_worker->perf_arch;
  228. }
  229. else
  230. {
  231. struct _starpu_sched_ctx *sched_ctx = _starpu_sched_ctx_get_sched_ctx_for_worker_and_job(fpga_worker, j);
  232. STARPU_ASSERT_MSG(sched_ctx != NULL, "there should be a worker %d in the ctx of this job \n", fpga_worker->workerid);
  233. perf_arch = &sched_ctx->perf_arch;
  234. }
  235. }
  236. else
  237. {
  238. fpga_worker->combined_workerid = fpga_worker->workerid;
  239. fpga_worker->worker_size = 1;
  240. fpga_worker->current_rank = 0;
  241. perf_arch = &fpga_worker->perf_arch;
  242. }
  243. _starpu_set_current_task(j->task);
  244. fpga_worker->current_task = j->task;
  245. res = execute_job_on_fpga(j, task, fpga_worker, rank, perf_arch);
  246. _starpu_set_current_task(NULL);
  247. fpga_worker->current_task = NULL;
  248. if (res)
  249. {
  250. switch (res)
  251. {
  252. case -EAGAIN:
  253. _starpu_push_task_to_workers(task);
  254. return 0;
  255. default:
  256. STARPU_ABORT();
  257. }
  258. }
  259. /* In the case of combined workers, we need to inform the
  260. * scheduler each worker's execution is over.
  261. * Then we free the workers' task alias */
  262. if (is_parallel_task)
  263. {
  264. _starpu_sched_post_exec_hook(task);
  265. free(task);
  266. }
  267. if (rank == 0)
  268. _starpu_handle_job_termination(j);
  269. return 0;
  270. }
  271. int _starpu_fpga_driver_deinit(struct _starpu_worker *fpga_worker)
  272. {
  273. _STARPU_TRACE_WORKER_DEINIT_START;
  274. unsigned memnode = fpga_worker->memory_node;
  275. _starpu_handle_all_pending_node_data_requests(memnode);
  276. /* In case there remains some memory that was automatically
  277. * allocated by StarPU, we release it now. Note that data
  278. * coherency is not maintained anymore at that point ! */
  279. _starpu_free_all_automatically_allocated_buffers(memnode);
  280. fpga_worker->worker_is_initialized = 0;
  281. _STARPU_TRACE_WORKER_DEINIT_END(_STARPU_FUT_CPU_KEY);
  282. return 0;
  283. }
  284. void *_starpu_fpga_worker(void *_arg)
  285. {
  286. struct _starpu_worker* worker = _arg;
  287. unsigned memnode = worker->memory_node;
  288. _starpu_fpga_driver_init(worker);
  289. _STARPU_TRACE_START_PROGRESS(memnode);
  290. while (_starpu_machine_is_running())
  291. {
  292. _starpu_may_pause();
  293. //fpga_msg("\tEntered the main loop\n");
  294. _starpu_fpga_driver_run_once(worker);
  295. }
  296. _STARPU_TRACE_END_PROGRESS(memnode);
  297. _starpu_fpga_driver_deinit(worker);
  298. return NULL;
  299. }
  300. uintptr_t _starpu_fpga_allocate_memory(unsigned dst_node, size_t size, int flags)
  301. {
  302. (void) flags;
  303. unsigned devid = starpu_memory_node_get_devid(dst_node);
  304. STARPU_ASSERT(devid == 0); // For now
  305. /* 0 would be seen as NULL, i.e. allocation failed... */
  306. // FIXME: Maxeler FPGAs want 192-byte alignment
  307. static fpga_mem current_address = 8192*192;
  308. fpga_mem addr;
  309. // TODO: vérifier si current_address + size > taille de la LMEm
  310. addr = current_address;
  311. current_address += size;
  312. printf("fpga mem returned from allocation @: %p - %p\n",addr, addr + size);
  313. //success = 0
  314. return (uintptr_t) addr;
  315. }
  316. int _starpu_fpga_copy_ram_to_fpga(void *src, void *dst, size_t size)
  317. {
  318. printf("ram to fpga, fpga @= %p\n",dst);
  319. memcpy(dst,src,size);
  320. return 0;
  321. // LMemLoopback_writeLMem(dst, size, src);
  322. }
  323. /* Transfert SIZE bytes from the address pointed by SRC in the SRC_NODE memory
  324. * * node to the address pointed by DST in the DST_NODE memory node
  325. * */
  326. void copy_ram_to_fpga(void *src, void *dst, size_t size)
  327. {
  328. printf("ram to fpga, fpga @= %p\n",dst);
  329. // LMemLoopback_writeLMem(size, dst, src);
  330. }
  331. void copy_fpga_to_ram(void *src, void *dst, size_t size)
  332. {
  333. printf("ram to fpga, fpga @= %p\n",src);
  334. //LMemLoopback_readLMem(size, src, dst);
  335. }
  336. /* Transfert SIZE bytes from the address pointed by SRC in the SRC_NODE memory
  337. * node to the address pointed by DST in the DST_NODE memory node
  338. */
  339. int _starpu_fpga_copy_fpga_to_ram(void *src, void *dst, size_t size)
  340. {
  341. printf("fpga to ram, fpga @= %p\n",src);
  342. memcpy(dst,src,size);
  343. return 0;
  344. //LMemLoopback_readLMem(src, size, dst);
  345. }
  346. /* Transfert SIZE bytes from the address pointed by SRC in the SRC_NODE memory
  347. * node to the address pointed by DST in the DST_NODE memory node
  348. */
  349. int _starpu_fpga_copy_fpga_to_fpga(void *src, void *dst, size_t size)
  350. {
  351. printf("fpga to ram, fpga @= %p\n",src);
  352. memcpy(dst,src,size);
  353. return 0;
  354. //LMemLoopback_XXXLMem(src, size, dst);
  355. }
  356. /* Asynchronous transfers */
  357. int _starpu_fpga_copy_ram_to_fpga_async(void *src, void *dst, size_t size)
  358. {
  359. printf("ram to fpga, fpga @= %p\n",dst);
  360. memcpy(dst,src,size);
  361. return 0;
  362. // Trouver dans la doc une version asynchrone de LMemLoopback_writeLMem();
  363. }
  364. int _starpu_fpga_copy_fpga_to_ram_async(void *src, void *dst, size_t size)
  365. {
  366. printf("fpga to ram, fpga @= %p\n",src);
  367. memcpy(dst,src,size);
  368. return 0;
  369. }
  370. int _starpu_run_fpga(struct _starpu_worker *workerarg)
  371. {
  372. /* Let's go ! */
  373. _starpu_fpga_worker(workerarg);
  374. fpga_msg("\t !!!!! ~~~ I AM IN THE DRIVER ~~~\n");
  375. return 0;
  376. }
  377. void _starpu_fpga_transfer_data(void *buffers[], struct _starpu_job *j, int chnl)
  378. {
  379. struct starpu_task *task = j->task;
  380. unsigned nbuffers = STARPU_TASK_GET_NBUFFERS(task);
  381. unsigned index;
  382. for (index = 0; index < nbuffers; index++)
  383. {
  384. starpu_data_handle_t handle = STARPU_TASK_GET_HANDLE(task, index);
  385. // enum starpu_data_access_mode mode = STARPU_TASK_GET_MODE(task, index);
  386. unsigned *interface_id = (unsigned *)malloc(sizeof(unsigned));
  387. *interface_id = handle->ops->interfaceid;
  388. switch (*interface_id)
  389. {
  390. case STARPU_VARIABLE_INTERFACE_ID:
  391. {
  392. void *ptr = (void*) STARPU_VARIABLE_GET_PTR(buffers[index]);
  393. size_t size = STARPU_VARIABLE_GET_ELEMSIZE(buffers[index]);
  394. //fpga_data_send(chnl,ptr,size);
  395. printf("Driver Fpga @: %p, size %lu \n",ptr,size);
  396. break;
  397. }
  398. case STARPU_MATRIX_INTERFACE_ID:
  399. case STARPU_BLOCK_INTERFACE_ID:
  400. case STARPU_VECTOR_INTERFACE_ID:
  401. case STARPU_CSR_INTERFACE_ID:
  402. case STARPU_BCSR_INTERFACE_ID:
  403. case STARPU_MULTIFORMAT_INTERFACE_ID:
  404. fpga_msg("Interface not supported yet");
  405. default:
  406. STARPU_ABORT();
  407. }
  408. }
  409. }
  410. int _starpu_fpga_copy_data_from_cpu_to_fpga(uintptr_t src, size_t src_offset, unsigned src_node, uintptr_t dst, size_t dst_offset, unsigned dst_node, size_t ssize, struct _starpu_async_channel *async_channel)
  411. {
  412. return _starpu_fpga_copy_ram_to_fpga((void*) src + src_offset, (void*) dst + dst_offset, ssize);
  413. }
  414. int _starpu_fpga_copy_data_from_fpga_to_cpu(uintptr_t src, size_t src_offset, unsigned src_node, uintptr_t dst, size_t dst_offset, unsigned dst_node, size_t ssize, struct _starpu_async_channel *async_channel)
  415. {
  416. return _starpu_fpga_copy_fpga_to_ram((void*) src + src_offset, (void*) dst + dst_offset, ssize);
  417. }
  418. int _starpu_fpga_copy_data_from_fpga_to_fpga(uintptr_t src, size_t src_offset, unsigned src_node, uintptr_t dst, size_t dst_offset, unsigned dst_node, size_t ssize, struct _starpu_async_channel *async_channel)
  419. {
  420. return _starpu_fpga_copy_fpga_to_fpga((void*) src + src_offset, (void*) dst + dst_offset, ssize);
  421. }
  422. int _starpu_fpga_copy_interface_from_fpga_to_cpu(starpu_data_handle_t handle, void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, struct _starpu_data_request *req)
  423. {
  424. int src_kind = starpu_node_get_kind(src_node);
  425. int dst_kind = starpu_node_get_kind(dst_node);
  426. STARPU_ASSERT(src_kind == STARPU_FPGA_RAM && dst_kind == STARPU_CPU_RAM);
  427. int ret = 1;
  428. const struct starpu_data_copy_methods *copy_methods = handle->ops->copy_methods;
  429. if (!req || starpu_asynchronous_copy_disabled() || starpu_asynchronous_fpga_copy_disabled() ||
  430. !(copy_methods->fpga_to_ram_async || copy_methods->any_to_any))
  431. {
  432. /* this is not associated to a request so it's synchronous */
  433. STARPU_ASSERT(copy_methods->fpga_to_ram || copy_methods->any_to_any);
  434. if (copy_methods->fpga_to_ram)
  435. copy_methods->fpga_to_ram(src_interface, src_node, dst_interface, dst_node);
  436. else
  437. copy_methods->any_to_any(src_interface, src_node, dst_interface, dst_node, NULL);
  438. }
  439. else
  440. {
  441. //req->async_channel.type = STARPU_FPGA_RAM;
  442. if (copy_methods->fpga_to_ram_async)
  443. ret = copy_methods->fpga_to_ram_async(src_interface, src_node, dst_interface, dst_node);
  444. else
  445. {
  446. STARPU_ASSERT(copy_methods->any_to_any);
  447. ret = copy_methods->any_to_any(src_interface, src_node, dst_interface, dst_node, &req->async_channel);
  448. }
  449. //_starpu_fpga_init_event(&(req->async_channel.event.fpga_event), src_node);
  450. }
  451. return ret;
  452. }
  453. int _starpu_fpga_copy_interface_from_cpu_to_fpga(starpu_data_handle_t handle, void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, struct _starpu_data_request *req)
  454. {
  455. int src_kind = starpu_node_get_kind(src_node);
  456. int dst_kind = starpu_node_get_kind(dst_node);
  457. STARPU_ASSERT(src_kind == STARPU_CPU_RAM && dst_kind == STARPU_FPGA_RAM);
  458. const struct starpu_data_copy_methods *copy_methods = handle->ops->copy_methods;
  459. if (!req || starpu_asynchronous_copy_disabled() || starpu_asynchronous_fpga_copy_disabled() ||
  460. !(copy_methods->ram_to_fpga_async || copy_methods->any_to_any))
  461. {
  462. /* this is not associated to a request so it's synchronous */
  463. STARPU_ASSERT(copy_methods->ram_to_fpga || copy_methods->any_to_any);
  464. if (copy_methods->ram_to_fpga)
  465. copy_methods->ram_to_fpga(src_interface, src_node, dst_interface, dst_node);
  466. else
  467. copy_methods->any_to_any(src_interface, src_node, dst_interface, dst_node, NULL);
  468. }
  469. else
  470. {
  471. //req->async_channel.type = STARPU_FPGA_RAM;
  472. if (copy_methods->ram_to_fpga_async)
  473. copy_methods->ram_to_fpga_async(src_interface, src_node, dst_interface, dst_node);
  474. else
  475. {
  476. STARPU_ASSERT(copy_methods->any_to_any);
  477. copy_methods->any_to_any(src_interface, src_node, dst_interface, dst_node, &req->async_channel);
  478. }
  479. //_starpu_fpga_init_event(&(req->async_channel.event.fpga_event), dst_node);
  480. }
  481. return 0;
  482. }
  483. struct _starpu_driver_ops _starpu_driver_fpga_ops =
  484. {
  485. .init = _starpu_fpga_driver_init,
  486. .run = _starpu_run_fpga,
  487. .run_once = _starpu_fpga_driver_run_once,
  488. .deinit = _starpu_fpga_driver_deinit
  489. };
  490. // TODO: structure node_ops, comme dans driver_cuda.c, avec starpu_fpga_allocate_memory, etc.
  491. struct _starpu_node_ops _starpu_driver_fpga_node_ops =
  492. {
  493. .copy_data_to[STARPU_UNUSED] = NULL,
  494. .copy_data_to[STARPU_CPU_RAM] = _starpu_fpga_copy_data_from_fpga_to_cpu,
  495. .copy_data_to[STARPU_FPGA_RAM] = _starpu_fpga_copy_data_from_fpga_to_fpga,
  496. .copy_data_to[STARPU_OPENCL_RAM] = NULL,
  497. .copy_data_to[STARPU_DISK_RAM] = NULL,
  498. .copy_data_to[STARPU_MIC_RAM] = NULL,
  499. .copy_data_to[STARPU_MPI_MS_RAM] = NULL,
  500. .copy_interface_to[STARPU_UNUSED] = NULL,
  501. .copy_interface_to[STARPU_CPU_RAM] = _starpu_fpga_copy_interface_from_fpga_to_cpu,
  502. .copy_interface_to[STARPU_FPGA_RAM] = NULL,
  503. .copy_interface_to[STARPU_OPENCL_RAM] = NULL,
  504. .copy_interface_to[STARPU_DISK_RAM] = NULL,
  505. .copy_interface_to[STARPU_MIC_RAM] = NULL,
  506. .copy_interface_to[STARPU_MPI_MS_RAM] = NULL,
  507. .wait_request_completion = NULL,
  508. .test_request_completion = NULL,
  509. .is_direct_access_supported = NULL,
  510. .malloc_on_node = _starpu_fpga_allocate_memory,
  511. .free_on_node = NULL,
  512. .name = "fpga driver"
  513. };