fstarpu.c 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2016 Inria
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include <stdlib.h>
  17. #include <stdio.h>
  18. #include <string.h>
  19. #include <starpu.h>
  20. #define _FSTARPU_ERROR(msg) do {fprintf(stderr, "fstarpu error: %s\n", (msg));abort();} while(0)
  21. typedef void (*_starpu_callback_func_t)(void *);
  22. static const intptr_t fstarpu_r = STARPU_R;
  23. static const intptr_t fstarpu_w = STARPU_W;
  24. static const intptr_t fstarpu_rw = STARPU_RW;
  25. static const intptr_t fstarpu_scratch = STARPU_SCRATCH;
  26. static const intptr_t fstarpu_redux = STARPU_REDUX;
  27. static const intptr_t fstarpu_commute = STARPU_COMMUTE;
  28. static const intptr_t fstarpu_ssend = STARPU_SSEND;
  29. static const intptr_t fstarpu_locality = STARPU_LOCALITY;
  30. static const intptr_t fstarpu_data_array = STARPU_DATA_ARRAY;
  31. static const intptr_t fstarpu_data_mode_array = STARPU_DATA_MODE_ARRAY;
  32. static const intptr_t fstarpu_cl_args = STARPU_CL_ARGS;
  33. static const intptr_t fstarpu_callback = STARPU_CALLBACK;
  34. static const intptr_t fstarpu_callback_with_arg = STARPU_CALLBACK_WITH_ARG;
  35. static const intptr_t fstarpu_callback_arg = STARPU_CALLBACK_ARG;
  36. static const intptr_t fstarpu_prologue_callback = STARPU_PROLOGUE_CALLBACK;
  37. static const intptr_t fstarpu_prologue_callback_arg = STARPU_PROLOGUE_CALLBACK_ARG;
  38. static const intptr_t fstarpu_prologue_callback_pop = STARPU_PROLOGUE_CALLBACK_POP;
  39. static const intptr_t fstarpu_prologue_callback_pop_arg = STARPU_PROLOGUE_CALLBACK_POP_ARG;
  40. static const intptr_t fstarpu_priority = STARPU_PRIORITY;
  41. static const intptr_t fstarpu_execute_on_node = STARPU_EXECUTE_ON_NODE;
  42. static const intptr_t fstarpu_execute_on_data = STARPU_EXECUTE_ON_DATA;
  43. static const intptr_t fstarpu_execute_on_worker = STARPU_EXECUTE_ON_WORKER;
  44. static const intptr_t fstarpu_worker_order = STARPU_WORKER_ORDER;
  45. static const intptr_t fstarpu_hypervisor_tag = STARPU_HYPERVISOR_TAG;
  46. static const intptr_t fstarpu_possibly_parallel = STARPU_POSSIBLY_PARALLEL;
  47. static const intptr_t fstarpu_flops = STARPU_FLOPS;
  48. static const intptr_t fstarpu_tag = STARPU_TAG;
  49. static const intptr_t fstarpu_tag_only = STARPU_TAG_ONLY;
  50. static const intptr_t fstarpu_name = STARPU_NAME;
  51. static const intptr_t fstarpu_node_selection_policy = STARPU_NODE_SELECTION_POLICY;
  52. static const intptr_t fstarpu_value = STARPU_VALUE;
  53. static const intptr_t fstarpu_sched_ctx = STARPU_SCHED_CTX;
  54. static const intptr_t fstarpu_cpu_worker = STARPU_CPU_WORKER;
  55. static const intptr_t fstarpu_cuda_worker = STARPU_CUDA_WORKER;
  56. static const intptr_t fstarpu_opencl_worker = STARPU_OPENCL_WORKER;
  57. static const intptr_t fstarpu_mic_worker = STARPU_MIC_WORKER;
  58. static const intptr_t fstarpu_scc_worker = STARPU_SCC_WORKER;
  59. static const intptr_t fstarpu_any_worker = STARPU_ANY_WORKER;
  60. static const intptr_t fstarpu_nmaxbufs = STARPU_NMAXBUFS;
  61. static const intptr_t fstarpu_sched_ctx_policy_name = STARPU_SCHED_CTX_POLICY_NAME;
  62. static const intptr_t fstarpu_sched_ctx_policy_struct = STARPU_SCHED_CTX_POLICY_STRUCT;
  63. static const intptr_t fstarpu_sched_ctx_policy_min_prio = STARPU_SCHED_CTX_POLICY_MIN_PRIO;
  64. static const intptr_t fstarpu_sched_ctx_policy_max_prio = STARPU_SCHED_CTX_POLICY_MAX_PRIO;
  65. static const intptr_t fstarpu_sched_ctx_hierarchy_level = STARPU_SCHED_CTX_HIERARCHY_LEVEL;
  66. static const intptr_t fstarpu_sched_ctx_nested = STARPU_SCHED_CTX_NESTED;
  67. static const intptr_t fstarpu_sched_ctx_awake_workers = STARPU_SCHED_CTX_AWAKE_WORKERS;
  68. static const intptr_t fstarpu_sched_ctx_policy_init = STARPU_SCHED_CTX_POLICY_INIT;
  69. static const intptr_t fstarpu_sched_ctx_user_data = STARPU_SCHED_CTX_USER_DATA;
  70. static const intptr_t fstarpu_starpu_nowhere = STARPU_NOWHERE;
  71. static const intptr_t fstarpu_starpu_cpu = STARPU_CPU;
  72. static const intptr_t fstarpu_starpu_cuda = STARPU_CUDA;
  73. static const intptr_t fstarpu_starpu_opencl = STARPU_OPENCL;
  74. static const intptr_t fstarpu_starpu_mic = STARPU_MIC;
  75. static const intptr_t fstarpu_starpu_scc = STARPU_SCC;
  76. static const intptr_t fstarpu_starpu_codelet_simgrid_execute = STARPU_CODELET_SIMGRID_EXECUTE;
  77. static const intptr_t fstarpu_starpu_cuda_async = STARPU_CUDA_ASYNC;
  78. static const intptr_t fstarpu_starpu_opencl_async = STARPU_OPENCL_ASYNC;
  79. intptr_t fstarpu_get_constant(char *s)
  80. {
  81. if (!strcmp(s, "FSTARPU_R")) { return fstarpu_r; }
  82. else if (!strcmp(s, "FSTARPU_W")) { return fstarpu_w; }
  83. else if (!strcmp(s, "FSTARPU_RW")) { return fstarpu_rw; }
  84. else if (!strcmp(s, "FSTARPU_SCRATCH")) { return fstarpu_scratch; }
  85. else if (!strcmp(s, "FSTARPU_REDUX")) { return fstarpu_redux; }
  86. else if (!strcmp(s, "FSTARPU_COMMUTE")) { return fstarpu_commute; }
  87. else if (!strcmp(s, "FSTARPU_SSEND")) { return fstarpu_ssend; }
  88. else if (!strcmp(s, "FSTARPU_LOCALITY")) { return fstarpu_locality; }
  89. else if (!strcmp(s, "FSTARPU_DATA_ARRAY")) { return fstarpu_data_array; }
  90. else if (!strcmp(s, "FSTARPU_DATA_MODE_ARRAY")) { return fstarpu_data_mode_array; }
  91. else if (!strcmp(s, "FSTARPU_CL_ARGS")) { return fstarpu_cl_args; }
  92. else if (!strcmp(s, "FSTARPU_CALLBACK")) { return fstarpu_callback; }
  93. else if (!strcmp(s, "FSTARPU_CALLBACK_WITH_ARG")) { return fstarpu_callback_with_arg; }
  94. else if (!strcmp(s, "FSTARPU_CALLBACK_ARG")) { return fstarpu_callback_arg; }
  95. else if (!strcmp(s, "FSTARPU_PROLOGUE_CALLBACK")) { return fstarpu_prologue_callback; }
  96. else if (!strcmp(s, "FSTARPU_PROLOGUE_CALLBACK_ARG")) { return fstarpu_prologue_callback_arg; }
  97. else if (!strcmp(s, "FSTARPU_PROLOGUE_CALLBACK_POP")) { return fstarpu_prologue_callback_pop; }
  98. else if (!strcmp(s, "FSTARPU_PROLOGUE_CALLBACK_POP_ARG")) { return fstarpu_prologue_callback_pop_arg; }
  99. else if (!strcmp(s, "FSTARPU_PRIORITY")) { return fstarpu_priority; }
  100. else if (!strcmp(s, "FSTARPU_EXECUTE_ON_NODE")) { return fstarpu_execute_on_node; }
  101. else if (!strcmp(s, "FSTARPU_EXECUTE_ON_DATA")) { return fstarpu_execute_on_data; }
  102. else if (!strcmp(s, "FSTARPU_EXECUTE_ON_WORKER")) { return fstarpu_execute_on_worker; }
  103. else if (!strcmp(s, "FSTARPU_WORKER_ORDER")) { return fstarpu_worker_order; }
  104. else if (!strcmp(s, "FSTARPU_HYPERVISOR_TAG")) { return fstarpu_hypervisor_tag; }
  105. else if (!strcmp(s, "FSTARPU_POSSIBLY_PARALLEL")) { return fstarpu_possibly_parallel; }
  106. else if (!strcmp(s, "FSTARPU_FLOPS")) { return fstarpu_flops; }
  107. else if (!strcmp(s, "FSTARPU_TAG")) { return fstarpu_tag; }
  108. else if (!strcmp(s, "FSTARPU_TAG_ONLY")) { return fstarpu_tag_only; }
  109. else if (!strcmp(s, "FSTARPU_NAME")) { return fstarpu_name; }
  110. else if (!strcmp(s, "FSTARPU_NODE_SELECTION_POLICY")) { return fstarpu_node_selection_policy; }
  111. else if (!strcmp(s, "FSTARPU_VALUE")) { return fstarpu_value; }
  112. else if (!strcmp(s, "FSTARPU_SCHED_CTX")) { return fstarpu_sched_ctx; }
  113. else if (!strcmp(s, "FSTARPU_CPU_WORKER")) { return fstarpu_cpu_worker; }
  114. else if (!strcmp(s, "FSTARPU_CUDA_WORKER")) { return fstarpu_cuda_worker; }
  115. else if (!strcmp(s, "FSTARPU_OPENCL_WORKER")) { return fstarpu_opencl_worker; }
  116. else if (!strcmp(s, "FSTARPU_MIC_WORKER")) { return fstarpu_mic_worker; }
  117. else if (!strcmp(s, "FSTARPU_SCC_WORKER")) { return fstarpu_scc_worker; }
  118. else if (!strcmp(s, "FSTARPU_ANY_WORKER")) { return fstarpu_any_worker; }
  119. else if (!strcmp(s, "FSTARPU_NMAXBUFS")) { return fstarpu_nmaxbufs; }
  120. else if (!strcmp(s, "FSTARPU_SCHED_CTX_POLICY_NAME")) { return fstarpu_sched_ctx_policy_name; }
  121. else if (!strcmp(s, "FSTARPU_SCHED_CTX_POLICY_STRUCT")) { return fstarpu_sched_ctx_policy_struct; }
  122. else if (!strcmp(s, "FSTARPU_SCHED_CTX_POLICY_MIN_PRIO")) { return fstarpu_sched_ctx_policy_min_prio; }
  123. else if (!strcmp(s, "FSTARPU_SCHED_CTX_POLICY_MAX_PRIO")) { return fstarpu_sched_ctx_policy_max_prio; }
  124. else if (!strcmp(s, "FSTARPU_SCHED_CTX_HIERARCHY_LEVEL")) { return fstarpu_sched_ctx_hierarchy_level; }
  125. else if (!strcmp(s, "FSTARPU_SCHED_CTX_NESTED")) { return fstarpu_sched_ctx_nested; }
  126. else if (!strcmp(s, "FSTARPU_SCHED_CTX_AWAKE_WORKERS")) { return fstarpu_sched_ctx_awake_workers; }
  127. else if (!strcmp(s, "FSTARPU_SCHED_CTX_POLICY_INIT")) { return fstarpu_sched_ctx_policy_init; }
  128. else if (!strcmp(s, "FSTARPU_SCHED_CTX_USER_DATA")) { return fstarpu_sched_ctx_user_data; }
  129. else if (!strcmp(s, "FSTARPU_NOWHERE")) { return fstarpu_starpu_nowhere; }
  130. else if (!strcmp(s, "FSTARPU_CPU")) { return fstarpu_starpu_cpu; }
  131. else if (!strcmp(s, "FSTARPU_CUDA")) { return fstarpu_starpu_cuda; }
  132. else if (!strcmp(s, "FSTARPU_OPENCL")) { return fstarpu_starpu_opencl; }
  133. else if (!strcmp(s, "FSTARPU_MIC")) { return fstarpu_starpu_mic; }
  134. else if (!strcmp(s, "FSTARPU_SCC")) { return fstarpu_starpu_scc; }
  135. else if (!strcmp(s, "FSTARPU_CODELET_SIMGRID_EXECUTE")) { return fstarpu_starpu_codelet_simgrid_execute; }
  136. else if (!strcmp(s, "FSTARPU_CUDA_ASYNC")) { return fstarpu_starpu_cuda_async; }
  137. else if (!strcmp(s, "FSTARPU_OPENCL_ASYNC")) { return fstarpu_starpu_opencl_async; }
  138. else { _FSTARPU_ERROR("unknown constant"); }
  139. }
  140. struct starpu_conf *fstarpu_conf_allocate(void)
  141. {
  142. struct starpu_conf *conf;
  143. _STARPU_MALLOC(conf, sizeof(*conf));
  144. starpu_conf_init(conf);
  145. return conf;
  146. }
  147. void fstarpu_conf_free(struct starpu_conf *conf)
  148. {
  149. memset(conf, 0, sizeof(*conf));
  150. free(conf);
  151. }
  152. void fstarpu_conf_set_sched_policy_name(struct starpu_conf *conf, const char *sched_policy_name)
  153. {
  154. conf->sched_policy_name = sched_policy_name;
  155. }
  156. void fstarpu_conf_set_min_prio(struct starpu_conf *conf, int min_prio)
  157. {
  158. conf->global_sched_ctx_min_priority = min_prio;
  159. }
  160. void fstarpu_conf_set_max_prio(struct starpu_conf *conf, int max_prio)
  161. {
  162. conf->global_sched_ctx_max_priority = max_prio;
  163. }
  164. void fstarpu_conf_set_ncpu(struct starpu_conf *conf, int ncpu)
  165. {
  166. STARPU_ASSERT(ncpu >= 0 && ncpu <= STARPU_NMAXWORKERS);
  167. conf->ncpus = ncpu;
  168. }
  169. void fstarpu_conf_set_ncuda(struct starpu_conf *conf, int ncuda)
  170. {
  171. STARPU_ASSERT(ncuda >= 0 && ncuda <= STARPU_NMAXWORKERS);
  172. conf->ncuda = ncuda;
  173. }
  174. void fstarpu_conf_set_nopencl(struct starpu_conf *conf, int nopencl)
  175. {
  176. STARPU_ASSERT(nopencl >= 0 && nopencl <= STARPU_NMAXWORKERS);
  177. conf->nopencl = nopencl;
  178. }
  179. void fstarpu_conf_set_nmic(struct starpu_conf *conf, int nmic)
  180. {
  181. STARPU_ASSERT(nmic >= 0 && nmic <= STARPU_NMAXWORKERS);
  182. conf->nmic = nmic;
  183. }
  184. void fstarpu_conf_set_nscc(struct starpu_conf *conf, int nscc)
  185. {
  186. STARPU_ASSERT(nscc >= 0 && nscc <= STARPU_NMAXWORKERS);
  187. conf->nscc = nscc;
  188. }
  189. void fstarpu_conf_set_calibrate(struct starpu_conf *conf, int calibrate)
  190. {
  191. STARPU_ASSERT(calibrate == 0 || calibrate == 1);
  192. conf->calibrate = calibrate;
  193. }
  194. void fstarpu_conf_set_bus_calibrate(struct starpu_conf *conf, int bus_calibrate)
  195. {
  196. STARPU_ASSERT(bus_calibrate == 0 || bus_calibrate == 1);
  197. conf->bus_calibrate = bus_calibrate;
  198. }
  199. void fstarpu_topology_print(void)
  200. {
  201. starpu_topology_print(stderr);
  202. }
  203. struct starpu_codelet *fstarpu_codelet_allocate(void)
  204. {
  205. struct starpu_codelet *cl;
  206. _STARPU_MALLOC(cl, sizeof(*cl));
  207. starpu_codelet_init(cl);
  208. return cl;
  209. }
  210. void fstarpu_codelet_free(struct starpu_codelet *cl)
  211. {
  212. memset(cl, 0, sizeof(*cl));
  213. free(cl);
  214. }
  215. void fstarpu_codelet_set_name(struct starpu_codelet *cl, const char *cl_name)
  216. {
  217. cl->name = cl_name;
  218. }
  219. void fstarpu_codelet_add_cpu_func(struct starpu_codelet *cl, void *f_ptr)
  220. {
  221. const size_t max_cpu_funcs = sizeof(cl->cpu_funcs)/sizeof(cl->cpu_funcs[0])-1;
  222. size_t i;
  223. for (i = 0; i < max_cpu_funcs; i++)
  224. {
  225. if (cl->cpu_funcs[i] == NULL)
  226. {
  227. cl->cpu_funcs[i] = f_ptr;
  228. return;
  229. }
  230. }
  231. _FSTARPU_ERROR("fstarpu: too many cpu functions in Fortran codelet");
  232. }
  233. void fstarpu_codelet_add_cuda_func(struct starpu_codelet *cl, void *f_ptr)
  234. {
  235. const size_t max_cuda_funcs = sizeof(cl->cuda_funcs)/sizeof(cl->cuda_funcs[0])-1;
  236. unsigned i;
  237. for (i = 0; i < max_cuda_funcs; i++)
  238. {
  239. if (cl->cuda_funcs[i] == NULL)
  240. {
  241. cl->cuda_funcs[i] = f_ptr;
  242. return;
  243. }
  244. }
  245. _FSTARPU_ERROR("fstarpu: too many cuda functions in Fortran codelet");
  246. }
  247. void fstarpu_codelet_add_cuda_flags(struct starpu_codelet *cl, intptr_t flags)
  248. {
  249. const size_t max_cuda_flags = sizeof(cl->cuda_flags)/sizeof(cl->cuda_flags[0])-1;
  250. unsigned i;
  251. for (i = 0; i < max_cuda_flags; i++)
  252. {
  253. if (cl->cuda_flags[i] == 0)
  254. {
  255. cl->cuda_flags[i] = (char)flags;
  256. return;
  257. }
  258. }
  259. _FSTARPU_ERROR("fstarpu: too many cuda flags in Fortran codelet");
  260. }
  261. void fstarpu_codelet_add_opencl_func(struct starpu_codelet *cl, void *f_ptr)
  262. {
  263. const size_t max_opencl_funcs = sizeof(cl->opencl_funcs)/sizeof(cl->opencl_funcs[0])-1;
  264. unsigned i;
  265. for (i = 0; i < max_opencl_funcs; i++)
  266. {
  267. if (cl->opencl_funcs[i] == NULL)
  268. {
  269. cl->opencl_funcs[i] = f_ptr;
  270. return;
  271. }
  272. }
  273. _FSTARPU_ERROR("fstarpu: too many opencl functions in Fortran codelet");
  274. }
  275. void fstarpu_codelet_add_opencl_flags(struct starpu_codelet *cl, intptr_t flags)
  276. {
  277. const size_t max_opencl_flags = sizeof(cl->opencl_flags)/sizeof(cl->opencl_flags[0])-1;
  278. unsigned i;
  279. for (i = 0; i < max_opencl_flags; i++)
  280. {
  281. if (cl->opencl_flags[i] == 0)
  282. {
  283. cl->opencl_flags[i] = (char)flags;
  284. return;
  285. }
  286. }
  287. _FSTARPU_ERROR("fstarpu: too many opencl flags in Fortran codelet");
  288. }
  289. void fstarpu_codelet_add_mic_func(struct starpu_codelet *cl, void *f_ptr)
  290. {
  291. const size_t max_mic_funcs = sizeof(cl->mic_funcs)/sizeof(cl->mic_funcs[0])-1;
  292. unsigned i;
  293. for (i = 0; i < max_mic_funcs; i++)
  294. {
  295. if (cl->mic_funcs[i] == NULL)
  296. {
  297. cl->mic_funcs[i] = f_ptr;
  298. return;
  299. }
  300. }
  301. _FSTARPU_ERROR("fstarpu: too many mic functions in Fortran codelet");
  302. }
  303. void fstarpu_codelet_add_scc_func(struct starpu_codelet *cl, void *f_ptr)
  304. {
  305. const size_t max_scc_funcs = sizeof(cl->scc_funcs)/sizeof(cl->scc_funcs[0])-1;
  306. unsigned i;
  307. for (i = 0; i < max_scc_funcs; i++)
  308. {
  309. if (cl->scc_funcs[i] == NULL)
  310. {
  311. cl->scc_funcs[i] = f_ptr;
  312. return;
  313. }
  314. }
  315. _FSTARPU_ERROR("fstarpu: too many scc functions in Fortran codelet");
  316. }
  317. void fstarpu_codelet_add_buffer(struct starpu_codelet *cl, intptr_t _mode)
  318. {
  319. enum starpu_data_access_mode mode = (enum starpu_data_access_mode) _mode;
  320. const size_t max_modes = sizeof(cl->modes)/sizeof(cl->modes[0])-1;
  321. if ((mode & (STARPU_ACCESS_MODE_MAX-1)) != mode)
  322. {
  323. _FSTARPU_ERROR("fstarpu: invalid data mode");
  324. }
  325. if (cl->nbuffers < (int) max_modes)
  326. {
  327. cl->modes[cl->nbuffers] = (unsigned int)mode;
  328. cl->nbuffers++;
  329. }
  330. else
  331. {
  332. _FSTARPU_ERROR("fstarpu: too many buffers in Fortran codelet");
  333. }
  334. }
  335. void fstarpu_codelet_set_variable_nbuffers(struct starpu_codelet *cl)
  336. {
  337. cl->nbuffers = STARPU_VARIABLE_NBUFFERS;
  338. }
  339. void fstarpu_codelet_set_nbuffers(struct starpu_codelet *cl, int nbuffers)
  340. {
  341. if (nbuffers >= 0)
  342. {
  343. cl->nbuffers = nbuffers;
  344. }
  345. else
  346. {
  347. _FSTARPU_ERROR("fstarpu: invalid nbuffers parameter");
  348. }
  349. }
  350. void fstarpu_codelet_set_flags(struct starpu_codelet *cl, intptr_t flags)
  351. {
  352. cl->flags = (int)flags;
  353. }
  354. void fstarpu_codelet_set_where(struct starpu_codelet *cl, intptr_t where)
  355. {
  356. STARPU_ASSERT(where >= 0);
  357. cl->where = (uint32_t)where;
  358. }
  359. void * fstarpu_variable_get_ptr(void *buffers[], int i)
  360. {
  361. return (void *)STARPU_VECTOR_GET_PTR(buffers[i]);
  362. }
  363. void * fstarpu_vector_get_ptr(void *buffers[], int i)
  364. {
  365. return (void *)STARPU_VECTOR_GET_PTR(buffers[i]);
  366. }
  367. int fstarpu_vector_get_nx(void *buffers[], int i)
  368. {
  369. return STARPU_VECTOR_GET_NX(buffers[i]);
  370. }
  371. void * fstarpu_matrix_get_ptr(void *buffers[], int i)
  372. {
  373. return (void *)STARPU_MATRIX_GET_PTR(buffers[i]);
  374. }
  375. int fstarpu_matrix_get_ld(void *buffers[], int i)
  376. {
  377. return STARPU_MATRIX_GET_LD(buffers[i]);
  378. }
  379. int fstarpu_matrix_get_nx(void *buffers[], int i)
  380. {
  381. return STARPU_MATRIX_GET_NX(buffers[i]);
  382. }
  383. int fstarpu_matrix_get_ny(void *buffers[], int i)
  384. {
  385. return STARPU_MATRIX_GET_NY(buffers[i]);
  386. }
  387. void * fstarpu_block_get_ptr(void *buffers[], int i)
  388. {
  389. return (void *)STARPU_BLOCK_GET_PTR(buffers[i]);
  390. }
  391. int fstarpu_block_get_ldy(void *buffers[], int i)
  392. {
  393. return STARPU_BLOCK_GET_LDY(buffers[i]);
  394. }
  395. int fstarpu_block_get_ldz(void *buffers[], int i)
  396. {
  397. return STARPU_BLOCK_GET_LDZ(buffers[i]);
  398. }
  399. int fstarpu_block_get_nx(void *buffers[], int i)
  400. {
  401. return STARPU_BLOCK_GET_NX(buffers[i]);
  402. }
  403. int fstarpu_block_get_ny(void *buffers[], int i)
  404. {
  405. return STARPU_BLOCK_GET_NY(buffers[i]);
  406. }
  407. int fstarpu_block_get_nz(void *buffers[], int i)
  408. {
  409. return STARPU_BLOCK_GET_NZ(buffers[i]);
  410. }
  411. void fstarpu_data_acquire(starpu_data_handle_t handle, intptr_t mode)
  412. {
  413. STARPU_ASSERT(mode == fstarpu_r || mode == fstarpu_w || mode == fstarpu_rw);
  414. starpu_data_acquire(handle, (int)mode);
  415. }
  416. void fstarpu_unpack_arg(char *cl_arg, void ***_buffer_list)
  417. {
  418. void **buffer_list = *_buffer_list;
  419. size_t current_arg_offset = 0;
  420. int nargs, arg;
  421. /* We fill the different pointers with the appropriate arguments */
  422. memcpy(&nargs, cl_arg, sizeof(nargs));
  423. current_arg_offset += sizeof(nargs);
  424. for (arg = 0; arg < nargs; arg++)
  425. {
  426. void *argptr = buffer_list[arg];
  427. /* If not reading all cl_args */
  428. if(argptr == NULL)
  429. break;
  430. size_t arg_size;
  431. memcpy(&arg_size, cl_arg+current_arg_offset, sizeof(arg_size));
  432. current_arg_offset += sizeof(arg_size);
  433. memcpy(argptr, cl_arg+current_arg_offset, arg_size);
  434. current_arg_offset += arg_size;
  435. }
  436. free(cl_arg);
  437. }
  438. void fstarpu_sched_ctx_display_workers(int ctx)
  439. {
  440. starpu_sched_ctx_display_workers((unsigned)ctx, stderr);
  441. }
  442. intptr_t fstarpu_worker_get_type(int workerid)
  443. {
  444. return (intptr_t)starpu_worker_get_type(workerid);
  445. }
  446. int fstarpu_worker_get_count_by_type(intptr_t type)
  447. {
  448. return starpu_worker_get_count_by_type((enum starpu_worker_archtype)type);
  449. }
  450. unsigned fstarpu_worker_get_ids_by_type(intptr_t type, int *workerids, unsigned maxsize)
  451. {
  452. return starpu_worker_get_ids_by_type((enum starpu_worker_archtype)type, workerids, maxsize);
  453. }
  454. int fstarpu_worker_get_by_type(intptr_t type, int num)
  455. {
  456. return starpu_worker_get_by_type((enum starpu_worker_archtype)type, num);
  457. }
  458. int fstarpu_worker_get_by_devid(intptr_t type, int devid)
  459. {
  460. return starpu_worker_get_by_type((enum starpu_worker_archtype)type, devid);
  461. }
  462. void fstarpu_worker_get_type_as_string(intptr_t type, char *dst, size_t maxlen)
  463. {
  464. const char *str = starpu_worker_get_type_as_string((enum starpu_worker_archtype)type);
  465. snprintf(dst, maxlen, "%s", str);
  466. }
  467. struct starpu_data_handle *fstarpu_data_handle_array_alloc(int nb)
  468. {
  469. void *ptr;
  470. _STARPU_CALLOC(ptr, (size_t)nb, sizeof(starpu_data_handle_t));
  471. return ptr;
  472. }
  473. void fstarpu_data_handle_array_free(starpu_data_handle_t *handles)
  474. {
  475. free(handles);
  476. }
  477. void fstarpu_data_handle_array_set(starpu_data_handle_t *handles, int i, starpu_data_handle_t handle)
  478. {
  479. handles[i] = handle;
  480. }
  481. struct starpu_data_descr *fstarpu_data_descr_array_alloc(int nb)
  482. {
  483. void *ptr;
  484. _STARPU_CALLOC(ptr, (size_t)nb, sizeof(struct starpu_data_descr));
  485. return ptr;
  486. }
  487. struct starpu_data_descr *fstarpu_data_descr_alloc(void)
  488. {
  489. return fstarpu_data_descr_array_alloc(1);
  490. }
  491. void fstarpu_data_descr_array_free(struct starpu_data_descr *descrs)
  492. {
  493. free(descrs);
  494. }
  495. void fstarpu_data_descr_free(struct starpu_data_descr *descr)
  496. {
  497. fstarpu_data_descr_array_free(descr);
  498. }
  499. void fstarpu_data_descr_array_set(struct starpu_data_descr *descrs, int i, starpu_data_handle_t handle, intptr_t mode)
  500. {
  501. descrs[i].handle = handle;
  502. descrs[i].mode = (enum starpu_data_access_mode)mode;
  503. }
  504. void fstarpu_data_descr_set(struct starpu_data_descr *descr, starpu_data_handle_t handle, intptr_t mode)
  505. {
  506. fstarpu_data_descr_array_set(descr, 1, handle, mode);
  507. }
  508. struct starpu_data_filter *fstarpu_data_filter_allocate(void)
  509. {
  510. struct starpu_data_filter *filter;
  511. _STARPU_CALLOC(filter, 1, sizeof(*filter));
  512. return filter;
  513. }
  514. /* Note: use fstarpu_df_alloc_ prefix instead of fstarpu_data_filter_allocate_ to fit within the
  515. * Fortran id length limit */
  516. #define _FSTARPU_DATA_FILTER_ALLOCATOR(name) \
  517. struct starpu_data_filter *fstarpu_df_alloc_##name(void) \
  518. { \
  519. struct starpu_data_filter *filter = fstarpu_data_filter_allocate(); \
  520. filter->filter_func = starpu_##name; \
  521. return filter; \
  522. }
  523. _FSTARPU_DATA_FILTER_ALLOCATOR(bcsr_filter_canonical_block);
  524. _FSTARPU_DATA_FILTER_ALLOCATOR(csr_filter_vertical_block);
  525. _FSTARPU_DATA_FILTER_ALLOCATOR(matrix_filter_block);
  526. _FSTARPU_DATA_FILTER_ALLOCATOR(matrix_filter_block_shadow);
  527. _FSTARPU_DATA_FILTER_ALLOCATOR(matrix_filter_vertical_block);
  528. _FSTARPU_DATA_FILTER_ALLOCATOR(matrix_filter_vertical_block_shadow);
  529. _FSTARPU_DATA_FILTER_ALLOCATOR(vector_filter_block);
  530. _FSTARPU_DATA_FILTER_ALLOCATOR(vector_filter_block_shadow);
  531. _FSTARPU_DATA_FILTER_ALLOCATOR(vector_filter_list);
  532. _FSTARPU_DATA_FILTER_ALLOCATOR(vector_filter_divide_in_2);
  533. _FSTARPU_DATA_FILTER_ALLOCATOR(block_filter_block);
  534. _FSTARPU_DATA_FILTER_ALLOCATOR(block_filter_block_shadow);
  535. _FSTARPU_DATA_FILTER_ALLOCATOR(block_filter_vertical_block);
  536. _FSTARPU_DATA_FILTER_ALLOCATOR(block_filter_vertical_block_shadow);
  537. #undef _FSTARPU_DATA_FILTER_ALLOCATOR
  538. void fstarpu_data_filter_free(struct starpu_data_filter *filter) {
  539. memset(filter, 0, sizeof(*filter));
  540. free(filter);
  541. }
  542. void fstarpu_data_filter_set_filter_func(struct starpu_data_filter *filter, void *f_ptr)
  543. {
  544. STARPU_ASSERT(f_ptr != NULL);
  545. filter->filter_func = f_ptr;
  546. }
  547. void fstarpu_data_filter_set_nchildren(struct starpu_data_filter *filter, int nchildren)
  548. {
  549. STARPU_ASSERT(nchildren >= 0);
  550. filter->nchildren = nchildren;
  551. }
  552. void fstarpu_data_filter_set_get_nchildren_func(struct starpu_data_filter *filter, void *f_ptr)
  553. {
  554. filter->get_nchildren = f_ptr;
  555. }
  556. void fstarpu_data_filter_set_get_child_ops_func(struct starpu_data_filter *filter, void *f_ptr)
  557. {
  558. filter->get_child_ops = f_ptr;
  559. }
  560. void fstarpu_data_filter_set_filter_arg(struct starpu_data_filter *filter, int filter_arg)
  561. {
  562. STARPU_ASSERT(filter_arg >= 0); /* starpu_data_filter.filter_arg is unsigned, but
  563. * Fortran does not support unsigned types */
  564. filter->filter_arg = (unsigned)filter_arg;
  565. }
  566. void fstarpu_data_filter_set_filter_arg_ptr(struct starpu_data_filter *filter, void *filter_arg_ptr)
  567. {
  568. filter->filter_arg_ptr = filter_arg_ptr;
  569. }